| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 5159, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.0067842605156037995, |
| "grad_norm": 11.89448977442727, |
| "learning_rate": 3.1007751937984497e-07, |
| "loss": 0.7467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.753227710723877, |
| "step": 5, |
| "valid_targets_mean": 2444.9, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 0.013568521031207599, |
| "grad_norm": 11.235151503546374, |
| "learning_rate": 6.976744186046513e-07, |
| "loss": 0.7355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7996399998664856, |
| "step": 10, |
| "valid_targets_mean": 2697.8, |
| "valid_targets_min": 1231 |
| }, |
| { |
| "epoch": 0.0203527815468114, |
| "grad_norm": 10.797290846276908, |
| "learning_rate": 1.0852713178294575e-06, |
| "loss": 0.7424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7481732368469238, |
| "step": 15, |
| "valid_targets_mean": 2544.7, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 0.027137042062415198, |
| "grad_norm": 8.962671209264652, |
| "learning_rate": 1.4728682170542638e-06, |
| "loss": 0.721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.750222384929657, |
| "step": 20, |
| "valid_targets_mean": 2245.1, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 0.033921302578018994, |
| "grad_norm": 5.830676916492257, |
| "learning_rate": 1.86046511627907e-06, |
| "loss": 0.7025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6887879371643066, |
| "step": 25, |
| "valid_targets_mean": 3070.0, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 0.0407055630936228, |
| "grad_norm": 4.8564311609396285, |
| "learning_rate": 2.2480620155038763e-06, |
| "loss": 0.6958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6251484155654907, |
| "step": 30, |
| "valid_targets_mean": 2736.8, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 0.04748982360922659, |
| "grad_norm": 3.646908378962616, |
| "learning_rate": 2.635658914728683e-06, |
| "loss": 0.6536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6334314942359924, |
| "step": 35, |
| "valid_targets_mean": 2762.1, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 0.054274084124830396, |
| "grad_norm": 2.9965745618812183, |
| "learning_rate": 3.0232558139534885e-06, |
| "loss": 0.612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6031469106674194, |
| "step": 40, |
| "valid_targets_mean": 2219.0, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 0.06105834464043419, |
| "grad_norm": 2.746946360828467, |
| "learning_rate": 3.4108527131782946e-06, |
| "loss": 0.5748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5974681973457336, |
| "step": 45, |
| "valid_targets_mean": 2428.1, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 0.06784260515603799, |
| "grad_norm": 1.5002667732002524, |
| "learning_rate": 3.798449612403101e-06, |
| "loss": 0.5401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.528899073600769, |
| "step": 50, |
| "valid_targets_mean": 2882.4, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 0.07462686567164178, |
| "grad_norm": 1.1607016531427559, |
| "learning_rate": 4.186046511627907e-06, |
| "loss": 0.5035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5087602734565735, |
| "step": 55, |
| "valid_targets_mean": 2938.0, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 0.0814111261872456, |
| "grad_norm": 0.9535068201891985, |
| "learning_rate": 4.573643410852713e-06, |
| "loss": 0.4885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4569432735443115, |
| "step": 60, |
| "valid_targets_mean": 2973.9, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 0.08819538670284939, |
| "grad_norm": 1.1135265052091592, |
| "learning_rate": 4.9612403100775195e-06, |
| "loss": 0.5046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5376325845718384, |
| "step": 65, |
| "valid_targets_mean": 2420.6, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 0.09497964721845319, |
| "grad_norm": 0.9604258885113336, |
| "learning_rate": 5.348837209302326e-06, |
| "loss": 0.4622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44064652919769287, |
| "step": 70, |
| "valid_targets_mean": 2443.4, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 0.10176390773405698, |
| "grad_norm": 0.7991192270229877, |
| "learning_rate": 5.736434108527133e-06, |
| "loss": 0.4649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4826815724372864, |
| "step": 75, |
| "valid_targets_mean": 3380.5, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 0.10854816824966079, |
| "grad_norm": 0.769158116469445, |
| "learning_rate": 6.124031007751938e-06, |
| "loss": 0.4427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44103240966796875, |
| "step": 80, |
| "valid_targets_mean": 3035.8, |
| "valid_targets_min": 1083 |
| }, |
| { |
| "epoch": 0.11533242876526459, |
| "grad_norm": 0.7875257411449904, |
| "learning_rate": 6.511627906976745e-06, |
| "loss": 0.4481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4029495120048523, |
| "step": 85, |
| "valid_targets_mean": 2706.4, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 0.12211668928086838, |
| "grad_norm": 0.8473139007291898, |
| "learning_rate": 6.899224806201551e-06, |
| "loss": 0.4384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45044875144958496, |
| "step": 90, |
| "valid_targets_mean": 2473.2, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 0.12890094979647218, |
| "grad_norm": 0.7757846680357573, |
| "learning_rate": 7.286821705426357e-06, |
| "loss": 0.4459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4469519853591919, |
| "step": 95, |
| "valid_targets_mean": 2856.1, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 0.13568521031207598, |
| "grad_norm": 0.8491234814195904, |
| "learning_rate": 7.674418604651164e-06, |
| "loss": 0.4352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.439635306596756, |
| "step": 100, |
| "valid_targets_mean": 2584.4, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 0.14246947082767977, |
| "grad_norm": 0.7130925742464007, |
| "learning_rate": 8.06201550387597e-06, |
| "loss": 0.4203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4034441113471985, |
| "step": 105, |
| "valid_targets_mean": 3170.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 0.14925373134328357, |
| "grad_norm": 0.8093168817770919, |
| "learning_rate": 8.449612403100775e-06, |
| "loss": 0.4547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4224606156349182, |
| "step": 110, |
| "valid_targets_mean": 2654.3, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 0.1560379918588874, |
| "grad_norm": 0.8309738324960866, |
| "learning_rate": 8.837209302325582e-06, |
| "loss": 0.4215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43095940351486206, |
| "step": 115, |
| "valid_targets_mean": 2718.1, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 0.1628222523744912, |
| "grad_norm": 0.793319858169495, |
| "learning_rate": 9.224806201550389e-06, |
| "loss": 0.4186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43605878949165344, |
| "step": 120, |
| "valid_targets_mean": 2385.8, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 0.16960651289009498, |
| "grad_norm": 1.0230399253622091, |
| "learning_rate": 9.612403100775196e-06, |
| "loss": 0.4211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3982701897621155, |
| "step": 125, |
| "valid_targets_mean": 1617.4, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 0.17639077340569878, |
| "grad_norm": 0.8209896026771017, |
| "learning_rate": 1e-05, |
| "loss": 0.4032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4078044891357422, |
| "step": 130, |
| "valid_targets_mean": 2368.6, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 0.18317503392130258, |
| "grad_norm": 0.7095946770161736, |
| "learning_rate": 1.0387596899224808e-05, |
| "loss": 0.414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3884209394454956, |
| "step": 135, |
| "valid_targets_mean": 2926.9, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 0.18995929443690637, |
| "grad_norm": 0.6958216140407364, |
| "learning_rate": 1.0775193798449613e-05, |
| "loss": 0.4256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37612026929855347, |
| "step": 140, |
| "valid_targets_mean": 3520.8, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 0.19674355495251017, |
| "grad_norm": 0.8291040584046291, |
| "learning_rate": 1.116279069767442e-05, |
| "loss": 0.4085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4283609986305237, |
| "step": 145, |
| "valid_targets_mean": 2811.3, |
| "valid_targets_min": 1326 |
| }, |
| { |
| "epoch": 0.20352781546811397, |
| "grad_norm": 0.8093278558733981, |
| "learning_rate": 1.1550387596899227e-05, |
| "loss": 0.4014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4302545189857483, |
| "step": 150, |
| "valid_targets_mean": 2660.5, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 0.21031207598371776, |
| "grad_norm": 0.7238386266854082, |
| "learning_rate": 1.193798449612403e-05, |
| "loss": 0.4173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37872761487960815, |
| "step": 155, |
| "valid_targets_mean": 2928.2, |
| "valid_targets_min": 1407 |
| }, |
| { |
| "epoch": 0.21709633649932158, |
| "grad_norm": 0.7853375198765415, |
| "learning_rate": 1.2325581395348838e-05, |
| "loss": 0.4018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40379324555397034, |
| "step": 160, |
| "valid_targets_mean": 2898.9, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 0.22388059701492538, |
| "grad_norm": 0.7686517468969368, |
| "learning_rate": 1.2713178294573645e-05, |
| "loss": 0.4011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4392387270927429, |
| "step": 165, |
| "valid_targets_mean": 2946.6, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 0.23066485753052918, |
| "grad_norm": 0.7993134466572939, |
| "learning_rate": 1.3100775193798451e-05, |
| "loss": 0.3991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41066741943359375, |
| "step": 170, |
| "valid_targets_mean": 2813.2, |
| "valid_targets_min": 1002 |
| }, |
| { |
| "epoch": 0.23744911804613297, |
| "grad_norm": 0.6677659446481017, |
| "learning_rate": 1.3488372093023257e-05, |
| "loss": 0.3902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3710253834724426, |
| "step": 175, |
| "valid_targets_mean": 3316.8, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 0.24423337856173677, |
| "grad_norm": 0.7909997170086058, |
| "learning_rate": 1.3875968992248064e-05, |
| "loss": 0.3856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41473937034606934, |
| "step": 180, |
| "valid_targets_mean": 2416.4, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 0.2510176390773406, |
| "grad_norm": 0.8792540068344556, |
| "learning_rate": 1.426356589147287e-05, |
| "loss": 0.3846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3967583477497101, |
| "step": 185, |
| "valid_targets_mean": 2736.9, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 0.25780189959294436, |
| "grad_norm": 0.7958264159408515, |
| "learning_rate": 1.4651162790697674e-05, |
| "loss": 0.4017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40616077184677124, |
| "step": 190, |
| "valid_targets_mean": 2568.8, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 0.2645861601085482, |
| "grad_norm": 0.7604022300459651, |
| "learning_rate": 1.5038759689922481e-05, |
| "loss": 0.3754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33513033390045166, |
| "step": 195, |
| "valid_targets_mean": 2750.9, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 0.27137042062415195, |
| "grad_norm": 0.8244610679195269, |
| "learning_rate": 1.542635658914729e-05, |
| "loss": 0.3939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38060298562049866, |
| "step": 200, |
| "valid_targets_mean": 2832.4, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 0.2781546811397558, |
| "grad_norm": 0.729183257219207, |
| "learning_rate": 1.5813953488372095e-05, |
| "loss": 0.3801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36861342191696167, |
| "step": 205, |
| "valid_targets_mean": 2902.9, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 0.28493894165535955, |
| "grad_norm": 0.8051272259035377, |
| "learning_rate": 1.62015503875969e-05, |
| "loss": 0.391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4003250300884247, |
| "step": 210, |
| "valid_targets_mean": 2374.9, |
| "valid_targets_min": 572 |
| }, |
| { |
| "epoch": 0.29172320217096337, |
| "grad_norm": 0.7887590950471755, |
| "learning_rate": 1.6589147286821706e-05, |
| "loss": 0.3754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3678756356239319, |
| "step": 215, |
| "valid_targets_mean": 3166.3, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 0.29850746268656714, |
| "grad_norm": 0.8029733763158426, |
| "learning_rate": 1.697674418604651e-05, |
| "loss": 0.3681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3723628520965576, |
| "step": 220, |
| "valid_targets_mean": 2474.6, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 0.30529172320217096, |
| "grad_norm": 0.7343226056865998, |
| "learning_rate": 1.736434108527132e-05, |
| "loss": 0.3632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38321518898010254, |
| "step": 225, |
| "valid_targets_mean": 3262.1, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 0.3120759837177748, |
| "grad_norm": 0.7607257346962287, |
| "learning_rate": 1.7751937984496125e-05, |
| "loss": 0.3715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34952956438064575, |
| "step": 230, |
| "valid_targets_mean": 2810.3, |
| "valid_targets_min": 1113 |
| }, |
| { |
| "epoch": 0.31886024423337855, |
| "grad_norm": 0.8227068076920964, |
| "learning_rate": 1.813953488372093e-05, |
| "loss": 0.3819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3929305970668793, |
| "step": 235, |
| "valid_targets_mean": 2834.8, |
| "valid_targets_min": 1701 |
| }, |
| { |
| "epoch": 0.3256445047489824, |
| "grad_norm": 0.6827841124705409, |
| "learning_rate": 1.852713178294574e-05, |
| "loss": 0.3618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3641515374183655, |
| "step": 240, |
| "valid_targets_mean": 3186.5, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 0.33242876526458615, |
| "grad_norm": 0.7602966954331676, |
| "learning_rate": 1.8914728682170544e-05, |
| "loss": 0.3751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3500159978866577, |
| "step": 245, |
| "valid_targets_mean": 2656.6, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 0.33921302578018997, |
| "grad_norm": 0.7668023931379694, |
| "learning_rate": 1.9302325581395353e-05, |
| "loss": 0.3739, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4043837785720825, |
| "step": 250, |
| "valid_targets_mean": 3122.2, |
| "valid_targets_min": 1390 |
| }, |
| { |
| "epoch": 0.34599728629579374, |
| "grad_norm": 0.7093670546464718, |
| "learning_rate": 1.9689922480620155e-05, |
| "loss": 0.3778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38684576749801636, |
| "step": 255, |
| "valid_targets_mean": 3311.2, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 0.35278154681139756, |
| "grad_norm": 0.6761466382547776, |
| "learning_rate": 2.0077519379844963e-05, |
| "loss": 0.3692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34655070304870605, |
| "step": 260, |
| "valid_targets_mean": 3112.8, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 0.35956580732700133, |
| "grad_norm": 0.6694834479453904, |
| "learning_rate": 2.046511627906977e-05, |
| "loss": 0.356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3410634398460388, |
| "step": 265, |
| "valid_targets_mean": 3315.6, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 0.36635006784260515, |
| "grad_norm": 0.8155424962452198, |
| "learning_rate": 2.0852713178294577e-05, |
| "loss": 0.3685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35310614109039307, |
| "step": 270, |
| "valid_targets_mean": 2339.4, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 0.373134328358209, |
| "grad_norm": 0.9070653857602943, |
| "learning_rate": 2.1240310077519383e-05, |
| "loss": 0.3449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3375753164291382, |
| "step": 275, |
| "valid_targets_mean": 3212.9, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 0.37991858887381275, |
| "grad_norm": 0.7447980160423101, |
| "learning_rate": 2.1627906976744188e-05, |
| "loss": 0.3549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3524802327156067, |
| "step": 280, |
| "valid_targets_mean": 2781.6, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 0.38670284938941657, |
| "grad_norm": 0.910428084386681, |
| "learning_rate": 2.2015503875968993e-05, |
| "loss": 0.3546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34246036410331726, |
| "step": 285, |
| "valid_targets_mean": 2999.9, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 0.39348710990502034, |
| "grad_norm": 0.6635427507067181, |
| "learning_rate": 2.2403100775193802e-05, |
| "loss": 0.3692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35911792516708374, |
| "step": 290, |
| "valid_targets_mean": 3345.4, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 0.40027137042062416, |
| "grad_norm": 0.8108891809655495, |
| "learning_rate": 2.2790697674418607e-05, |
| "loss": 0.3676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36157429218292236, |
| "step": 295, |
| "valid_targets_mean": 2752.9, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 0.40705563093622793, |
| "grad_norm": 0.7092963268541641, |
| "learning_rate": 2.3178294573643412e-05, |
| "loss": 0.357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3586769700050354, |
| "step": 300, |
| "valid_targets_mean": 3229.6, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 0.41383989145183175, |
| "grad_norm": 0.8313919502710964, |
| "learning_rate": 2.356589147286822e-05, |
| "loss": 0.369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40778008103370667, |
| "step": 305, |
| "valid_targets_mean": 3072.8, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 0.4206241519674355, |
| "grad_norm": 0.8521822829383703, |
| "learning_rate": 2.3953488372093023e-05, |
| "loss": 0.3571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38653799891471863, |
| "step": 310, |
| "valid_targets_mean": 2318.4, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 0.42740841248303935, |
| "grad_norm": 0.7709743279914623, |
| "learning_rate": 2.434108527131783e-05, |
| "loss": 0.3515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36175817251205444, |
| "step": 315, |
| "valid_targets_mean": 2692.5, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 0.43419267299864317, |
| "grad_norm": 0.7913741131309853, |
| "learning_rate": 2.4728682170542637e-05, |
| "loss": 0.3564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34055837988853455, |
| "step": 320, |
| "valid_targets_mean": 2549.1, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 0.44097693351424694, |
| "grad_norm": 0.7251245992538848, |
| "learning_rate": 2.5116279069767445e-05, |
| "loss": 0.3424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3071543574333191, |
| "step": 325, |
| "valid_targets_mean": 2746.8, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 0.44776119402985076, |
| "grad_norm": 0.877109135791174, |
| "learning_rate": 2.550387596899225e-05, |
| "loss": 0.3515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3644331395626068, |
| "step": 330, |
| "valid_targets_mean": 2258.4, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 0.45454545454545453, |
| "grad_norm": 0.7463994697165139, |
| "learning_rate": 2.589147286821706e-05, |
| "loss": 0.3452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3452218770980835, |
| "step": 335, |
| "valid_targets_mean": 2618.1, |
| "valid_targets_min": 1032 |
| }, |
| { |
| "epoch": 0.46132971506105835, |
| "grad_norm": 0.826153332286381, |
| "learning_rate": 2.627906976744186e-05, |
| "loss": 0.3557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3592166006565094, |
| "step": 340, |
| "valid_targets_mean": 2649.8, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 0.4681139755766621, |
| "grad_norm": 0.7556466009720993, |
| "learning_rate": 2.6666666666666667e-05, |
| "loss": 0.3796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4219163656234741, |
| "step": 345, |
| "valid_targets_mean": 2855.0, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 0.47489823609226595, |
| "grad_norm": 0.7276710198296943, |
| "learning_rate": 2.7054263565891475e-05, |
| "loss": 0.3541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.333509236574173, |
| "step": 350, |
| "valid_targets_mean": 2856.6, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 0.4816824966078697, |
| "grad_norm": 0.8103248615360679, |
| "learning_rate": 2.744186046511628e-05, |
| "loss": 0.3502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3477519452571869, |
| "step": 355, |
| "valid_targets_mean": 2232.4, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 0.48846675712347354, |
| "grad_norm": 0.9073845669791214, |
| "learning_rate": 2.782945736434109e-05, |
| "loss": 0.3475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36534401774406433, |
| "step": 360, |
| "valid_targets_mean": 2373.4, |
| "valid_targets_min": 1054 |
| }, |
| { |
| "epoch": 0.49525101763907736, |
| "grad_norm": 0.8050927376280175, |
| "learning_rate": 2.8217054263565894e-05, |
| "loss": 0.3677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3501133620738983, |
| "step": 365, |
| "valid_targets_mean": 2434.8, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 0.5020352781546812, |
| "grad_norm": 0.7660020717643617, |
| "learning_rate": 2.8604651162790703e-05, |
| "loss": 0.3492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3313218355178833, |
| "step": 370, |
| "valid_targets_mean": 2836.5, |
| "valid_targets_min": 1353 |
| }, |
| { |
| "epoch": 0.508819538670285, |
| "grad_norm": 0.7443344419339243, |
| "learning_rate": 2.8992248062015505e-05, |
| "loss": 0.3423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33690541982650757, |
| "step": 375, |
| "valid_targets_mean": 2837.2, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 0.5156037991858887, |
| "grad_norm": 0.779004361301433, |
| "learning_rate": 2.937984496124031e-05, |
| "loss": 0.3473, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34115269780158997, |
| "step": 380, |
| "valid_targets_mean": 2826.7, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 0.5223880597014925, |
| "grad_norm": 0.9341133562668817, |
| "learning_rate": 2.976744186046512e-05, |
| "loss": 0.3386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3078441023826599, |
| "step": 385, |
| "valid_targets_mean": 1897.9, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 0.5291723202170964, |
| "grad_norm": 0.9049226382408442, |
| "learning_rate": 3.0155038759689924e-05, |
| "loss": 0.3555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34988129138946533, |
| "step": 390, |
| "valid_targets_mean": 3014.6, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 0.5359565807327001, |
| "grad_norm": 0.8125257555203335, |
| "learning_rate": 3.054263565891473e-05, |
| "loss": 0.3505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3929121792316437, |
| "step": 395, |
| "valid_targets_mean": 2705.0, |
| "valid_targets_min": 1179 |
| }, |
| { |
| "epoch": 0.5427408412483039, |
| "grad_norm": 0.7384330929303173, |
| "learning_rate": 3.093023255813954e-05, |
| "loss": 0.324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30182796716690063, |
| "step": 400, |
| "valid_targets_mean": 3520.5, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 0.5495251017639078, |
| "grad_norm": 0.9344307339860809, |
| "learning_rate": 3.1317829457364343e-05, |
| "loss": 0.3489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37407636642456055, |
| "step": 405, |
| "valid_targets_mean": 2585.3, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 0.5563093622795116, |
| "grad_norm": 0.706765156270403, |
| "learning_rate": 3.170542635658915e-05, |
| "loss": 0.3633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3846889138221741, |
| "step": 410, |
| "valid_targets_mean": 3670.8, |
| "valid_targets_min": 1083 |
| }, |
| { |
| "epoch": 0.5630936227951153, |
| "grad_norm": 0.7091546038528599, |
| "learning_rate": 3.2093023255813954e-05, |
| "loss": 0.3388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2954094111919403, |
| "step": 415, |
| "valid_targets_mean": 2686.8, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 0.5698778833107191, |
| "grad_norm": 0.720646680324316, |
| "learning_rate": 3.248062015503876e-05, |
| "loss": 0.359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36445194482803345, |
| "step": 420, |
| "valid_targets_mean": 3180.9, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 0.576662143826323, |
| "grad_norm": 0.7561273241851728, |
| "learning_rate": 3.286821705426357e-05, |
| "loss": 0.3382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.330274760723114, |
| "step": 425, |
| "valid_targets_mean": 2636.8, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 0.5834464043419267, |
| "grad_norm": 0.8694755557547249, |
| "learning_rate": 3.3255813953488377e-05, |
| "loss": 0.3452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3319804072380066, |
| "step": 430, |
| "valid_targets_mean": 2225.6, |
| "valid_targets_min": 1286 |
| }, |
| { |
| "epoch": 0.5902306648575305, |
| "grad_norm": 0.68772821314539, |
| "learning_rate": 3.364341085271318e-05, |
| "loss": 0.3435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33189690113067627, |
| "step": 435, |
| "valid_targets_mean": 3022.4, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 0.5970149253731343, |
| "grad_norm": 0.9588382883930207, |
| "learning_rate": 3.403100775193799e-05, |
| "loss": 0.3443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3494105339050293, |
| "step": 440, |
| "valid_targets_mean": 2476.9, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 0.6037991858887382, |
| "grad_norm": 0.7838789395466246, |
| "learning_rate": 3.441860465116279e-05, |
| "loss": 0.3446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32996422052383423, |
| "step": 445, |
| "valid_targets_mean": 2342.1, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 0.6105834464043419, |
| "grad_norm": 0.7416365052685329, |
| "learning_rate": 3.48062015503876e-05, |
| "loss": 0.3324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3227633237838745, |
| "step": 450, |
| "valid_targets_mean": 3124.1, |
| "valid_targets_min": 1365 |
| }, |
| { |
| "epoch": 0.6173677069199457, |
| "grad_norm": 0.6258235950313648, |
| "learning_rate": 3.51937984496124e-05, |
| "loss": 0.3313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29047924280166626, |
| "step": 455, |
| "valid_targets_mean": 3342.6, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 0.6241519674355496, |
| "grad_norm": 0.6880630346475627, |
| "learning_rate": 3.5581395348837215e-05, |
| "loss": 0.3664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.352108359336853, |
| "step": 460, |
| "valid_targets_mean": 3073.2, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 0.6309362279511533, |
| "grad_norm": 0.7002916188745265, |
| "learning_rate": 3.596899224806202e-05, |
| "loss": 0.3412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33518415689468384, |
| "step": 465, |
| "valid_targets_mean": 2779.1, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 0.6377204884667571, |
| "grad_norm": 0.7760406431300181, |
| "learning_rate": 3.6356589147286826e-05, |
| "loss": 0.3503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32304704189300537, |
| "step": 470, |
| "valid_targets_mean": 2418.1, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 0.6445047489823609, |
| "grad_norm": 0.81128665595444, |
| "learning_rate": 3.674418604651163e-05, |
| "loss": 0.3423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35187655687332153, |
| "step": 475, |
| "valid_targets_mean": 2206.1, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 0.6512890094979648, |
| "grad_norm": 0.6699530012511279, |
| "learning_rate": 3.7131782945736436e-05, |
| "loss": 0.3289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30837348103523254, |
| "step": 480, |
| "valid_targets_mean": 3204.2, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 0.6580732700135685, |
| "grad_norm": 0.8161088245962455, |
| "learning_rate": 3.751937984496124e-05, |
| "loss": 0.341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3431815803050995, |
| "step": 485, |
| "valid_targets_mean": 2313.1, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 0.6648575305291723, |
| "grad_norm": 0.6636433541876118, |
| "learning_rate": 3.7906976744186053e-05, |
| "loss": 0.3527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3255542516708374, |
| "step": 490, |
| "valid_targets_mean": 3133.2, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 0.6716417910447762, |
| "grad_norm": 0.7193982612960406, |
| "learning_rate": 3.829457364341086e-05, |
| "loss": 0.3413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3598499894142151, |
| "step": 495, |
| "valid_targets_mean": 2609.6, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 0.6784260515603799, |
| "grad_norm": 0.7893940888720667, |
| "learning_rate": 3.8682170542635664e-05, |
| "loss": 0.3461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3467223644256592, |
| "step": 500, |
| "valid_targets_mean": 2836.8, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 0.6852103120759837, |
| "grad_norm": 0.7057772565861374, |
| "learning_rate": 3.906976744186047e-05, |
| "loss": 0.3299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3372578024864197, |
| "step": 505, |
| "valid_targets_mean": 2930.9, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 0.6919945725915875, |
| "grad_norm": 0.6963494863151088, |
| "learning_rate": 3.9457364341085275e-05, |
| "loss": 0.3462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3436594605445862, |
| "step": 510, |
| "valid_targets_mean": 3018.2, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 0.6987788331071914, |
| "grad_norm": 0.7394424529088445, |
| "learning_rate": 3.984496124031008e-05, |
| "loss": 0.3466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3247559666633606, |
| "step": 515, |
| "valid_targets_mean": 2679.7, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 0.7055630936227951, |
| "grad_norm": 0.6838375834791657, |
| "learning_rate": 3.9999958795491475e-05, |
| "loss": 0.3409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3312002420425415, |
| "step": 520, |
| "valid_targets_mean": 3034.2, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 0.7123473541383989, |
| "grad_norm": 0.6067455993466966, |
| "learning_rate": 3.999970699077645e-05, |
| "loss": 0.3146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3216730058193207, |
| "step": 525, |
| "valid_targets_mean": 3705.9, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 0.7191316146540027, |
| "grad_norm": 0.6985270320464033, |
| "learning_rate": 3.9999226275618605e-05, |
| "loss": 0.3366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33391982316970825, |
| "step": 530, |
| "valid_targets_mean": 2748.6, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 0.7259158751696065, |
| "grad_norm": 0.7662978798224946, |
| "learning_rate": 3.9998516655520055e-05, |
| "loss": 0.3397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3417017459869385, |
| "step": 535, |
| "valid_targets_mean": 2394.5, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 0.7327001356852103, |
| "grad_norm": 0.669919043363021, |
| "learning_rate": 3.999757813860289e-05, |
| "loss": 0.336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31267890334129333, |
| "step": 540, |
| "valid_targets_mean": 3009.2, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 0.7394843962008141, |
| "grad_norm": 0.7274166571678258, |
| "learning_rate": 3.999641073560909e-05, |
| "loss": 0.3236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31356334686279297, |
| "step": 545, |
| "valid_targets_mean": 2435.3, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 0.746268656716418, |
| "grad_norm": 0.7210784987955194, |
| "learning_rate": 3.999501445990039e-05, |
| "loss": 0.3518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.358939528465271, |
| "step": 550, |
| "valid_targets_mean": 2823.4, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 0.7530529172320217, |
| "grad_norm": 0.7953791505748733, |
| "learning_rate": 3.9993389327458125e-05, |
| "loss": 0.3391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3532836139202118, |
| "step": 555, |
| "valid_targets_mean": 2465.7, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 0.7598371777476255, |
| "grad_norm": 0.8035999831102332, |
| "learning_rate": 3.9991535356883055e-05, |
| "loss": 0.3176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3166276812553406, |
| "step": 560, |
| "valid_targets_mean": 2324.9, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 0.7666214382632293, |
| "grad_norm": 0.8057221319350136, |
| "learning_rate": 3.9989452569395154e-05, |
| "loss": 0.3283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37396541237831116, |
| "step": 565, |
| "valid_targets_mean": 2373.8, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 0.7734056987788331, |
| "grad_norm": 0.8130298785771777, |
| "learning_rate": 3.9987140988833355e-05, |
| "loss": 0.3452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32148557901382446, |
| "step": 570, |
| "valid_targets_mean": 2525.6, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 0.7801899592944369, |
| "grad_norm": 0.7048055789019534, |
| "learning_rate": 3.9984600641655305e-05, |
| "loss": 0.334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3230056166648865, |
| "step": 575, |
| "valid_targets_mean": 2960.2, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 0.7869742198100407, |
| "grad_norm": 0.7505005839634938, |
| "learning_rate": 3.998183155693702e-05, |
| "loss": 0.3561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36198025941848755, |
| "step": 580, |
| "valid_targets_mean": 2640.8, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 0.7937584803256446, |
| "grad_norm": 0.5953296109502596, |
| "learning_rate": 3.997883376637258e-05, |
| "loss": 0.3336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35237035155296326, |
| "step": 585, |
| "valid_targets_mean": 4056.9, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 0.8005427408412483, |
| "grad_norm": 0.6965335680749082, |
| "learning_rate": 3.997560730427379e-05, |
| "loss": 0.3361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.349098265171051, |
| "step": 590, |
| "valid_targets_mean": 2842.4, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 0.8073270013568521, |
| "grad_norm": 0.8417459794727778, |
| "learning_rate": 3.99721522075697e-05, |
| "loss": 0.3176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3189961016178131, |
| "step": 595, |
| "valid_targets_mean": 2172.4, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 0.8141112618724559, |
| "grad_norm": 0.8232217865179002, |
| "learning_rate": 3.99684685158063e-05, |
| "loss": 0.3363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35521090030670166, |
| "step": 600, |
| "valid_targets_mean": 3057.4, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 0.8208955223880597, |
| "grad_norm": 0.6415450067556615, |
| "learning_rate": 3.996455627114598e-05, |
| "loss": 0.3267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30212873220443726, |
| "step": 605, |
| "valid_targets_mean": 3003.2, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 0.8276797829036635, |
| "grad_norm": 0.7030806565946134, |
| "learning_rate": 3.996041551836707e-05, |
| "loss": 0.3382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34246373176574707, |
| "step": 610, |
| "valid_targets_mean": 2909.0, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 0.8344640434192673, |
| "grad_norm": 0.6504343613445783, |
| "learning_rate": 3.9956046304863354e-05, |
| "loss": 0.3362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3366634249687195, |
| "step": 615, |
| "valid_targets_mean": 3280.8, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 0.841248303934871, |
| "grad_norm": 0.8323739984409763, |
| "learning_rate": 3.9951448680643485e-05, |
| "loss": 0.326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31927552819252014, |
| "step": 620, |
| "valid_targets_mean": 2005.1, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 0.8480325644504749, |
| "grad_norm": 0.7434853063494745, |
| "learning_rate": 3.994662269833044e-05, |
| "loss": 0.3414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33908501267433167, |
| "step": 625, |
| "valid_targets_mean": 2536.9, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 0.8548168249660787, |
| "grad_norm": 0.6740114975827273, |
| "learning_rate": 3.994156841316093e-05, |
| "loss": 0.322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3202781677246094, |
| "step": 630, |
| "valid_targets_mean": 2874.8, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 0.8616010854816825, |
| "grad_norm": 0.7855713565247058, |
| "learning_rate": 3.9936285882984723e-05, |
| "loss": 0.3335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34169870615005493, |
| "step": 635, |
| "valid_targets_mean": 2232.2, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 0.8683853459972863, |
| "grad_norm": 0.6561553473826617, |
| "learning_rate": 3.993077516826403e-05, |
| "loss": 0.3374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3322102427482605, |
| "step": 640, |
| "valid_targets_mean": 2907.2, |
| "valid_targets_min": 805 |
| }, |
| { |
| "epoch": 0.8751696065128901, |
| "grad_norm": 0.7829492620549515, |
| "learning_rate": 3.9925036332072775e-05, |
| "loss": 0.3253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32236772775650024, |
| "step": 645, |
| "valid_targets_mean": 2319.2, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 0.8819538670284939, |
| "grad_norm": 0.7216603888066516, |
| "learning_rate": 3.99190694400959e-05, |
| "loss": 0.3162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35016581416130066, |
| "step": 650, |
| "valid_targets_mean": 2640.7, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 0.8887381275440976, |
| "grad_norm": 0.6378166749356016, |
| "learning_rate": 3.991287456062861e-05, |
| "loss": 0.3396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34149160981178284, |
| "step": 655, |
| "valid_targets_mean": 3447.8, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 0.8955223880597015, |
| "grad_norm": 0.7082789982684017, |
| "learning_rate": 3.9906451764575544e-05, |
| "loss": 0.3388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.348561555147171, |
| "step": 660, |
| "valid_targets_mean": 2913.9, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 0.9023066485753053, |
| "grad_norm": 0.7353124573695241, |
| "learning_rate": 3.989980112545007e-05, |
| "loss": 0.315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3169977068901062, |
| "step": 665, |
| "valid_targets_mean": 2372.2, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 0.9090909090909091, |
| "grad_norm": 0.6779717293015843, |
| "learning_rate": 3.989292271937332e-05, |
| "loss": 0.3354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3415604531764984, |
| "step": 670, |
| "valid_targets_mean": 3224.8, |
| "valid_targets_min": 1172 |
| }, |
| { |
| "epoch": 0.9158751696065129, |
| "grad_norm": 0.6802704573331115, |
| "learning_rate": 3.988581662507339e-05, |
| "loss": 0.3256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3390202820301056, |
| "step": 675, |
| "valid_targets_mean": 2996.1, |
| "valid_targets_min": 464 |
| }, |
| { |
| "epoch": 0.9226594301221167, |
| "grad_norm": 0.7137326701115103, |
| "learning_rate": 3.987848292388445e-05, |
| "loss": 0.3156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3149383068084717, |
| "step": 680, |
| "valid_targets_mean": 2476.1, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 0.9294436906377205, |
| "grad_norm": 0.7976853977114939, |
| "learning_rate": 3.987092169974576e-05, |
| "loss": 0.3385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34196972846984863, |
| "step": 685, |
| "valid_targets_mean": 2134.6, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 0.9362279511533242, |
| "grad_norm": 0.7571960144185641, |
| "learning_rate": 3.986313303920074e-05, |
| "loss": 0.3058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31737232208251953, |
| "step": 690, |
| "valid_targets_mean": 2642.4, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 0.9430122116689281, |
| "grad_norm": 0.7686352923550949, |
| "learning_rate": 3.985511703139599e-05, |
| "loss": 0.3108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30339232087135315, |
| "step": 695, |
| "valid_targets_mean": 2095.3, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 0.9497964721845319, |
| "grad_norm": 0.6986874211530488, |
| "learning_rate": 3.984687376808025e-05, |
| "loss": 0.3319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34129583835601807, |
| "step": 700, |
| "valid_targets_mean": 2803.9, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 0.9565807327001357, |
| "grad_norm": 0.7610343107451978, |
| "learning_rate": 3.983840334360336e-05, |
| "loss": 0.3358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33215272426605225, |
| "step": 705, |
| "valid_targets_mean": 2625.3, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 0.9633649932157394, |
| "grad_norm": 0.6276014942943633, |
| "learning_rate": 3.982970585491516e-05, |
| "loss": 0.3281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3128705620765686, |
| "step": 710, |
| "valid_targets_mean": 3215.4, |
| "valid_targets_min": 1391 |
| }, |
| { |
| "epoch": 0.9701492537313433, |
| "grad_norm": 0.6798894086802646, |
| "learning_rate": 3.982078140156441e-05, |
| "loss": 0.3062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2989204525947571, |
| "step": 715, |
| "valid_targets_mean": 2666.4, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 0.9769335142469471, |
| "grad_norm": 0.7410349510063327, |
| "learning_rate": 3.981163008569764e-05, |
| "loss": 0.3355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31131139397621155, |
| "step": 720, |
| "valid_targets_mean": 3063.8, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 0.9837177747625508, |
| "grad_norm": 0.6643176359530586, |
| "learning_rate": 3.9802252012057974e-05, |
| "loss": 0.3363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3558084964752197, |
| "step": 725, |
| "valid_targets_mean": 3521.2, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 0.9905020352781547, |
| "grad_norm": 0.7267283614828455, |
| "learning_rate": 3.979264728798392e-05, |
| "loss": 0.3334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3494442105293274, |
| "step": 730, |
| "valid_targets_mean": 2547.4, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 0.9972862957937585, |
| "grad_norm": 0.6814846127090516, |
| "learning_rate": 3.9782816023408194e-05, |
| "loss": 0.3327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3272936940193176, |
| "step": 735, |
| "valid_targets_mean": 2686.4, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 1.0040705563093624, |
| "grad_norm": 0.6861216126300802, |
| "learning_rate": 3.977275833085638e-05, |
| "loss": 0.302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31268030405044556, |
| "step": 740, |
| "valid_targets_mean": 2643.2, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 1.010854816824966, |
| "grad_norm": 0.6898996438799597, |
| "learning_rate": 3.976247432544571e-05, |
| "loss": 0.283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2911531925201416, |
| "step": 745, |
| "valid_targets_mean": 2797.4, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 1.01763907734057, |
| "grad_norm": 0.8254261194413537, |
| "learning_rate": 3.9751964124883735e-05, |
| "loss": 0.3147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3192952275276184, |
| "step": 750, |
| "valid_targets_mean": 2253.1, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 1.0244233378561738, |
| "grad_norm": 0.7754318957680647, |
| "learning_rate": 3.974122784946694e-05, |
| "loss": 0.2937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27857261896133423, |
| "step": 755, |
| "valid_targets_mean": 2432.6, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 1.0312075983717774, |
| "grad_norm": 0.7881514631070836, |
| "learning_rate": 3.97302656220794e-05, |
| "loss": 0.3074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.320145845413208, |
| "step": 760, |
| "valid_targets_mean": 2445.4, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 1.0379918588873813, |
| "grad_norm": 0.6506473704894072, |
| "learning_rate": 3.9719077568191376e-05, |
| "loss": 0.2972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28449857234954834, |
| "step": 765, |
| "valid_targets_mean": 3023.9, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 1.044776119402985, |
| "grad_norm": 0.8042677555990032, |
| "learning_rate": 3.970766381585786e-05, |
| "loss": 0.2826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26466116309165955, |
| "step": 770, |
| "valid_targets_mean": 2212.1, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 1.0515603799185889, |
| "grad_norm": 0.676421887365203, |
| "learning_rate": 3.969602449571712e-05, |
| "loss": 0.2962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29949331283569336, |
| "step": 775, |
| "valid_targets_mean": 3120.0, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 1.0583446404341927, |
| "grad_norm": 0.7474747697048539, |
| "learning_rate": 3.96841597409892e-05, |
| "loss": 0.3093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30292749404907227, |
| "step": 780, |
| "valid_targets_mean": 2577.1, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 1.0651289009497964, |
| "grad_norm": 0.7960660690648608, |
| "learning_rate": 3.9672069687474415e-05, |
| "loss": 0.2917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28914356231689453, |
| "step": 785, |
| "valid_targets_mean": 2216.7, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 1.0719131614654003, |
| "grad_norm": 0.6763388576498762, |
| "learning_rate": 3.965975447355176e-05, |
| "loss": 0.3005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30142050981521606, |
| "step": 790, |
| "valid_targets_mean": 2811.3, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 1.0786974219810042, |
| "grad_norm": 0.8330584303910075, |
| "learning_rate": 3.964721424017735e-05, |
| "loss": 0.3027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.303778737783432, |
| "step": 795, |
| "valid_targets_mean": 2451.8, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 1.0854816824966078, |
| "grad_norm": 0.7262140518757996, |
| "learning_rate": 3.963444913088281e-05, |
| "loss": 0.2993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3419913649559021, |
| "step": 800, |
| "valid_targets_mean": 3062.5, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 1.0922659430122117, |
| "grad_norm": 0.701846588477317, |
| "learning_rate": 3.9621459291773626e-05, |
| "loss": 0.2948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3039608597755432, |
| "step": 805, |
| "valid_targets_mean": 2721.3, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 1.0990502035278156, |
| "grad_norm": 0.764825483304104, |
| "learning_rate": 3.960824487152746e-05, |
| "loss": 0.3129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3330846428871155, |
| "step": 810, |
| "valid_targets_mean": 2494.1, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 1.1058344640434192, |
| "grad_norm": 0.8702738985222226, |
| "learning_rate": 3.959480602139247e-05, |
| "loss": 0.2953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2918407917022705, |
| "step": 815, |
| "valid_targets_mean": 2434.2, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 1.112618724559023, |
| "grad_norm": 0.6076347441974812, |
| "learning_rate": 3.958114289518557e-05, |
| "loss": 0.2949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2711153030395508, |
| "step": 820, |
| "valid_targets_mean": 3189.2, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 1.1194029850746268, |
| "grad_norm": 0.6404883109837152, |
| "learning_rate": 3.956725564929066e-05, |
| "loss": 0.2885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2949562072753906, |
| "step": 825, |
| "valid_targets_mean": 3202.6, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 1.1261872455902306, |
| "grad_norm": 0.6942618107302919, |
| "learning_rate": 3.955314444265685e-05, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29515475034713745, |
| "step": 830, |
| "valid_targets_mean": 2622.8, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 1.1329715061058345, |
| "grad_norm": 0.7378195219174956, |
| "learning_rate": 3.9538809436796635e-05, |
| "loss": 0.3012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31367671489715576, |
| "step": 835, |
| "valid_targets_mean": 2731.7, |
| "valid_targets_min": 1299 |
| }, |
| { |
| "epoch": 1.1397557666214382, |
| "grad_norm": 0.7537202284076141, |
| "learning_rate": 3.952425079578405e-05, |
| "loss": 0.3048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3013504147529602, |
| "step": 840, |
| "valid_targets_mean": 2165.1, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 1.146540027137042, |
| "grad_norm": 0.7523754539948808, |
| "learning_rate": 3.9509468686252776e-05, |
| "loss": 0.3017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2941988706588745, |
| "step": 845, |
| "valid_targets_mean": 2384.8, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 1.153324287652646, |
| "grad_norm": 0.5769173901162691, |
| "learning_rate": 3.9494463277394256e-05, |
| "loss": 0.2817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2812822461128235, |
| "step": 850, |
| "valid_targets_mean": 3832.6, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 1.1601085481682496, |
| "grad_norm": 0.6902875767301633, |
| "learning_rate": 3.947923474095575e-05, |
| "loss": 0.2994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2795878052711487, |
| "step": 855, |
| "valid_targets_mean": 2588.9, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 1.1668928086838535, |
| "grad_norm": 0.6932765985873842, |
| "learning_rate": 3.946378325123836e-05, |
| "loss": 0.3018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29586702585220337, |
| "step": 860, |
| "valid_targets_mean": 2557.6, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 1.1736770691994574, |
| "grad_norm": 0.8142184847264059, |
| "learning_rate": 3.9448108985095036e-05, |
| "loss": 0.3229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3577713966369629, |
| "step": 865, |
| "valid_targets_mean": 2609.6, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 1.180461329715061, |
| "grad_norm": 0.6535181326922942, |
| "learning_rate": 3.943221212192859e-05, |
| "loss": 0.3037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3148359954357147, |
| "step": 870, |
| "valid_targets_mean": 3229.5, |
| "valid_targets_min": 1220 |
| }, |
| { |
| "epoch": 1.187245590230665, |
| "grad_norm": 0.6505841244224432, |
| "learning_rate": 3.941609284368956e-05, |
| "loss": 0.3067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2802058458328247, |
| "step": 875, |
| "valid_targets_mean": 3026.5, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 1.1940298507462686, |
| "grad_norm": 0.6960891267075039, |
| "learning_rate": 3.939975133487422e-05, |
| "loss": 0.2933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3029175400733948, |
| "step": 880, |
| "valid_targets_mean": 2756.3, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 1.2008141112618724, |
| "grad_norm": 0.6800823657754136, |
| "learning_rate": 3.938318778252241e-05, |
| "loss": 0.3207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29470711946487427, |
| "step": 885, |
| "valid_targets_mean": 3122.9, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 1.2075983717774763, |
| "grad_norm": 0.7814295994587976, |
| "learning_rate": 3.9366402376215405e-05, |
| "loss": 0.3077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31138426065444946, |
| "step": 890, |
| "valid_targets_mean": 2320.1, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 1.21438263229308, |
| "grad_norm": 0.7335457886775086, |
| "learning_rate": 3.934939530807376e-05, |
| "loss": 0.308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2950824797153473, |
| "step": 895, |
| "valid_targets_mean": 2272.6, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 1.2211668928086838, |
| "grad_norm": 0.7406055989848646, |
| "learning_rate": 3.933216677275512e-05, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30795565247535706, |
| "step": 900, |
| "valid_targets_mean": 2708.2, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 1.2279511533242877, |
| "grad_norm": 0.7271310816643761, |
| "learning_rate": 3.931471696745194e-05, |
| "loss": 0.2949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3034670650959015, |
| "step": 905, |
| "valid_targets_mean": 2719.8, |
| "valid_targets_min": 1144 |
| }, |
| { |
| "epoch": 1.2347354138398914, |
| "grad_norm": 0.6098483261250427, |
| "learning_rate": 3.929704609188927e-05, |
| "loss": 0.2926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30650919675827026, |
| "step": 910, |
| "valid_targets_mean": 3541.2, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 1.2415196743554953, |
| "grad_norm": 0.6695184378675495, |
| "learning_rate": 3.9279154348322495e-05, |
| "loss": 0.2949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29480671882629395, |
| "step": 915, |
| "valid_targets_mean": 2631.8, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 1.2483039348710991, |
| "grad_norm": 0.6364092125880288, |
| "learning_rate": 3.926104194153495e-05, |
| "loss": 0.2941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2782565951347351, |
| "step": 920, |
| "valid_targets_mean": 2974.1, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 1.2550881953867028, |
| "grad_norm": 0.8301944651771248, |
| "learning_rate": 3.924270907883562e-05, |
| "loss": 0.2939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2791467607021332, |
| "step": 925, |
| "valid_targets_mean": 2883.7, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 1.2618724559023067, |
| "grad_norm": 0.8022627958583087, |
| "learning_rate": 3.922415597005677e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.281793475151062, |
| "step": 930, |
| "valid_targets_mean": 1910.9, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 1.2686567164179103, |
| "grad_norm": 0.6363883403354091, |
| "learning_rate": 3.920538282755153e-05, |
| "loss": 0.2933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2905217707157135, |
| "step": 935, |
| "valid_targets_mean": 3314.0, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 1.2754409769335142, |
| "grad_norm": 0.637738645846229, |
| "learning_rate": 3.918638986619146e-05, |
| "loss": 0.2977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2899988889694214, |
| "step": 940, |
| "valid_targets_mean": 3262.2, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 1.282225237449118, |
| "grad_norm": 0.6487116870961588, |
| "learning_rate": 3.9167177303364115e-05, |
| "loss": 0.3026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3026847243309021, |
| "step": 945, |
| "valid_targets_mean": 3640.3, |
| "valid_targets_min": 1299 |
| }, |
| { |
| "epoch": 1.289009497964722, |
| "grad_norm": 0.7490100317858217, |
| "learning_rate": 3.9147745358970524e-05, |
| "loss": 0.3071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28088971972465515, |
| "step": 950, |
| "valid_targets_mean": 2377.6, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 1.2957937584803256, |
| "grad_norm": 0.7137946081945997, |
| "learning_rate": 3.9128094255422696e-05, |
| "loss": 0.2934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2796930968761444, |
| "step": 955, |
| "valid_targets_mean": 2555.9, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 1.3025780189959295, |
| "grad_norm": 0.5993098074500324, |
| "learning_rate": 3.910822421764106e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2874249219894409, |
| "step": 960, |
| "valid_targets_mean": 3206.5, |
| "valid_targets_min": 1560 |
| }, |
| { |
| "epoch": 1.3093622795115332, |
| "grad_norm": 0.9231815200437856, |
| "learning_rate": 3.9088135473051914e-05, |
| "loss": 0.3072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33113178610801697, |
| "step": 965, |
| "valid_targets_mean": 2220.5, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 1.316146540027137, |
| "grad_norm": 0.6697716973175908, |
| "learning_rate": 3.906782825158479e-05, |
| "loss": 0.2955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.285530149936676, |
| "step": 970, |
| "valid_targets_mean": 2935.3, |
| "valid_targets_min": 1225 |
| }, |
| { |
| "epoch": 1.322930800542741, |
| "grad_norm": 0.7281815877744984, |
| "learning_rate": 3.904730278566986e-05, |
| "loss": 0.3115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3005235493183136, |
| "step": 975, |
| "valid_targets_mean": 2603.3, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 1.3297150610583446, |
| "grad_norm": 0.748646343253343, |
| "learning_rate": 3.9026559310235234e-05, |
| "loss": 0.29, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2904489040374756, |
| "step": 980, |
| "valid_targets_mean": 2551.4, |
| "valid_targets_min": 1193 |
| }, |
| { |
| "epoch": 1.3364993215739485, |
| "grad_norm": 0.6174464137752114, |
| "learning_rate": 3.900559806270429e-05, |
| "loss": 0.2787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24410629272460938, |
| "step": 985, |
| "valid_targets_mean": 2941.9, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 1.3432835820895521, |
| "grad_norm": 0.7452637300432898, |
| "learning_rate": 3.898441928299297e-05, |
| "loss": 0.3051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30062615871429443, |
| "step": 990, |
| "valid_targets_mean": 2270.9, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 1.350067842605156, |
| "grad_norm": 0.6464889713515524, |
| "learning_rate": 3.896302321350702e-05, |
| "loss": 0.313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2945151925086975, |
| "step": 995, |
| "valid_targets_mean": 3044.5, |
| "valid_targets_min": 1167 |
| }, |
| { |
| "epoch": 1.3568521031207599, |
| "grad_norm": 0.7017509437824359, |
| "learning_rate": 3.894141009913921e-05, |
| "loss": 0.3039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29814016819000244, |
| "step": 1000, |
| "valid_targets_mean": 2468.2, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 1.3636363636363638, |
| "grad_norm": 0.6780559700998617, |
| "learning_rate": 3.891958018726655e-05, |
| "loss": 0.2888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28629612922668457, |
| "step": 1005, |
| "valid_targets_mean": 2853.8, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 1.3704206241519674, |
| "grad_norm": 0.8191037771052176, |
| "learning_rate": 3.8897533727747434e-05, |
| "loss": 0.2924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3040386438369751, |
| "step": 1010, |
| "valid_targets_mean": 2648.5, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 1.3772048846675713, |
| "grad_norm": 0.668502617185383, |
| "learning_rate": 3.88752709729188e-05, |
| "loss": 0.2884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31058913469314575, |
| "step": 1015, |
| "valid_targets_mean": 3066.1, |
| "valid_targets_min": 1388 |
| }, |
| { |
| "epoch": 1.383989145183175, |
| "grad_norm": 0.7094563085559425, |
| "learning_rate": 3.885279217759324e-05, |
| "loss": 0.293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27286526560783386, |
| "step": 1020, |
| "valid_targets_mean": 2670.2, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 1.3907734056987788, |
| "grad_norm": 0.6912293288922038, |
| "learning_rate": 3.883009759905607e-05, |
| "loss": 0.2901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29000505805015564, |
| "step": 1025, |
| "valid_targets_mean": 3009.6, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 1.3975576662143827, |
| "grad_norm": 0.598939732528779, |
| "learning_rate": 3.8807187497062394e-05, |
| "loss": 0.3045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27007484436035156, |
| "step": 1030, |
| "valid_targets_mean": 3264.9, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 1.4043419267299864, |
| "grad_norm": 0.6399031295655998, |
| "learning_rate": 3.8784062133834136e-05, |
| "loss": 0.3077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30463242530822754, |
| "step": 1035, |
| "valid_targets_mean": 2838.9, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 1.4111261872455902, |
| "grad_norm": 0.6746984691711082, |
| "learning_rate": 3.876072177405703e-05, |
| "loss": 0.2943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3121001720428467, |
| "step": 1040, |
| "valid_targets_mean": 2916.5, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 1.417910447761194, |
| "grad_norm": 0.7284630600724608, |
| "learning_rate": 3.8737166684877596e-05, |
| "loss": 0.2738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2644261121749878, |
| "step": 1045, |
| "valid_targets_mean": 2068.2, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 1.4246947082767978, |
| "grad_norm": 0.6562294087271845, |
| "learning_rate": 3.871339713590007e-05, |
| "loss": 0.2954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2642728388309479, |
| "step": 1050, |
| "valid_targets_mean": 2884.8, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 1.4314789687924017, |
| "grad_norm": 0.6478250945987496, |
| "learning_rate": 3.868941339918335e-05, |
| "loss": 0.2929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32172685861587524, |
| "step": 1055, |
| "valid_targets_mean": 3082.5, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 1.4382632293080055, |
| "grad_norm": 0.644202603849787, |
| "learning_rate": 3.866521574923784e-05, |
| "loss": 0.3059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31228554248809814, |
| "step": 1060, |
| "valid_targets_mean": 3175.8, |
| "valid_targets_min": 1451 |
| }, |
| { |
| "epoch": 1.4450474898236092, |
| "grad_norm": 0.661879013668605, |
| "learning_rate": 3.864080446302234e-05, |
| "loss": 0.3022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3252270519733429, |
| "step": 1065, |
| "valid_targets_mean": 3194.7, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 1.451831750339213, |
| "grad_norm": 0.6549935813841651, |
| "learning_rate": 3.8616179819940857e-05, |
| "loss": 0.3017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28648945689201355, |
| "step": 1070, |
| "valid_targets_mean": 2721.0, |
| "valid_targets_min": 1331 |
| }, |
| { |
| "epoch": 1.4586160108548167, |
| "grad_norm": 0.6531723880805292, |
| "learning_rate": 3.859134210183941e-05, |
| "loss": 0.3165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31207776069641113, |
| "step": 1075, |
| "valid_targets_mean": 2777.7, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 1.4654002713704206, |
| "grad_norm": 0.6716764880355328, |
| "learning_rate": 3.856629159300283e-05, |
| "loss": 0.3037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32089391350746155, |
| "step": 1080, |
| "valid_targets_mean": 3052.2, |
| "valid_targets_min": 690 |
| }, |
| { |
| "epoch": 1.4721845318860245, |
| "grad_norm": 0.6655307018039186, |
| "learning_rate": 3.8541028580151465e-05, |
| "loss": 0.2882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26921534538269043, |
| "step": 1085, |
| "valid_targets_mean": 2680.0, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 1.4789687924016282, |
| "grad_norm": 0.7389639492671433, |
| "learning_rate": 3.8515553352437927e-05, |
| "loss": 0.2983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28306636214256287, |
| "step": 1090, |
| "valid_targets_mean": 2348.4, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 1.485753052917232, |
| "grad_norm": 0.6679028777069137, |
| "learning_rate": 3.848986620144376e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26913198828697205, |
| "step": 1095, |
| "valid_targets_mean": 2657.7, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 1.4925373134328357, |
| "grad_norm": 0.6297786728759884, |
| "learning_rate": 3.846396742117614e-05, |
| "loss": 0.2942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31999313831329346, |
| "step": 1100, |
| "valid_targets_mean": 3368.2, |
| "valid_targets_min": 1524 |
| }, |
| { |
| "epoch": 1.4993215739484396, |
| "grad_norm": 0.6149463581344302, |
| "learning_rate": 3.843785730806447e-05, |
| "loss": 0.2946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29018402099609375, |
| "step": 1105, |
| "valid_targets_mean": 3319.4, |
| "valid_targets_min": 1354 |
| }, |
| { |
| "epoch": 1.5061058344640434, |
| "grad_norm": 0.809702645817836, |
| "learning_rate": 3.8411536160957004e-05, |
| "loss": 0.2942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29155030846595764, |
| "step": 1110, |
| "valid_targets_mean": 2079.1, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 1.5128900949796473, |
| "grad_norm": 0.6375577416325251, |
| "learning_rate": 3.8385004281117425e-05, |
| "loss": 0.2877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26376283168792725, |
| "step": 1115, |
| "valid_targets_mean": 3094.1, |
| "valid_targets_min": 951 |
| }, |
| { |
| "epoch": 1.519674355495251, |
| "grad_norm": 0.7117061338880089, |
| "learning_rate": 3.83582619722214e-05, |
| "loss": 0.2951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32851043343544006, |
| "step": 1120, |
| "valid_targets_mean": 2709.3, |
| "valid_targets_min": 1321 |
| }, |
| { |
| "epoch": 1.5264586160108549, |
| "grad_norm": 0.7195810818077915, |
| "learning_rate": 3.833130954035311e-05, |
| "loss": 0.2864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29876279830932617, |
| "step": 1125, |
| "valid_targets_mean": 2322.1, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 1.5332428765264585, |
| "grad_norm": 0.6893087648021691, |
| "learning_rate": 3.830414729400172e-05, |
| "loss": 0.2955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32284027338027954, |
| "step": 1130, |
| "valid_targets_mean": 2666.9, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 1.5400271370420624, |
| "grad_norm": 0.6375253452820985, |
| "learning_rate": 3.8276775544057886e-05, |
| "loss": 0.2918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2919315695762634, |
| "step": 1135, |
| "valid_targets_mean": 3260.2, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 1.5468113975576663, |
| "grad_norm": 0.7850898957886953, |
| "learning_rate": 3.824919460381016e-05, |
| "loss": 0.3168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2958727180957794, |
| "step": 1140, |
| "valid_targets_mean": 3326.9, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 1.5535956580732702, |
| "grad_norm": 0.6951131898750251, |
| "learning_rate": 3.822140478894143e-05, |
| "loss": 0.2965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3108687102794647, |
| "step": 1145, |
| "valid_targets_mean": 2787.1, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 1.5603799185888738, |
| "grad_norm": 0.733903133533046, |
| "learning_rate": 3.8193406417525304e-05, |
| "loss": 0.2998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3235079050064087, |
| "step": 1150, |
| "valid_targets_mean": 2633.2, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 1.5671641791044775, |
| "grad_norm": 0.731200133367719, |
| "learning_rate": 3.816519981002245e-05, |
| "loss": 0.3037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2996997535228729, |
| "step": 1155, |
| "valid_targets_mean": 2690.8, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 1.5739484396200814, |
| "grad_norm": 0.6385315926667753, |
| "learning_rate": 3.8136785289276953e-05, |
| "loss": 0.2806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27406877279281616, |
| "step": 1160, |
| "valid_targets_mean": 3035.6, |
| "valid_targets_min": 1429 |
| }, |
| { |
| "epoch": 1.5807327001356852, |
| "grad_norm": 0.7362793886550267, |
| "learning_rate": 3.81081631805126e-05, |
| "loss": 0.2901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34110113978385925, |
| "step": 1165, |
| "valid_targets_mean": 2940.3, |
| "valid_targets_min": 805 |
| }, |
| { |
| "epoch": 1.587516960651289, |
| "grad_norm": 0.7349732590117125, |
| "learning_rate": 3.807933381132917e-05, |
| "loss": 0.3104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2936994135379791, |
| "step": 1170, |
| "valid_targets_mean": 2527.9, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 1.5943012211668928, |
| "grad_norm": 0.7064877699762256, |
| "learning_rate": 3.805029751169869e-05, |
| "loss": 0.2972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29555004835128784, |
| "step": 1175, |
| "valid_targets_mean": 2654.1, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 1.6010854816824966, |
| "grad_norm": 0.6447256804044132, |
| "learning_rate": 3.802105461396163e-05, |
| "loss": 0.2908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31151026487350464, |
| "step": 1180, |
| "valid_targets_mean": 2946.4, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 1.6078697421981003, |
| "grad_norm": 0.5108082252163869, |
| "learning_rate": 3.799160545282312e-05, |
| "loss": 0.279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2245091050863266, |
| "step": 1185, |
| "valid_targets_mean": 3714.3, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 1.6146540027137042, |
| "grad_norm": 0.6878930154133356, |
| "learning_rate": 3.796195036534914e-05, |
| "loss": 0.2658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2854118049144745, |
| "step": 1190, |
| "valid_targets_mean": 2541.6, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 1.621438263229308, |
| "grad_norm": 0.8006673353310524, |
| "learning_rate": 3.793208969096261e-05, |
| "loss": 0.2921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28456225991249084, |
| "step": 1195, |
| "valid_targets_mean": 2468.4, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 1.628222523744912, |
| "grad_norm": 0.7653832467394758, |
| "learning_rate": 3.790202377143956e-05, |
| "loss": 0.2975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31006136536598206, |
| "step": 1200, |
| "valid_targets_mean": 2955.1, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 1.6350067842605156, |
| "grad_norm": 0.7315864774837488, |
| "learning_rate": 3.7871752950905174e-05, |
| "loss": 0.304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3193378448486328, |
| "step": 1205, |
| "valid_targets_mean": 2490.4, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 1.6417910447761193, |
| "grad_norm": 0.7643610632774577, |
| "learning_rate": 3.784127757582987e-05, |
| "loss": 0.302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3098391592502594, |
| "step": 1210, |
| "valid_targets_mean": 2237.9, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 1.6485753052917231, |
| "grad_norm": 0.6008604291150627, |
| "learning_rate": 3.7810597995025336e-05, |
| "loss": 0.2835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2691340446472168, |
| "step": 1215, |
| "valid_targets_mean": 2998.4, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 1.655359565807327, |
| "grad_norm": 0.6364039836954427, |
| "learning_rate": 3.7779714559640555e-05, |
| "loss": 0.2894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29183879494667053, |
| "step": 1220, |
| "valid_targets_mean": 3299.7, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 1.662143826322931, |
| "grad_norm": 0.8360956147817608, |
| "learning_rate": 3.774862762315772e-05, |
| "loss": 0.2918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30887937545776367, |
| "step": 1225, |
| "valid_targets_mean": 2721.2, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 1.6689280868385346, |
| "grad_norm": 0.6028843978675598, |
| "learning_rate": 3.771733754138829e-05, |
| "loss": 0.2873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2811635732650757, |
| "step": 1230, |
| "valid_targets_mean": 3361.2, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 1.6757123473541384, |
| "grad_norm": 0.7428753179701643, |
| "learning_rate": 3.768584467246883e-05, |
| "loss": 0.3046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30133670568466187, |
| "step": 1235, |
| "valid_targets_mean": 3111.6, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 1.682496607869742, |
| "grad_norm": 0.7569776252384394, |
| "learning_rate": 3.765414937685695e-05, |
| "loss": 0.2999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3009093999862671, |
| "step": 1240, |
| "valid_targets_mean": 2188.5, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 1.689280868385346, |
| "grad_norm": 0.5814940877820675, |
| "learning_rate": 3.762225201732715e-05, |
| "loss": 0.2836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26204395294189453, |
| "step": 1245, |
| "valid_targets_mean": 3493.9, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 1.6960651289009498, |
| "grad_norm": 0.726614967916978, |
| "learning_rate": 3.7590152958966745e-05, |
| "loss": 0.2898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.321370929479599, |
| "step": 1250, |
| "valid_targets_mean": 2850.1, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 1.7028493894165537, |
| "grad_norm": 0.7426123839264059, |
| "learning_rate": 3.7557852569171585e-05, |
| "loss": 0.2917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2817172110080719, |
| "step": 1255, |
| "valid_targets_mean": 2224.9, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 1.7096336499321574, |
| "grad_norm": 0.8799943306194825, |
| "learning_rate": 3.7525351217641915e-05, |
| "loss": 0.3085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3357008993625641, |
| "step": 1260, |
| "valid_targets_mean": 3111.0, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 1.716417910447761, |
| "grad_norm": 0.6111490118620997, |
| "learning_rate": 3.7492649276378124e-05, |
| "loss": 0.2828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2888554632663727, |
| "step": 1265, |
| "valid_targets_mean": 3284.9, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 1.723202170963365, |
| "grad_norm": 0.6589094616205049, |
| "learning_rate": 3.7459747119676484e-05, |
| "loss": 0.305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30003267526626587, |
| "step": 1270, |
| "valid_targets_mean": 2895.2, |
| "valid_targets_min": 1178 |
| }, |
| { |
| "epoch": 1.7299864314789688, |
| "grad_norm": 0.640067102221961, |
| "learning_rate": 3.742664512412488e-05, |
| "loss": 0.3087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31731560826301575, |
| "step": 1275, |
| "valid_targets_mean": 3285.7, |
| "valid_targets_min": 1465 |
| }, |
| { |
| "epoch": 1.7367706919945727, |
| "grad_norm": 0.6939365904317435, |
| "learning_rate": 3.7393343668598495e-05, |
| "loss": 0.2927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2893563210964203, |
| "step": 1280, |
| "valid_targets_mean": 2671.6, |
| "valid_targets_min": 1204 |
| }, |
| { |
| "epoch": 1.7435549525101763, |
| "grad_norm": 0.6861699873490201, |
| "learning_rate": 3.735984313425544e-05, |
| "loss": 0.2781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3145902156829834, |
| "step": 1285, |
| "valid_targets_mean": 2858.2, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 1.7503392130257802, |
| "grad_norm": 0.5893287065962871, |
| "learning_rate": 3.732614390453245e-05, |
| "loss": 0.2994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2815445065498352, |
| "step": 1290, |
| "valid_targets_mean": 3251.5, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 1.7571234735413839, |
| "grad_norm": 0.6605129026405406, |
| "learning_rate": 3.729224636514046e-05, |
| "loss": 0.2863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28478604555130005, |
| "step": 1295, |
| "valid_targets_mean": 2549.3, |
| "valid_targets_min": 961 |
| }, |
| { |
| "epoch": 1.7639077340569878, |
| "grad_norm": 0.7080612755113385, |
| "learning_rate": 3.7258150904060184e-05, |
| "loss": 0.2862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30780327320098877, |
| "step": 1300, |
| "valid_targets_mean": 2727.4, |
| "valid_targets_min": 1274 |
| }, |
| { |
| "epoch": 1.7706919945725916, |
| "grad_norm": 0.6157145299604274, |
| "learning_rate": 3.72238579115377e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31349170207977295, |
| "step": 1305, |
| "valid_targets_mean": 3526.4, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 1.7774762550881955, |
| "grad_norm": 0.6628037819653686, |
| "learning_rate": 3.7189367780079956e-05, |
| "loss": 0.3035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30656638741493225, |
| "step": 1310, |
| "valid_targets_mean": 2991.2, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 1.7842605156037992, |
| "grad_norm": 0.7303577186056781, |
| "learning_rate": 3.7154680904450306e-05, |
| "loss": 0.2947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25550299882888794, |
| "step": 1315, |
| "valid_targets_mean": 2137.6, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 1.7910447761194028, |
| "grad_norm": 0.7432172204712651, |
| "learning_rate": 3.711979768166397e-05, |
| "loss": 0.2878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2851966619491577, |
| "step": 1320, |
| "valid_targets_mean": 2175.0, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 1.7978290366350067, |
| "grad_norm": 0.6101418921075195, |
| "learning_rate": 3.708471851098349e-05, |
| "loss": 0.2989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29730525612831116, |
| "step": 1325, |
| "valid_targets_mean": 3097.9, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 1.8046132971506106, |
| "grad_norm": 0.6995136361312011, |
| "learning_rate": 3.704944379391418e-05, |
| "loss": 0.2947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28219103813171387, |
| "step": 1330, |
| "valid_targets_mean": 2626.4, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 1.8113975576662145, |
| "grad_norm": 0.7747003781816696, |
| "learning_rate": 3.70139739341995e-05, |
| "loss": 0.304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2927844226360321, |
| "step": 1335, |
| "valid_targets_mean": 2138.4, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 1.8181818181818183, |
| "grad_norm": 0.6296472975547316, |
| "learning_rate": 3.6978309337816475e-05, |
| "loss": 0.3003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2978728413581848, |
| "step": 1340, |
| "valid_targets_mean": 2901.1, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 1.824966078697422, |
| "grad_norm": 0.6529444503372535, |
| "learning_rate": 3.6942450412971006e-05, |
| "loss": 0.2869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2776811420917511, |
| "step": 1345, |
| "valid_targets_mean": 2990.2, |
| "valid_targets_min": 1290 |
| }, |
| { |
| "epoch": 1.8317503392130257, |
| "grad_norm": 0.6073872705332342, |
| "learning_rate": 3.690639757009322e-05, |
| "loss": 0.2851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2847082316875458, |
| "step": 1350, |
| "valid_targets_mean": 3336.8, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 1.8385345997286295, |
| "grad_norm": 0.6726342078161094, |
| "learning_rate": 3.687015122183278e-05, |
| "loss": 0.2985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31284165382385254, |
| "step": 1355, |
| "valid_targets_mean": 3056.4, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 1.8453188602442334, |
| "grad_norm": 0.6570381591584823, |
| "learning_rate": 3.6833711783054146e-05, |
| "loss": 0.2845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27733927965164185, |
| "step": 1360, |
| "valid_targets_mean": 2751.9, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 1.8521031207598373, |
| "grad_norm": 0.7873750592257918, |
| "learning_rate": 3.6797079670831835e-05, |
| "loss": 0.307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2843400537967682, |
| "step": 1365, |
| "valid_targets_mean": 2333.1, |
| "valid_targets_min": 1105 |
| }, |
| { |
| "epoch": 1.858887381275441, |
| "grad_norm": 0.6324090204988919, |
| "learning_rate": 3.676025530444563e-05, |
| "loss": 0.2728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2516278326511383, |
| "step": 1370, |
| "valid_targets_mean": 2830.2, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 1.8656716417910446, |
| "grad_norm": 0.7359610094620258, |
| "learning_rate": 3.672323910537581e-05, |
| "loss": 0.2843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31318145990371704, |
| "step": 1375, |
| "valid_targets_mean": 2449.1, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 1.8724559023066485, |
| "grad_norm": 0.6497309545854958, |
| "learning_rate": 3.668603149729832e-05, |
| "loss": 0.2844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26779574155807495, |
| "step": 1380, |
| "valid_targets_mean": 2840.0, |
| "valid_targets_min": 1094 |
| }, |
| { |
| "epoch": 1.8792401628222524, |
| "grad_norm": 0.6267804873051095, |
| "learning_rate": 3.664863290607989e-05, |
| "loss": 0.3077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28004786372184753, |
| "step": 1385, |
| "valid_targets_mean": 2897.0, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 1.8860244233378562, |
| "grad_norm": 0.6879680447864663, |
| "learning_rate": 3.6611043759773195e-05, |
| "loss": 0.2888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31352704763412476, |
| "step": 1390, |
| "valid_targets_mean": 2756.0, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 1.8928086838534601, |
| "grad_norm": 0.6301096600514708, |
| "learning_rate": 3.6573264488611944e-05, |
| "loss": 0.2915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3064451217651367, |
| "step": 1395, |
| "valid_targets_mean": 3032.6, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 1.8995929443690638, |
| "grad_norm": 0.6958211841970261, |
| "learning_rate": 3.6535295525005964e-05, |
| "loss": 0.2965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2943972647190094, |
| "step": 1400, |
| "valid_targets_mean": 2836.4, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 1.9063772048846674, |
| "grad_norm": 0.7887387389485876, |
| "learning_rate": 3.649713730353623e-05, |
| "loss": 0.2989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28154975175857544, |
| "step": 1405, |
| "valid_targets_mean": 2262.3, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 1.9131614654002713, |
| "grad_norm": 1.5313410215337464, |
| "learning_rate": 3.645879026094991e-05, |
| "loss": 0.3075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29764658212661743, |
| "step": 1410, |
| "valid_targets_mean": 2811.7, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 1.9199457259158752, |
| "grad_norm": 0.7151356767653663, |
| "learning_rate": 3.642025483615536e-05, |
| "loss": 0.3223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3090359568595886, |
| "step": 1415, |
| "valid_targets_mean": 2566.2, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 1.926729986431479, |
| "grad_norm": 0.7117696747551553, |
| "learning_rate": 3.6381531470217095e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32978102564811707, |
| "step": 1420, |
| "valid_targets_mean": 2933.4, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 1.9335142469470827, |
| "grad_norm": 0.7645454065347908, |
| "learning_rate": 3.634262060635075e-05, |
| "loss": 0.2951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31343501806259155, |
| "step": 1425, |
| "valid_targets_mean": 2486.8, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 1.9402985074626866, |
| "grad_norm": 0.6774335342238738, |
| "learning_rate": 3.6303522689918015e-05, |
| "loss": 0.2876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2950223684310913, |
| "step": 1430, |
| "valid_targets_mean": 2928.6, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 1.9470827679782903, |
| "grad_norm": 0.6640212258014019, |
| "learning_rate": 3.6264238168421505e-05, |
| "loss": 0.2872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2745462656021118, |
| "step": 1435, |
| "valid_targets_mean": 2628.1, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 1.9538670284938942, |
| "grad_norm": 0.6832788009297351, |
| "learning_rate": 3.622476749149967e-05, |
| "loss": 0.2829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2921183705329895, |
| "step": 1440, |
| "valid_targets_mean": 2838.4, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 1.960651289009498, |
| "grad_norm": 1.02465763567763, |
| "learning_rate": 3.618511111092164e-05, |
| "loss": 0.2885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30975252389907837, |
| "step": 1445, |
| "valid_targets_mean": 2425.6, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 1.967435549525102, |
| "grad_norm": 0.853915586974603, |
| "learning_rate": 3.6145269480582035e-05, |
| "loss": 0.309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3293916583061218, |
| "step": 1450, |
| "valid_targets_mean": 3230.9, |
| "valid_targets_min": 1358 |
| }, |
| { |
| "epoch": 1.9742198100407056, |
| "grad_norm": 0.7500252855517454, |
| "learning_rate": 3.61052430564958e-05, |
| "loss": 0.2786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.285286545753479, |
| "step": 1455, |
| "valid_targets_mean": 1947.4, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 1.9810040705563092, |
| "grad_norm": 0.6777810077646718, |
| "learning_rate": 3.606503229679299e-05, |
| "loss": 0.302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30354389548301697, |
| "step": 1460, |
| "valid_targets_mean": 2624.3, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 1.987788331071913, |
| "grad_norm": 0.7750533185261688, |
| "learning_rate": 3.6024637661713463e-05, |
| "loss": 0.2893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2793115973472595, |
| "step": 1465, |
| "valid_targets_mean": 2612.2, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 1.994572591587517, |
| "grad_norm": 0.7919665782855059, |
| "learning_rate": 3.59840596136017e-05, |
| "loss": 0.2908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27840328216552734, |
| "step": 1470, |
| "valid_targets_mean": 2205.1, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 2.001356852103121, |
| "grad_norm": 0.6677080223559784, |
| "learning_rate": 3.5943298616901434e-05, |
| "loss": 0.2717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.252011239528656, |
| "step": 1475, |
| "valid_targets_mean": 3309.2, |
| "valid_targets_min": 1337 |
| }, |
| { |
| "epoch": 2.0081411126187247, |
| "grad_norm": 0.7207007939374871, |
| "learning_rate": 3.590235513815041e-05, |
| "loss": 0.2529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2334105670452118, |
| "step": 1480, |
| "valid_targets_mean": 2218.1, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 2.014925373134328, |
| "grad_norm": 0.7632243131847694, |
| "learning_rate": 3.586122964597499e-05, |
| "loss": 0.2697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2754613161087036, |
| "step": 1485, |
| "valid_targets_mean": 2588.3, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 2.021709633649932, |
| "grad_norm": 0.7149262249272994, |
| "learning_rate": 3.581992261108478e-05, |
| "loss": 0.2478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22789128124713898, |
| "step": 1490, |
| "valid_targets_mean": 2391.2, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 2.028493894165536, |
| "grad_norm": 0.7021382513288259, |
| "learning_rate": 3.577843450626729e-05, |
| "loss": 0.251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2544996738433838, |
| "step": 1495, |
| "valid_targets_mean": 3086.4, |
| "valid_targets_min": 1196 |
| }, |
| { |
| "epoch": 2.03527815468114, |
| "grad_norm": 0.6740781431872369, |
| "learning_rate": 3.573676580638252e-05, |
| "loss": 0.2586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2830080986022949, |
| "step": 1500, |
| "valid_targets_mean": 3231.4, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 2.0420624151967437, |
| "grad_norm": 0.6625091780634826, |
| "learning_rate": 3.569491698835747e-05, |
| "loss": 0.2481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2644336223602295, |
| "step": 1505, |
| "valid_targets_mean": 3546.1, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 2.0488466757123476, |
| "grad_norm": 0.772346491835651, |
| "learning_rate": 3.565288853118073e-05, |
| "loss": 0.2565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25193676352500916, |
| "step": 1510, |
| "valid_targets_mean": 2011.5, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 2.055630936227951, |
| "grad_norm": 0.7015358520017895, |
| "learning_rate": 3.561068091589699e-05, |
| "loss": 0.2513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2524373531341553, |
| "step": 1515, |
| "valid_targets_mean": 2833.7, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 2.062415196743555, |
| "grad_norm": 0.6819591135273353, |
| "learning_rate": 3.556829462560152e-05, |
| "loss": 0.2622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2732108533382416, |
| "step": 1520, |
| "valid_targets_mean": 3037.2, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 2.0691994572591588, |
| "grad_norm": 0.7308638462885366, |
| "learning_rate": 3.552573014543465e-05, |
| "loss": 0.2549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24330492317676544, |
| "step": 1525, |
| "valid_targets_mean": 2520.2, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 2.0759837177747626, |
| "grad_norm": 0.7835094284328342, |
| "learning_rate": 3.548298796257623e-05, |
| "loss": 0.2589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2812742590904236, |
| "step": 1530, |
| "valid_targets_mean": 2378.4, |
| "valid_targets_min": 512 |
| }, |
| { |
| "epoch": 2.0827679782903665, |
| "grad_norm": 0.6968412144913585, |
| "learning_rate": 3.5440068566240006e-05, |
| "loss": 0.2536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25412964820861816, |
| "step": 1535, |
| "valid_targets_mean": 2384.0, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 2.08955223880597, |
| "grad_norm": 0.7616955455624203, |
| "learning_rate": 3.539697244766809e-05, |
| "loss": 0.2738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29562467336654663, |
| "step": 1540, |
| "valid_targets_mean": 2267.1, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 2.096336499321574, |
| "grad_norm": 0.7131875884565378, |
| "learning_rate": 3.5353700100125285e-05, |
| "loss": 0.256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2696763873100281, |
| "step": 1545, |
| "valid_targets_mean": 2582.3, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 2.1031207598371777, |
| "grad_norm": 0.7768997711520144, |
| "learning_rate": 3.531025201889346e-05, |
| "loss": 0.2649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27121901512145996, |
| "step": 1550, |
| "valid_targets_mean": 2734.2, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 2.1099050203527816, |
| "grad_norm": 0.5972671434746235, |
| "learning_rate": 3.526662870126588e-05, |
| "loss": 0.2467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21913185715675354, |
| "step": 1555, |
| "valid_targets_mean": 3436.5, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 2.1166892808683855, |
| "grad_norm": 0.8928905338020054, |
| "learning_rate": 3.5222830646541495e-05, |
| "loss": 0.2407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2423502504825592, |
| "step": 1560, |
| "valid_targets_mean": 3034.4, |
| "valid_targets_min": 1466 |
| }, |
| { |
| "epoch": 2.123473541383989, |
| "grad_norm": 0.7792302275809843, |
| "learning_rate": 3.517885835601927e-05, |
| "loss": 0.2544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23429229855537415, |
| "step": 1565, |
| "valid_targets_mean": 2170.3, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 2.130257801899593, |
| "grad_norm": 0.6637166367797426, |
| "learning_rate": 3.5134712332992396e-05, |
| "loss": 0.2545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2654414474964142, |
| "step": 1570, |
| "valid_targets_mean": 3309.1, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 2.1370420624151967, |
| "grad_norm": 0.7708919189354086, |
| "learning_rate": 3.5090393082742555e-05, |
| "loss": 0.2539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26184701919555664, |
| "step": 1575, |
| "valid_targets_mean": 2298.2, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 2.1438263229308006, |
| "grad_norm": 0.7215973806908841, |
| "learning_rate": 3.504590111253414e-05, |
| "loss": 0.2532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27381983399391174, |
| "step": 1580, |
| "valid_targets_mean": 2703.3, |
| "valid_targets_min": 1289 |
| }, |
| { |
| "epoch": 2.1506105834464044, |
| "grad_norm": 0.8043249601230251, |
| "learning_rate": 3.5001236931608446e-05, |
| "loss": 0.2609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2702006995677948, |
| "step": 1585, |
| "valid_targets_mean": 2177.4, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 2.1573948439620083, |
| "grad_norm": 0.6914069724407004, |
| "learning_rate": 3.495640105117784e-05, |
| "loss": 0.2629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27623242139816284, |
| "step": 1590, |
| "valid_targets_mean": 2991.8, |
| "valid_targets_min": 1354 |
| }, |
| { |
| "epoch": 2.1641791044776117, |
| "grad_norm": 0.8082050307344478, |
| "learning_rate": 3.491139398441989e-05, |
| "loss": 0.2543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2768654525279999, |
| "step": 1595, |
| "valid_targets_mean": 2209.0, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 2.1709633649932156, |
| "grad_norm": 0.7574042859615202, |
| "learning_rate": 3.4866216246471536e-05, |
| "loss": 0.2571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28827136754989624, |
| "step": 1600, |
| "valid_targets_mean": 2482.6, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 2.1777476255088195, |
| "grad_norm": 0.6561439016270234, |
| "learning_rate": 3.482086835442313e-05, |
| "loss": 0.2579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2732161581516266, |
| "step": 1605, |
| "valid_targets_mean": 3250.7, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 2.1845318860244234, |
| "grad_norm": 0.6444399840162086, |
| "learning_rate": 3.47753508273126e-05, |
| "loss": 0.2402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27326977252960205, |
| "step": 1610, |
| "valid_targets_mean": 2993.8, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 2.1913161465400273, |
| "grad_norm": 0.6624015010390857, |
| "learning_rate": 3.472966418611944e-05, |
| "loss": 0.2552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2766575217247009, |
| "step": 1615, |
| "valid_targets_mean": 3185.8, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 2.198100407055631, |
| "grad_norm": 0.6436526455011548, |
| "learning_rate": 3.468380895375876e-05, |
| "loss": 0.2685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2507815957069397, |
| "step": 1620, |
| "valid_targets_mean": 3060.2, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 2.2048846675712346, |
| "grad_norm": 0.6752004219899516, |
| "learning_rate": 3.463778565507536e-05, |
| "loss": 0.2596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24225379526615143, |
| "step": 1625, |
| "valid_targets_mean": 2709.7, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 2.2116689280868385, |
| "grad_norm": 0.6096818559003151, |
| "learning_rate": 3.45915948168376e-05, |
| "loss": 0.2615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24749873578548431, |
| "step": 1630, |
| "valid_targets_mean": 3076.5, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 2.2184531886024423, |
| "grad_norm": 0.6382946984463229, |
| "learning_rate": 3.454523696773152e-05, |
| "loss": 0.2564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28292831778526306, |
| "step": 1635, |
| "valid_targets_mean": 3444.9, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 2.225237449118046, |
| "grad_norm": 0.7180530567460727, |
| "learning_rate": 3.4498712638354646e-05, |
| "loss": 0.2605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2660506069660187, |
| "step": 1640, |
| "valid_targets_mean": 2654.6, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 2.23202170963365, |
| "grad_norm": 0.6477313971324171, |
| "learning_rate": 3.445202236121006e-05, |
| "loss": 0.249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23461966216564178, |
| "step": 1645, |
| "valid_targets_mean": 2946.6, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 2.2388059701492535, |
| "grad_norm": 0.758634223425707, |
| "learning_rate": 3.440516667070017e-05, |
| "loss": 0.2496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2572581470012665, |
| "step": 1650, |
| "valid_targets_mean": 2419.9, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 2.2455902306648574, |
| "grad_norm": 0.7525020456973835, |
| "learning_rate": 3.435814610312068e-05, |
| "loss": 0.2547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2762409448623657, |
| "step": 1655, |
| "valid_targets_mean": 2593.2, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 2.2523744911804613, |
| "grad_norm": 0.6900366742315267, |
| "learning_rate": 3.431096119665443e-05, |
| "loss": 0.258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2573353052139282, |
| "step": 1660, |
| "valid_targets_mean": 2404.2, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 2.259158751696065, |
| "grad_norm": 0.7966484389836349, |
| "learning_rate": 3.426361249136522e-05, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2512604892253876, |
| "step": 1665, |
| "valid_targets_mean": 2740.3, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 2.265943012211669, |
| "grad_norm": 0.6267399197635503, |
| "learning_rate": 3.421610052919163e-05, |
| "loss": 0.2561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2536308467388153, |
| "step": 1670, |
| "valid_targets_mean": 2806.4, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 2.2727272727272725, |
| "grad_norm": 0.710274498225842, |
| "learning_rate": 3.4168425853940865e-05, |
| "loss": 0.2546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23908887803554535, |
| "step": 1675, |
| "valid_targets_mean": 2732.9, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 2.2795115332428764, |
| "grad_norm": 0.6223626538847287, |
| "learning_rate": 3.412058901128245e-05, |
| "loss": 0.2396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23127231001853943, |
| "step": 1680, |
| "valid_targets_mean": 2821.8, |
| "valid_targets_min": 1270 |
| }, |
| { |
| "epoch": 2.2862957937584802, |
| "grad_norm": 0.6294319468393673, |
| "learning_rate": 3.407259054874206e-05, |
| "loss": 0.2541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2410857379436493, |
| "step": 1685, |
| "valid_targets_mean": 2965.4, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.293080054274084, |
| "grad_norm": 0.8008654337703052, |
| "learning_rate": 3.402443101569521e-05, |
| "loss": 0.2499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26027989387512207, |
| "step": 1690, |
| "valid_targets_mean": 2395.8, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 2.299864314789688, |
| "grad_norm": 0.7218010335927416, |
| "learning_rate": 3.397611096336097e-05, |
| "loss": 0.2645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3087459206581116, |
| "step": 1695, |
| "valid_targets_mean": 2789.3, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 2.306648575305292, |
| "grad_norm": 0.7847076898478889, |
| "learning_rate": 3.392763094479568e-05, |
| "loss": 0.2561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26217982172966003, |
| "step": 1700, |
| "valid_targets_mean": 2132.0, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 2.3134328358208958, |
| "grad_norm": 0.7515258396714922, |
| "learning_rate": 3.387899151488659e-05, |
| "loss": 0.2671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2646181583404541, |
| "step": 1705, |
| "valid_targets_mean": 2402.3, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.320217096336499, |
| "grad_norm": 0.6310084529124328, |
| "learning_rate": 3.383019323034552e-05, |
| "loss": 0.2712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26773834228515625, |
| "step": 1710, |
| "valid_targets_mean": 3745.5, |
| "valid_targets_min": 1312 |
| }, |
| { |
| "epoch": 2.327001356852103, |
| "grad_norm": 0.6476866135246807, |
| "learning_rate": 3.378123664970252e-05, |
| "loss": 0.2547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23596899211406708, |
| "step": 1715, |
| "valid_targets_mean": 2782.4, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 2.333785617367707, |
| "grad_norm": 0.6635878932623026, |
| "learning_rate": 3.373212233329941e-05, |
| "loss": 0.268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2669086158275604, |
| "step": 1720, |
| "valid_targets_mean": 2656.4, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 2.340569877883311, |
| "grad_norm": 0.8372787858249849, |
| "learning_rate": 3.368285084328343e-05, |
| "loss": 0.2622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27093416452407837, |
| "step": 1725, |
| "valid_targets_mean": 2007.2, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 2.3473541383989147, |
| "grad_norm": 0.7084081316996159, |
| "learning_rate": 3.363342274360076e-05, |
| "loss": 0.2597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27293896675109863, |
| "step": 1730, |
| "valid_targets_mean": 2628.9, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 2.354138398914518, |
| "grad_norm": 0.7361649736055962, |
| "learning_rate": 3.358383859999011e-05, |
| "loss": 0.2715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24949458241462708, |
| "step": 1735, |
| "valid_targets_mean": 2166.1, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 2.360922659430122, |
| "grad_norm": 0.6601077278545686, |
| "learning_rate": 3.353409897997621e-05, |
| "loss": 0.2585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.252005398273468, |
| "step": 1740, |
| "valid_targets_mean": 2885.6, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 2.367706919945726, |
| "grad_norm": 0.7833459948759297, |
| "learning_rate": 3.348420445286331e-05, |
| "loss": 0.2539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25346460938453674, |
| "step": 1745, |
| "valid_targets_mean": 2880.2, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 2.37449118046133, |
| "grad_norm": 0.6917728614350838, |
| "learning_rate": 3.3434155589728695e-05, |
| "loss": 0.2581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21869820356369019, |
| "step": 1750, |
| "valid_targets_mean": 2367.4, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 2.3812754409769337, |
| "grad_norm": 0.6338539881836546, |
| "learning_rate": 3.338395296341614e-05, |
| "loss": 0.2466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2602981925010681, |
| "step": 1755, |
| "valid_targets_mean": 3345.6, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 2.388059701492537, |
| "grad_norm": 0.6645949196725213, |
| "learning_rate": 3.333359714852932e-05, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2770848870277405, |
| "step": 1760, |
| "valid_targets_mean": 2870.8, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 2.394843962008141, |
| "grad_norm": 0.6971754384837836, |
| "learning_rate": 3.328308872142528e-05, |
| "loss": 0.2549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24311913549900055, |
| "step": 1765, |
| "valid_targets_mean": 2503.1, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 2.401628222523745, |
| "grad_norm": 0.6356007444165893, |
| "learning_rate": 3.3232428260207804e-05, |
| "loss": 0.2657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26365482807159424, |
| "step": 1770, |
| "valid_targets_mean": 3150.6, |
| "valid_targets_min": 1107 |
| }, |
| { |
| "epoch": 2.4084124830393487, |
| "grad_norm": 0.7060984927170915, |
| "learning_rate": 3.318161634472083e-05, |
| "loss": 0.2592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27592113614082336, |
| "step": 1775, |
| "valid_targets_mean": 2829.7, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 2.4151967435549526, |
| "grad_norm": 0.6510612732829962, |
| "learning_rate": 3.3130653556541774e-05, |
| "loss": 0.2494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24161876738071442, |
| "step": 1780, |
| "valid_targets_mean": 3045.9, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 2.4219810040705565, |
| "grad_norm": 0.6847258251540859, |
| "learning_rate": 3.30795404789749e-05, |
| "loss": 0.264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27078160643577576, |
| "step": 1785, |
| "valid_targets_mean": 3208.2, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 2.42876526458616, |
| "grad_norm": 0.7808291039965765, |
| "learning_rate": 3.302827769704464e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25728699564933777, |
| "step": 1790, |
| "valid_targets_mean": 2815.0, |
| "valid_targets_min": 1277 |
| }, |
| { |
| "epoch": 2.435549525101764, |
| "grad_norm": 0.7272148707674393, |
| "learning_rate": 3.29768657974889e-05, |
| "loss": 0.25, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.258420467376709, |
| "step": 1795, |
| "valid_targets_mean": 2726.6, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 2.4423337856173677, |
| "grad_norm": 0.7459339825138199, |
| "learning_rate": 3.2925305368752346e-05, |
| "loss": 0.2616, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28670960664749146, |
| "step": 1800, |
| "valid_targets_mean": 2654.2, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 2.4491180461329716, |
| "grad_norm": 0.7287330807026949, |
| "learning_rate": 3.2873597000979626e-05, |
| "loss": 0.2656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25203102827072144, |
| "step": 1805, |
| "valid_targets_mean": 3238.3, |
| "valid_targets_min": 1310 |
| }, |
| { |
| "epoch": 2.4559023066485755, |
| "grad_norm": 0.7104083422326701, |
| "learning_rate": 3.28217412860087e-05, |
| "loss": 0.2553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21682174503803253, |
| "step": 1810, |
| "valid_targets_mean": 3128.4, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 2.4626865671641793, |
| "grad_norm": 0.6057916542411326, |
| "learning_rate": 3.276973881736399e-05, |
| "loss": 0.259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25353389978408813, |
| "step": 1815, |
| "valid_targets_mean": 3672.1, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 2.4694708276797828, |
| "grad_norm": 0.7923986851890575, |
| "learning_rate": 3.2717590190249617e-05, |
| "loss": 0.2632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22225558757781982, |
| "step": 1820, |
| "valid_targets_mean": 2796.2, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 2.4762550881953866, |
| "grad_norm": 0.6652659164621177, |
| "learning_rate": 3.2665296001542606e-05, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28310340642929077, |
| "step": 1825, |
| "valid_targets_mean": 3224.8, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 2.4830393487109905, |
| "grad_norm": 0.7654192310941611, |
| "learning_rate": 3.261285684978601e-05, |
| "loss": 0.2578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2906759977340698, |
| "step": 1830, |
| "valid_targets_mean": 2817.2, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 2.4898236092265944, |
| "grad_norm": 0.7118429223959195, |
| "learning_rate": 3.256027333518209e-05, |
| "loss": 0.2425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2705893814563751, |
| "step": 1835, |
| "valid_targets_mean": 2739.5, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 2.4966078697421983, |
| "grad_norm": 0.7194235047620599, |
| "learning_rate": 3.250754605958546e-05, |
| "loss": 0.2629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2895210385322571, |
| "step": 1840, |
| "valid_targets_mean": 2776.8, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 2.5033921302578017, |
| "grad_norm": 0.7159119323725041, |
| "learning_rate": 3.245467562649615e-05, |
| "loss": 0.2531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22497795522212982, |
| "step": 1845, |
| "valid_targets_mean": 2419.1, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 2.5101763907734056, |
| "grad_norm": 0.6776377638938433, |
| "learning_rate": 3.240166264105274e-05, |
| "loss": 0.257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2763141989707947, |
| "step": 1850, |
| "valid_targets_mean": 2846.4, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.5169606512890095, |
| "grad_norm": 0.6865655138064035, |
| "learning_rate": 3.234850771002542e-05, |
| "loss": 0.2594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24978536367416382, |
| "step": 1855, |
| "valid_targets_mean": 2978.5, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 2.5237449118046134, |
| "grad_norm": 0.6699601179099225, |
| "learning_rate": 3.2295211441809043e-05, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25676673650741577, |
| "step": 1860, |
| "valid_targets_mean": 2917.8, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 2.5305291723202172, |
| "grad_norm": 0.6889764980124685, |
| "learning_rate": 3.224177444641616e-05, |
| "loss": 0.2743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3100902736186981, |
| "step": 1865, |
| "valid_targets_mean": 2546.6, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 2.5373134328358207, |
| "grad_norm": 0.6793757318097332, |
| "learning_rate": 3.218819733547006e-05, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2357414960861206, |
| "step": 1870, |
| "valid_targets_mean": 2497.8, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 2.5440976933514245, |
| "grad_norm": 0.8152453145431383, |
| "learning_rate": 3.2134480722197707e-05, |
| "loss": 0.262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29958784580230713, |
| "step": 1875, |
| "valid_targets_mean": 2523.8, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 2.5508819538670284, |
| "grad_norm": 0.7495650389529989, |
| "learning_rate": 3.208062522142282e-05, |
| "loss": 0.2551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2574930191040039, |
| "step": 1880, |
| "valid_targets_mean": 2723.4, |
| "valid_targets_min": 951 |
| }, |
| { |
| "epoch": 2.5576662143826323, |
| "grad_norm": 0.7714988898913233, |
| "learning_rate": 3.202663144955875e-05, |
| "loss": 0.2504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2438960075378418, |
| "step": 1885, |
| "valid_targets_mean": 2427.2, |
| "valid_targets_min": 1263 |
| }, |
| { |
| "epoch": 2.564450474898236, |
| "grad_norm": 0.8149406397413984, |
| "learning_rate": 3.1972500024601475e-05, |
| "loss": 0.2536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2427600771188736, |
| "step": 1890, |
| "valid_targets_mean": 2379.7, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 2.5712347354138396, |
| "grad_norm": 0.835575869140074, |
| "learning_rate": 3.1918231566122467e-05, |
| "loss": 0.2634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2951461672782898, |
| "step": 1895, |
| "valid_targets_mean": 2883.2, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 2.578018995929444, |
| "grad_norm": 0.6480761129447208, |
| "learning_rate": 3.186382669526169e-05, |
| "loss": 0.2505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25713399052619934, |
| "step": 1900, |
| "valid_targets_mean": 3203.1, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 2.5848032564450474, |
| "grad_norm": 0.6296775116161838, |
| "learning_rate": 3.180928603472041e-05, |
| "loss": 0.2502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24473142623901367, |
| "step": 1905, |
| "valid_targets_mean": 3100.0, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 2.5915875169606513, |
| "grad_norm": 0.6495398797854156, |
| "learning_rate": 3.175461020875412e-05, |
| "loss": 0.2457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23860132694244385, |
| "step": 1910, |
| "valid_targets_mean": 3028.4, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 2.598371777476255, |
| "grad_norm": 0.6700738944682313, |
| "learning_rate": 3.1699799843165356e-05, |
| "loss": 0.2608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2498638927936554, |
| "step": 1915, |
| "valid_targets_mean": 2918.0, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 2.605156037991859, |
| "grad_norm": 0.6577566326274685, |
| "learning_rate": 3.164485556529657e-05, |
| "loss": 0.2655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25191181898117065, |
| "step": 1920, |
| "valid_targets_mean": 2755.8, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 2.611940298507463, |
| "grad_norm": 0.6054859630469727, |
| "learning_rate": 3.158977800402292e-05, |
| "loss": 0.2537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2440011352300644, |
| "step": 1925, |
| "valid_targets_mean": 3179.1, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 2.6187245590230663, |
| "grad_norm": 0.6786451801971204, |
| "learning_rate": 3.1534567789745084e-05, |
| "loss": 0.2631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2818109095096588, |
| "step": 1930, |
| "valid_targets_mean": 2949.1, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 2.62550881953867, |
| "grad_norm": 0.6942883497416937, |
| "learning_rate": 3.147922555438206e-05, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24890519678592682, |
| "step": 1935, |
| "valid_targets_mean": 2585.8, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 2.632293080054274, |
| "grad_norm": 0.7058789473959215, |
| "learning_rate": 3.14237519313639e-05, |
| "loss": 0.2705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2726551294326782, |
| "step": 1940, |
| "valid_targets_mean": 2646.4, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 2.639077340569878, |
| "grad_norm": 0.6700353317554494, |
| "learning_rate": 3.1368147555624486e-05, |
| "loss": 0.2599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2708538770675659, |
| "step": 1945, |
| "valid_targets_mean": 3069.9, |
| "valid_targets_min": 1199 |
| }, |
| { |
| "epoch": 2.645861601085482, |
| "grad_norm": 0.7323325511038016, |
| "learning_rate": 3.131241306359426e-05, |
| "loss": 0.2517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2605024576187134, |
| "step": 1950, |
| "valid_targets_mean": 2873.1, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 2.6526458616010853, |
| "grad_norm": 0.6879553895964564, |
| "learning_rate": 3.125654909319294e-05, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2747609615325928, |
| "step": 1955, |
| "valid_targets_mean": 3061.4, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 2.659430122116689, |
| "grad_norm": 0.6920353888734679, |
| "learning_rate": 3.120055628382218e-05, |
| "loss": 0.2556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23946809768676758, |
| "step": 1960, |
| "valid_targets_mean": 2961.5, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 2.666214382632293, |
| "grad_norm": 0.6453205678625881, |
| "learning_rate": 3.1144435276358325e-05, |
| "loss": 0.2582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27227306365966797, |
| "step": 1965, |
| "valid_targets_mean": 3088.8, |
| "valid_targets_min": 1145 |
| }, |
| { |
| "epoch": 2.672998643147897, |
| "grad_norm": 0.6921138419734034, |
| "learning_rate": 3.1088186713145024e-05, |
| "loss": 0.2586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25944316387176514, |
| "step": 1970, |
| "valid_targets_mean": 2601.7, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 2.679782903663501, |
| "grad_norm": 0.6778135167815581, |
| "learning_rate": 3.103181123798587e-05, |
| "loss": 0.2501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24725311994552612, |
| "step": 1975, |
| "valid_targets_mean": 2674.5, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 2.6865671641791042, |
| "grad_norm": 0.7351183532910395, |
| "learning_rate": 3.0975309496137066e-05, |
| "loss": 0.2567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25560200214385986, |
| "step": 1980, |
| "valid_targets_mean": 2353.3, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 2.693351424694708, |
| "grad_norm": 0.6182324179687427, |
| "learning_rate": 3.091868213430004e-05, |
| "loss": 0.2587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22743821144104004, |
| "step": 1985, |
| "valid_targets_mean": 2698.8, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 2.700135685210312, |
| "grad_norm": 0.7363935013486361, |
| "learning_rate": 3.086192980061399e-05, |
| "loss": 0.2633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27139535546302795, |
| "step": 1990, |
| "valid_targets_mean": 2369.6, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 2.706919945725916, |
| "grad_norm": 0.6440601737571228, |
| "learning_rate": 3.080505314464854e-05, |
| "loss": 0.247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23245973885059357, |
| "step": 1995, |
| "valid_targets_mean": 2775.4, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 2.7137042062415198, |
| "grad_norm": 0.6702282934429393, |
| "learning_rate": 3.0748052817396254e-05, |
| "loss": 0.2568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2478809952735901, |
| "step": 2000, |
| "valid_targets_mean": 2646.8, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 2.7204884667571236, |
| "grad_norm": 0.6800473944399235, |
| "learning_rate": 3.0690929471265185e-05, |
| "loss": 0.2654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24637192487716675, |
| "step": 2005, |
| "valid_targets_mean": 2696.4, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 2.7272727272727275, |
| "grad_norm": 0.6303354724046744, |
| "learning_rate": 3.063368376007145e-05, |
| "loss": 0.2606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26109838485717773, |
| "step": 2010, |
| "valid_targets_mean": 3292.2, |
| "valid_targets_min": 1629 |
| }, |
| { |
| "epoch": 2.734056987788331, |
| "grad_norm": 0.6765904914853859, |
| "learning_rate": 3.057631633903167e-05, |
| "loss": 0.2505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24430710077285767, |
| "step": 2015, |
| "valid_targets_mean": 2731.6, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 2.740841248303935, |
| "grad_norm": 0.6432972439515613, |
| "learning_rate": 3.05188278647556e-05, |
| "loss": 0.2501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23854488134384155, |
| "step": 2020, |
| "valid_targets_mean": 2842.9, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 2.7476255088195387, |
| "grad_norm": 0.6577825459454796, |
| "learning_rate": 3.0461218995238453e-05, |
| "loss": 0.2594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.254770427942276, |
| "step": 2025, |
| "valid_targets_mean": 2721.9, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 2.7544097693351426, |
| "grad_norm": 0.6949351773395782, |
| "learning_rate": 3.0403490389853484e-05, |
| "loss": 0.2488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23568594455718994, |
| "step": 2030, |
| "valid_targets_mean": 2796.5, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 2.7611940298507465, |
| "grad_norm": 0.7323091372332017, |
| "learning_rate": 3.034564270934442e-05, |
| "loss": 0.2481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26838138699531555, |
| "step": 2035, |
| "valid_targets_mean": 2450.1, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.76797829036635, |
| "grad_norm": 0.7072050298374907, |
| "learning_rate": 3.0287676615817854e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2603970468044281, |
| "step": 2040, |
| "valid_targets_mean": 2724.6, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 2.774762550881954, |
| "grad_norm": 0.7013954312412192, |
| "learning_rate": 3.0229592772735717e-05, |
| "loss": 0.2375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2462655007839203, |
| "step": 2045, |
| "valid_targets_mean": 2669.0, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 2.7815468113975577, |
| "grad_norm": 0.7194087010991239, |
| "learning_rate": 3.0171391844907663e-05, |
| "loss": 0.2455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22803866863250732, |
| "step": 2050, |
| "valid_targets_mean": 2516.1, |
| "valid_targets_min": 1199 |
| }, |
| { |
| "epoch": 2.7883310719131615, |
| "grad_norm": 0.6532424708668592, |
| "learning_rate": 3.011307449848345e-05, |
| "loss": 0.2669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25693702697753906, |
| "step": 2055, |
| "valid_targets_mean": 2905.6, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 2.7951153324287654, |
| "grad_norm": 0.6019841138198014, |
| "learning_rate": 3.0054641400945354e-05, |
| "loss": 0.2691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2629098892211914, |
| "step": 2060, |
| "valid_targets_mean": 3336.9, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 2.801899592944369, |
| "grad_norm": 0.590938009064258, |
| "learning_rate": 2.9996093221100468e-05, |
| "loss": 0.2546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24467141926288605, |
| "step": 2065, |
| "valid_targets_mean": 3226.9, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 2.8086838534599727, |
| "grad_norm": 0.6853913375855859, |
| "learning_rate": 2.993743062907311e-05, |
| "loss": 0.2773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3042706549167633, |
| "step": 2070, |
| "valid_targets_mean": 3042.9, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 2.8154681139755766, |
| "grad_norm": 0.6566966730503214, |
| "learning_rate": 2.9878654296297112e-05, |
| "loss": 0.259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26403605937957764, |
| "step": 2075, |
| "valid_targets_mean": 3035.4, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 2.8222523744911805, |
| "grad_norm": 0.7543020252020352, |
| "learning_rate": 2.981976489550814e-05, |
| "loss": 0.2571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24550700187683105, |
| "step": 2080, |
| "valid_targets_mean": 2845.9, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 2.8290366350067844, |
| "grad_norm": 0.7093980696165589, |
| "learning_rate": 2.9760763100736016e-05, |
| "loss": 0.2486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2348649501800537, |
| "step": 2085, |
| "valid_targets_mean": 2346.6, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 2.835820895522388, |
| "grad_norm": 0.6549172444022449, |
| "learning_rate": 2.970164958729698e-05, |
| "loss": 0.2377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21750161051750183, |
| "step": 2090, |
| "valid_targets_mean": 2408.1, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 2.842605156037992, |
| "grad_norm": 0.8065514310435659, |
| "learning_rate": 2.964242503178597e-05, |
| "loss": 0.2622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26003286242485046, |
| "step": 2095, |
| "valid_targets_mean": 1907.9, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 2.8493894165535956, |
| "grad_norm": 0.578124344699749, |
| "learning_rate": 2.958309011206888e-05, |
| "loss": 0.2461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2605810761451721, |
| "step": 2100, |
| "valid_targets_mean": 3794.0, |
| "valid_targets_min": 1360 |
| }, |
| { |
| "epoch": 2.8561736770691994, |
| "grad_norm": 0.6706934642907637, |
| "learning_rate": 2.9523645507274798e-05, |
| "loss": 0.2416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2569592297077179, |
| "step": 2105, |
| "valid_targets_mean": 2656.1, |
| "valid_targets_min": 1266 |
| }, |
| { |
| "epoch": 2.8629579375848033, |
| "grad_norm": 0.7102884408604969, |
| "learning_rate": 2.9464091897788232e-05, |
| "loss": 0.2548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27441930770874023, |
| "step": 2110, |
| "valid_targets_mean": 2542.4, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 2.869742198100407, |
| "grad_norm": 0.6396640888363082, |
| "learning_rate": 2.940442996524132e-05, |
| "loss": 0.2529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28722479939460754, |
| "step": 2115, |
| "valid_targets_mean": 3116.9, |
| "valid_targets_min": 1036 |
| }, |
| { |
| "epoch": 2.876526458616011, |
| "grad_norm": 0.8432323434605307, |
| "learning_rate": 2.9344660392506043e-05, |
| "loss": 0.2592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28614795207977295, |
| "step": 2120, |
| "valid_targets_mean": 3104.6, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 2.8833107191316145, |
| "grad_norm": 0.6395419218584879, |
| "learning_rate": 2.9284783863686382e-05, |
| "loss": 0.2581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2634587287902832, |
| "step": 2125, |
| "valid_targets_mean": 3117.6, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 2.8900949796472184, |
| "grad_norm": 0.5718851345375481, |
| "learning_rate": 2.922480106411053e-05, |
| "loss": 0.2697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2612381875514984, |
| "step": 2130, |
| "valid_targets_mean": 3635.0, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 2.8968792401628223, |
| "grad_norm": 0.6528582956501181, |
| "learning_rate": 2.9164712680322984e-05, |
| "loss": 0.2462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2157207727432251, |
| "step": 2135, |
| "valid_targets_mean": 2491.8, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 2.903663500678426, |
| "grad_norm": 0.8098720111841451, |
| "learning_rate": 2.9104519400076766e-05, |
| "loss": 0.264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25750282406806946, |
| "step": 2140, |
| "valid_targets_mean": 2004.3, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 2.91044776119403, |
| "grad_norm": 0.6201356506537019, |
| "learning_rate": 2.9044221912325486e-05, |
| "loss": 0.2483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2485671043395996, |
| "step": 2145, |
| "valid_targets_mean": 3226.1, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 2.9172320217096335, |
| "grad_norm": 0.6786949165909485, |
| "learning_rate": 2.8983820907215475e-05, |
| "loss": 0.2546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21794003248214722, |
| "step": 2150, |
| "valid_targets_mean": 2685.1, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 2.9240162822252374, |
| "grad_norm": 0.6196782492846893, |
| "learning_rate": 2.8923317076077915e-05, |
| "loss": 0.2589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.259111225605011, |
| "step": 2155, |
| "valid_targets_mean": 3168.1, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 2.9308005427408412, |
| "grad_norm": 0.6506882542165565, |
| "learning_rate": 2.8862711111420893e-05, |
| "loss": 0.2461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25076574087142944, |
| "step": 2160, |
| "valid_targets_mean": 3034.2, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 2.937584803256445, |
| "grad_norm": 0.6853337250211714, |
| "learning_rate": 2.8802003706921468e-05, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2712341547012329, |
| "step": 2165, |
| "valid_targets_mean": 2867.3, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 2.944369063772049, |
| "grad_norm": 0.7641884011034288, |
| "learning_rate": 2.8741195557417775e-05, |
| "loss": 0.2627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2769216001033783, |
| "step": 2170, |
| "valid_targets_mean": 2302.2, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 2.9511533242876524, |
| "grad_norm": 0.6826360549379976, |
| "learning_rate": 2.8680287358901028e-05, |
| "loss": 0.2553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24993981420993805, |
| "step": 2175, |
| "valid_targets_mean": 2850.9, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 2.9579375848032563, |
| "grad_norm": 0.7221044998473106, |
| "learning_rate": 2.861927980850757e-05, |
| "loss": 0.2556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25909918546676636, |
| "step": 2180, |
| "valid_targets_mean": 2386.6, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 2.96472184531886, |
| "grad_norm": 0.7377714080476292, |
| "learning_rate": 2.8558173604510907e-05, |
| "loss": 0.2368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22513189911842346, |
| "step": 2185, |
| "valid_targets_mean": 2357.4, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 2.971506105834464, |
| "grad_norm": 0.5623921608095559, |
| "learning_rate": 2.849696944631369e-05, |
| "loss": 0.2559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26851212978363037, |
| "step": 2190, |
| "valid_targets_mean": 4109.2, |
| "valid_targets_min": 1134 |
| }, |
| { |
| "epoch": 2.978290366350068, |
| "grad_norm": 0.6103524586471685, |
| "learning_rate": 2.8435668034439738e-05, |
| "loss": 0.2564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2774103879928589, |
| "step": 2195, |
| "valid_targets_mean": 3372.1, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 2.9850746268656714, |
| "grad_norm": 0.6165970882379855, |
| "learning_rate": 2.8374270070525988e-05, |
| "loss": 0.2509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23035350441932678, |
| "step": 2200, |
| "valid_targets_mean": 3327.9, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 2.9918588873812757, |
| "grad_norm": 0.7660874337227206, |
| "learning_rate": 2.8312776257314497e-05, |
| "loss": 0.2542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2771637737751007, |
| "step": 2205, |
| "valid_targets_mean": 2188.8, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 2.998643147896879, |
| "grad_norm": 0.678819967572549, |
| "learning_rate": 2.8251187298644372e-05, |
| "loss": 0.2513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25125089287757874, |
| "step": 2210, |
| "valid_targets_mean": 2593.7, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 3.005427408412483, |
| "grad_norm": 0.6195799648166698, |
| "learning_rate": 2.818950389944374e-05, |
| "loss": 0.2267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21490924060344696, |
| "step": 2215, |
| "valid_targets_mean": 3076.2, |
| "valid_targets_min": 1375 |
| }, |
| { |
| "epoch": 3.012211668928087, |
| "grad_norm": 0.741799685467653, |
| "learning_rate": 2.812772676572165e-05, |
| "loss": 0.2295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2147355079650879, |
| "step": 2220, |
| "valid_targets_mean": 2800.7, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 3.0189959294436908, |
| "grad_norm": 0.6481778989984706, |
| "learning_rate": 2.806585660456001e-05, |
| "loss": 0.2233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21204230189323425, |
| "step": 2225, |
| "valid_targets_mean": 3253.1, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 3.0257801899592947, |
| "grad_norm": 0.7528798552940739, |
| "learning_rate": 2.8003894124105494e-05, |
| "loss": 0.2308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24220474064350128, |
| "step": 2230, |
| "valid_targets_mean": 2921.9, |
| "valid_targets_min": 1386 |
| }, |
| { |
| "epoch": 3.032564450474898, |
| "grad_norm": 0.7539503673228278, |
| "learning_rate": 2.794184003356144e-05, |
| "loss": 0.2344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2737279236316681, |
| "step": 2235, |
| "valid_targets_mean": 2459.6, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 3.039348710990502, |
| "grad_norm": 0.6860093065024846, |
| "learning_rate": 2.787969504317972e-05, |
| "loss": 0.2326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23056598007678986, |
| "step": 2240, |
| "valid_targets_mean": 3120.1, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 3.046132971506106, |
| "grad_norm": 0.6742437476536095, |
| "learning_rate": 2.7817459864252606e-05, |
| "loss": 0.2293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2076399177312851, |
| "step": 2245, |
| "valid_targets_mean": 2751.0, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 3.0529172320217097, |
| "grad_norm": 0.6601870684447021, |
| "learning_rate": 2.7755135209104673e-05, |
| "loss": 0.2115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21040399372577667, |
| "step": 2250, |
| "valid_targets_mean": 2970.5, |
| "valid_targets_min": 1266 |
| }, |
| { |
| "epoch": 3.0597014925373136, |
| "grad_norm": 0.7655435099255181, |
| "learning_rate": 2.769272179108458e-05, |
| "loss": 0.2252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24985858798027039, |
| "step": 2255, |
| "valid_targets_mean": 3437.8, |
| "valid_targets_min": 1114 |
| }, |
| { |
| "epoch": 3.066485753052917, |
| "grad_norm": 0.7149714320640186, |
| "learning_rate": 2.7630220324556947e-05, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21348509192466736, |
| "step": 2260, |
| "valid_targets_mean": 2941.0, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 3.073270013568521, |
| "grad_norm": 0.7792687892843089, |
| "learning_rate": 2.756763152489418e-05, |
| "loss": 0.2094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20965218544006348, |
| "step": 2265, |
| "valid_targets_mean": 1918.6, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 3.080054274084125, |
| "grad_norm": 0.6597990538607253, |
| "learning_rate": 2.7504956108468262e-05, |
| "loss": 0.2239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24037772417068481, |
| "step": 2270, |
| "valid_targets_mean": 3295.2, |
| "valid_targets_min": 1204 |
| }, |
| { |
| "epoch": 3.0868385345997287, |
| "grad_norm": 0.7852404129824124, |
| "learning_rate": 2.7442194792642576e-05, |
| "loss": 0.228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26370474696159363, |
| "step": 2275, |
| "valid_targets_mean": 2461.3, |
| "valid_targets_min": 1207 |
| }, |
| { |
| "epoch": 3.0936227951153326, |
| "grad_norm": 0.6324909016089244, |
| "learning_rate": 2.737934829576367e-05, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19589462876319885, |
| "step": 2280, |
| "valid_targets_mean": 2882.0, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 3.1004070556309364, |
| "grad_norm": 0.7132616114200901, |
| "learning_rate": 2.7316417337153053e-05, |
| "loss": 0.2263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21955709159374237, |
| "step": 2285, |
| "valid_targets_mean": 2424.4, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 3.10719131614654, |
| "grad_norm": 0.6627034885187564, |
| "learning_rate": 2.7253402637098963e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2161223590373993, |
| "step": 2290, |
| "valid_targets_mean": 2994.9, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 3.1139755766621438, |
| "grad_norm": 0.7133154934701709, |
| "learning_rate": 2.7190304916848114e-05, |
| "loss": 0.2225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22376814484596252, |
| "step": 2295, |
| "valid_targets_mean": 2787.6, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 3.1207598371777476, |
| "grad_norm": 0.7291074383267475, |
| "learning_rate": 2.712712489859743e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23834912478923798, |
| "step": 2300, |
| "valid_targets_mean": 2901.0, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 3.1275440976933515, |
| "grad_norm": 0.7568349432173351, |
| "learning_rate": 2.706386330548581e-05, |
| "loss": 0.2084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19825339317321777, |
| "step": 2305, |
| "valid_targets_mean": 2677.8, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 3.1343283582089554, |
| "grad_norm": 0.7241979030877912, |
| "learning_rate": 2.7000520861585825e-05, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22395247220993042, |
| "step": 2310, |
| "valid_targets_mean": 2555.9, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 3.141112618724559, |
| "grad_norm": 0.7176875343032588, |
| "learning_rate": 2.693709829189544e-05, |
| "loss": 0.2191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21689847111701965, |
| "step": 2315, |
| "valid_targets_mean": 2447.6, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 3.1478968792401627, |
| "grad_norm": 0.8624810704747251, |
| "learning_rate": 2.6873596322329717e-05, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2509344816207886, |
| "step": 2320, |
| "valid_targets_mean": 1913.9, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 3.1546811397557666, |
| "grad_norm": 0.6434418388849583, |
| "learning_rate": 2.6810015679712505e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22354134917259216, |
| "step": 2325, |
| "valid_targets_mean": 3262.2, |
| "valid_targets_min": 1113 |
| }, |
| { |
| "epoch": 3.1614654002713705, |
| "grad_norm": 0.7907645012767848, |
| "learning_rate": 2.6746357091768116e-05, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22720026969909668, |
| "step": 2330, |
| "valid_targets_mean": 2312.9, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 3.1682496607869743, |
| "grad_norm": 0.7095701119398697, |
| "learning_rate": 2.6682621287113e-05, |
| "loss": 0.2241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23232200741767883, |
| "step": 2335, |
| "valid_targets_mean": 2940.6, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 3.175033921302578, |
| "grad_norm": 0.6882795435130347, |
| "learning_rate": 2.6618808995247408e-05, |
| "loss": 0.2196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22832772135734558, |
| "step": 2340, |
| "valid_targets_mean": 2938.8, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 3.1818181818181817, |
| "grad_norm": 0.6135099997369059, |
| "learning_rate": 2.6554920946547044e-05, |
| "loss": 0.2113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23073089122772217, |
| "step": 2345, |
| "valid_targets_mean": 3286.8, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 3.1886024423337855, |
| "grad_norm": 0.9423077941270365, |
| "learning_rate": 2.649095787225469e-05, |
| "loss": 0.2231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2254088819026947, |
| "step": 2350, |
| "valid_targets_mean": 2568.0, |
| "valid_targets_min": 1236 |
| }, |
| { |
| "epoch": 3.1953867028493894, |
| "grad_norm": 0.810975408154495, |
| "learning_rate": 2.6426920504471865e-05, |
| "loss": 0.225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21835219860076904, |
| "step": 2355, |
| "valid_targets_mean": 2296.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 3.2021709633649933, |
| "grad_norm": 0.672655439805317, |
| "learning_rate": 2.636280957615041e-05, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22122296690940857, |
| "step": 2360, |
| "valid_targets_mean": 2792.6, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 3.208955223880597, |
| "grad_norm": 0.7434847650835706, |
| "learning_rate": 2.6298625821084128e-05, |
| "loss": 0.2201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21797284483909607, |
| "step": 2365, |
| "valid_targets_mean": 2498.4, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 3.2157394843962006, |
| "grad_norm": 0.6570222965023365, |
| "learning_rate": 2.6234369973900372e-05, |
| "loss": 0.2208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2033863663673401, |
| "step": 2370, |
| "valid_targets_mean": 2630.6, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 3.2225237449118045, |
| "grad_norm": 0.8657617678949259, |
| "learning_rate": 2.6170042770051635e-05, |
| "loss": 0.228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.225327730178833, |
| "step": 2375, |
| "valid_targets_mean": 1854.9, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 3.2293080054274084, |
| "grad_norm": 0.7046910890483484, |
| "learning_rate": 2.610564494580714e-05, |
| "loss": 0.2241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22602598369121552, |
| "step": 2380, |
| "valid_targets_mean": 2542.6, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 3.2360922659430122, |
| "grad_norm": 0.6740596140779037, |
| "learning_rate": 2.604117723824441e-05, |
| "loss": 0.2288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23400309681892395, |
| "step": 2385, |
| "valid_targets_mean": 3017.3, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 3.242876526458616, |
| "grad_norm": 0.7404070619144895, |
| "learning_rate": 2.597664038524083e-05, |
| "loss": 0.2283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2237531542778015, |
| "step": 2390, |
| "valid_targets_mean": 2550.8, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 3.24966078697422, |
| "grad_norm": 0.6731318456534926, |
| "learning_rate": 2.5912035125465208e-05, |
| "loss": 0.2131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2236143946647644, |
| "step": 2395, |
| "valid_targets_mean": 2946.1, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 3.2564450474898234, |
| "grad_norm": 0.7464562402100164, |
| "learning_rate": 2.5847362198369297e-05, |
| "loss": 0.2262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2542741298675537, |
| "step": 2400, |
| "valid_targets_mean": 2603.9, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 3.2632293080054273, |
| "grad_norm": 0.7388159380991954, |
| "learning_rate": 2.578262234417937e-05, |
| "loss": 0.2202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21536928415298462, |
| "step": 2405, |
| "valid_targets_mean": 2555.2, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 3.270013568521031, |
| "grad_norm": 0.7355746785542672, |
| "learning_rate": 2.5717816303887703e-05, |
| "loss": 0.2224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21950095891952515, |
| "step": 2410, |
| "valid_targets_mean": 2990.9, |
| "valid_targets_min": 996 |
| }, |
| { |
| "epoch": 3.276797829036635, |
| "grad_norm": 0.7517171398028017, |
| "learning_rate": 2.565294481924415e-05, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20042955875396729, |
| "step": 2415, |
| "valid_targets_mean": 2606.8, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 3.283582089552239, |
| "grad_norm": 0.7068185853149664, |
| "learning_rate": 2.5588008632747593e-05, |
| "loss": 0.2311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22197219729423523, |
| "step": 2420, |
| "valid_targets_mean": 3084.1, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 3.290366350067843, |
| "grad_norm": 0.7279583182044714, |
| "learning_rate": 2.5523008487637482e-05, |
| "loss": 0.2259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2149057388305664, |
| "step": 2425, |
| "valid_targets_mean": 2391.9, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 3.2971506105834463, |
| "grad_norm": 0.6422722168754591, |
| "learning_rate": 2.5457945127885318e-05, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24687312543392181, |
| "step": 2430, |
| "valid_targets_mean": 3709.7, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 3.30393487109905, |
| "grad_norm": 0.6945878436621437, |
| "learning_rate": 2.539281929818614e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2088148444890976, |
| "step": 2435, |
| "valid_targets_mean": 2683.1, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 3.310719131614654, |
| "grad_norm": 0.8469589878253486, |
| "learning_rate": 2.5327631743949982e-05, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22623956203460693, |
| "step": 2440, |
| "valid_targets_mean": 2050.2, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 3.317503392130258, |
| "grad_norm": 0.7039682068648079, |
| "learning_rate": 2.5262383211293386e-05, |
| "loss": 0.2256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22464679181575775, |
| "step": 2445, |
| "valid_targets_mean": 3066.5, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 3.324287652645862, |
| "grad_norm": 0.6549956329113884, |
| "learning_rate": 2.51970744470308e-05, |
| "loss": 0.2345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25542882084846497, |
| "step": 2450, |
| "valid_targets_mean": 3588.2, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 3.3310719131614652, |
| "grad_norm": 0.6922641541400616, |
| "learning_rate": 2.5131706198666104e-05, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21417692303657532, |
| "step": 2455, |
| "valid_targets_mean": 2714.5, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 3.337856173677069, |
| "grad_norm": 0.6313775940838555, |
| "learning_rate": 2.506627921438397e-05, |
| "loss": 0.2214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20802749693393707, |
| "step": 2460, |
| "valid_targets_mean": 3045.8, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 3.344640434192673, |
| "grad_norm": 0.6419716617358177, |
| "learning_rate": 2.5000794243041386e-05, |
| "loss": 0.2146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20835299789905548, |
| "step": 2465, |
| "valid_targets_mean": 2813.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 3.351424694708277, |
| "grad_norm": 0.6155938516766296, |
| "learning_rate": 2.4935252034159016e-05, |
| "loss": 0.2169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23357100784778595, |
| "step": 2470, |
| "valid_targets_mean": 3461.4, |
| "valid_targets_min": 1589 |
| }, |
| { |
| "epoch": 3.3582089552238807, |
| "grad_norm": 0.6931971140884506, |
| "learning_rate": 2.4869653337912652e-05, |
| "loss": 0.2246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23858122527599335, |
| "step": 2475, |
| "valid_targets_mean": 3166.2, |
| "valid_targets_min": 1026 |
| }, |
| { |
| "epoch": 3.364993215739484, |
| "grad_norm": 0.7398849431239813, |
| "learning_rate": 2.480399890512462e-05, |
| "loss": 0.2195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24428343772888184, |
| "step": 2480, |
| "valid_targets_mean": 2540.5, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 3.371777476255088, |
| "grad_norm": 0.7128166603516436, |
| "learning_rate": 2.4738289487255198e-05, |
| "loss": 0.2252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22879432141780853, |
| "step": 2485, |
| "valid_targets_mean": 2861.1, |
| "valid_targets_min": 1266 |
| }, |
| { |
| "epoch": 3.378561736770692, |
| "grad_norm": 0.7552252749221059, |
| "learning_rate": 2.4672525836394003e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22698278725147247, |
| "step": 2490, |
| "valid_targets_mean": 2579.4, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 3.385345997286296, |
| "grad_norm": 0.8012197815964346, |
| "learning_rate": 2.4606708705251383e-05, |
| "loss": 0.2134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23777778446674347, |
| "step": 2495, |
| "valid_targets_mean": 2214.4, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 3.3921302578018997, |
| "grad_norm": 0.7100109651223878, |
| "learning_rate": 2.4540838847149805e-05, |
| "loss": 0.2169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2334587723016739, |
| "step": 2500, |
| "valid_targets_mean": 2754.7, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 3.3989145183175036, |
| "grad_norm": 0.7594298936519028, |
| "learning_rate": 2.4474917016015233e-05, |
| "loss": 0.2259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21707573533058167, |
| "step": 2505, |
| "valid_targets_mean": 2143.0, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 3.405698778833107, |
| "grad_norm": 0.6554539535978531, |
| "learning_rate": 2.4408943966368502e-05, |
| "loss": 0.232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22429423034191132, |
| "step": 2510, |
| "valid_targets_mean": 3002.5, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 3.412483039348711, |
| "grad_norm": 0.5678144037578754, |
| "learning_rate": 2.4342920453316677e-05, |
| "loss": 0.2226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21168120205402374, |
| "step": 2515, |
| "valid_targets_mean": 4258.6, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 3.4192672998643148, |
| "grad_norm": 1.1608859512029313, |
| "learning_rate": 2.42768472325444e-05, |
| "loss": 0.2278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2512350082397461, |
| "step": 2520, |
| "valid_targets_mean": 2730.8, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 3.4260515603799186, |
| "grad_norm": 0.6794646407442558, |
| "learning_rate": 2.4210725060305277e-05, |
| "loss": 0.2264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23531343042850494, |
| "step": 2525, |
| "valid_targets_mean": 3514.7, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 3.4328358208955225, |
| "grad_norm": 0.6399640137952785, |
| "learning_rate": 2.4144554693413165e-05, |
| "loss": 0.2266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22536537051200867, |
| "step": 2530, |
| "valid_targets_mean": 3192.2, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 3.4396200814111264, |
| "grad_norm": 0.6662119295193443, |
| "learning_rate": 2.407833688923357e-05, |
| "loss": 0.2236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22147254645824432, |
| "step": 2535, |
| "valid_targets_mean": 2992.2, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 3.44640434192673, |
| "grad_norm": 0.6891237720043712, |
| "learning_rate": 2.401207240567493e-05, |
| "loss": 0.2241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20989638566970825, |
| "step": 2540, |
| "valid_targets_mean": 2869.4, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 3.4531886024423337, |
| "grad_norm": 0.5733593611937268, |
| "learning_rate": 2.3945762001179988e-05, |
| "loss": 0.2258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20587453246116638, |
| "step": 2545, |
| "valid_targets_mean": 3843.9, |
| "valid_targets_min": 1250 |
| }, |
| { |
| "epoch": 3.4599728629579376, |
| "grad_norm": 0.7227077896335035, |
| "learning_rate": 2.3879406434717048e-05, |
| "loss": 0.2404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2688782811164856, |
| "step": 2550, |
| "valid_targets_mean": 3092.1, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 3.4667571234735415, |
| "grad_norm": 0.729804276811994, |
| "learning_rate": 2.381300646577135e-05, |
| "loss": 0.223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2293173372745514, |
| "step": 2555, |
| "valid_targets_mean": 2722.3, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 3.4735413839891454, |
| "grad_norm": 0.7089336749170233, |
| "learning_rate": 2.3746562854336347e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24235443770885468, |
| "step": 2560, |
| "valid_targets_mean": 2771.2, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 3.480325644504749, |
| "grad_norm": 0.7144987230267648, |
| "learning_rate": 2.3680076360904996e-05, |
| "loss": 0.2172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22750988602638245, |
| "step": 2565, |
| "valid_targets_mean": 2600.1, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 3.4871099050203527, |
| "grad_norm": 0.6752212573282049, |
| "learning_rate": 2.3613547746461082e-05, |
| "loss": 0.2304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24150076508522034, |
| "step": 2570, |
| "valid_targets_mean": 3270.1, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 3.4938941655359566, |
| "grad_norm": 0.7590308205931211, |
| "learning_rate": 2.3546977772470494e-05, |
| "loss": 0.2309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22371584177017212, |
| "step": 2575, |
| "valid_targets_mean": 2490.2, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 3.5006784260515604, |
| "grad_norm": 0.7870240421440323, |
| "learning_rate": 2.3480367200872504e-05, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23015907406806946, |
| "step": 2580, |
| "valid_targets_mean": 2033.2, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 3.5074626865671643, |
| "grad_norm": 0.923419749026049, |
| "learning_rate": 2.341371679407106e-05, |
| "loss": 0.2171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.207190603017807, |
| "step": 2585, |
| "valid_targets_mean": 2550.9, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 3.5142469470827677, |
| "grad_norm": 0.7046771506431182, |
| "learning_rate": 2.3347027314926032e-05, |
| "loss": 0.2174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22681497037410736, |
| "step": 2590, |
| "valid_targets_mean": 2633.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 3.5210312075983716, |
| "grad_norm": 0.6097178720133104, |
| "learning_rate": 2.328029952674452e-05, |
| "loss": 0.2303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21856877207756042, |
| "step": 2595, |
| "valid_targets_mean": 4060.4, |
| "valid_targets_min": 1722 |
| }, |
| { |
| "epoch": 3.5278154681139755, |
| "grad_norm": 0.7646075625057801, |
| "learning_rate": 2.321353419327209e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2248585820198059, |
| "step": 2600, |
| "valid_targets_mean": 2429.2, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 3.5345997286295794, |
| "grad_norm": 0.6929279550589781, |
| "learning_rate": 2.314673207868404e-05, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24431878328323364, |
| "step": 2605, |
| "valid_targets_mean": 2962.9, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 3.5413839891451833, |
| "grad_norm": 0.6480909726367313, |
| "learning_rate": 2.307989394757665e-05, |
| "loss": 0.2141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22717615962028503, |
| "step": 2610, |
| "valid_targets_mean": 3731.4, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 3.5481682496607867, |
| "grad_norm": 0.7186879086898086, |
| "learning_rate": 2.301302056495845e-05, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2136261910200119, |
| "step": 2615, |
| "valid_targets_mean": 2418.2, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 3.554952510176391, |
| "grad_norm": 0.806809670872252, |
| "learning_rate": 2.2946112696241414e-05, |
| "loss": 0.2191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22997555136680603, |
| "step": 2620, |
| "valid_targets_mean": 2120.0, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 3.5617367706919945, |
| "grad_norm": 0.6741591468113703, |
| "learning_rate": 2.2879171107232274e-05, |
| "loss": 0.2183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2275179922580719, |
| "step": 2625, |
| "valid_targets_mean": 3001.9, |
| "valid_targets_min": 1175 |
| }, |
| { |
| "epoch": 3.5685210312075983, |
| "grad_norm": 0.7318902025413816, |
| "learning_rate": 2.2812196564123683e-05, |
| "loss": 0.2223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21598154306411743, |
| "step": 2630, |
| "valid_targets_mean": 2405.4, |
| "valid_targets_min": 986 |
| }, |
| { |
| "epoch": 3.575305291723202, |
| "grad_norm": 0.7506970585357591, |
| "learning_rate": 2.274518983348549e-05, |
| "loss": 0.2304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24321120977401733, |
| "step": 2635, |
| "valid_targets_mean": 2461.9, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 3.582089552238806, |
| "grad_norm": 0.6629205823156629, |
| "learning_rate": 2.267815168225596e-05, |
| "loss": 0.2188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2191721647977829, |
| "step": 2640, |
| "valid_targets_mean": 2622.9, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 3.58887381275441, |
| "grad_norm": 0.7533189468195941, |
| "learning_rate": 2.2611082877732954e-05, |
| "loss": 0.2254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24864350259304047, |
| "step": 2645, |
| "valid_targets_mean": 2555.6, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 3.5956580732700134, |
| "grad_norm": 0.6177690316825468, |
| "learning_rate": 2.2543984187565227e-05, |
| "loss": 0.2271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23729315400123596, |
| "step": 2650, |
| "valid_targets_mean": 3457.9, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 3.6024423337856173, |
| "grad_norm": 0.7158165102846912, |
| "learning_rate": 2.2476856379743567e-05, |
| "loss": 0.2329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23067063093185425, |
| "step": 2655, |
| "valid_targets_mean": 2960.2, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 3.609226594301221, |
| "grad_norm": 0.7707372511866211, |
| "learning_rate": 2.2409700222592042e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22069093585014343, |
| "step": 2660, |
| "valid_targets_mean": 2546.6, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 3.616010854816825, |
| "grad_norm": 0.6052180371912904, |
| "learning_rate": 2.23425164847592e-05, |
| "loss": 0.2268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21380861103534698, |
| "step": 2665, |
| "valid_targets_mean": 3455.1, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 3.622795115332429, |
| "grad_norm": 0.7047656744984836, |
| "learning_rate": 2.227530593520926e-05, |
| "loss": 0.2322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24715712666511536, |
| "step": 2670, |
| "valid_targets_mean": 3540.6, |
| "valid_targets_min": 1327 |
| }, |
| { |
| "epoch": 3.6295793758480324, |
| "grad_norm": 0.6745230951755198, |
| "learning_rate": 2.2208069343213326e-05, |
| "loss": 0.2226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23651158809661865, |
| "step": 2675, |
| "valid_targets_mean": 3037.1, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 3.6363636363636362, |
| "grad_norm": 0.623368182400207, |
| "learning_rate": 2.2140807478340582e-05, |
| "loss": 0.2255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22128023207187653, |
| "step": 2680, |
| "valid_targets_mean": 3301.1, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 3.64314789687924, |
| "grad_norm": 0.6649128121001402, |
| "learning_rate": 2.2073521110449456e-05, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2295609414577484, |
| "step": 2685, |
| "valid_targets_mean": 3177.9, |
| "valid_targets_min": 1144 |
| }, |
| { |
| "epoch": 3.649932157394844, |
| "grad_norm": 0.6882954051754054, |
| "learning_rate": 2.200621100967886e-05, |
| "loss": 0.2192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2442229986190796, |
| "step": 2690, |
| "valid_targets_mean": 3074.8, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 3.656716417910448, |
| "grad_norm": 0.6820903463422161, |
| "learning_rate": 2.193887794643932e-05, |
| "loss": 0.2324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23110562562942505, |
| "step": 2695, |
| "valid_targets_mean": 3172.8, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 3.6635006784260513, |
| "grad_norm": 0.6997238880911637, |
| "learning_rate": 2.187152269140419e-05, |
| "loss": 0.2147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21552921831607819, |
| "step": 2700, |
| "valid_targets_mean": 2677.4, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 3.670284938941655, |
| "grad_norm": 0.7131884522201282, |
| "learning_rate": 2.180414601550084e-05, |
| "loss": 0.219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2269384115934372, |
| "step": 2705, |
| "valid_targets_mean": 2801.8, |
| "valid_targets_min": 1388 |
| }, |
| { |
| "epoch": 3.677069199457259, |
| "grad_norm": 0.7172347353831631, |
| "learning_rate": 2.1736748689901792e-05, |
| "loss": 0.2251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22936025261878967, |
| "step": 2710, |
| "valid_targets_mean": 2702.1, |
| "valid_targets_min": 1312 |
| }, |
| { |
| "epoch": 3.683853459972863, |
| "grad_norm": 0.6583901504326424, |
| "learning_rate": 2.1669331486015942e-05, |
| "loss": 0.2189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.221341073513031, |
| "step": 2715, |
| "valid_targets_mean": 2726.4, |
| "valid_targets_min": 1008 |
| }, |
| { |
| "epoch": 3.690637720488467, |
| "grad_norm": 0.6670649918476067, |
| "learning_rate": 2.1601895175479677e-05, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18742845952510834, |
| "step": 2720, |
| "valid_targets_mean": 2824.9, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 3.6974219810040707, |
| "grad_norm": 0.7043411361057197, |
| "learning_rate": 2.1534440530148104e-05, |
| "loss": 0.218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.224558025598526, |
| "step": 2725, |
| "valid_targets_mean": 2730.9, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 3.7042062415196746, |
| "grad_norm": 0.8290546440140429, |
| "learning_rate": 2.1466968322086168e-05, |
| "loss": 0.2314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24871769547462463, |
| "step": 2730, |
| "valid_targets_mean": 2595.6, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 3.710990502035278, |
| "grad_norm": 0.6684634109147515, |
| "learning_rate": 2.1399479323559837e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22964484989643097, |
| "step": 2735, |
| "valid_targets_mean": 3235.6, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 3.717774762550882, |
| "grad_norm": 0.6468283601913088, |
| "learning_rate": 2.133197430702725e-05, |
| "loss": 0.2233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22138440608978271, |
| "step": 2740, |
| "valid_targets_mean": 2955.9, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 3.724559023066486, |
| "grad_norm": 0.6848302786495842, |
| "learning_rate": 2.1264454045129885e-05, |
| "loss": 0.2332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23357048630714417, |
| "step": 2745, |
| "valid_targets_mean": 2971.2, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 3.7313432835820897, |
| "grad_norm": 0.8076399629104075, |
| "learning_rate": 2.1196919310683722e-05, |
| "loss": 0.2277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24134433269500732, |
| "step": 2750, |
| "valid_targets_mean": 2742.0, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 3.7381275440976935, |
| "grad_norm": 0.7937429467781824, |
| "learning_rate": 2.112937087667039e-05, |
| "loss": 0.2276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23753595352172852, |
| "step": 2755, |
| "valid_targets_mean": 2422.7, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 3.744911804613297, |
| "grad_norm": 0.6806559152552468, |
| "learning_rate": 2.106180951622829e-05, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.241061270236969, |
| "step": 2760, |
| "valid_targets_mean": 2973.4, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 3.751696065128901, |
| "grad_norm": 0.695950276005158, |
| "learning_rate": 2.0994236002643822e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20735937356948853, |
| "step": 2765, |
| "valid_targets_mean": 2495.0, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 3.7584803256445047, |
| "grad_norm": 0.8597190728087525, |
| "learning_rate": 2.0926651109342457e-05, |
| "loss": 0.2282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2300506830215454, |
| "step": 2770, |
| "valid_targets_mean": 2055.6, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 3.7652645861601086, |
| "grad_norm": 0.7385601024810353, |
| "learning_rate": 2.0859055609879916e-05, |
| "loss": 0.2286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23074880242347717, |
| "step": 2775, |
| "valid_targets_mean": 2834.2, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 3.7720488466757125, |
| "grad_norm": 0.7000695708428455, |
| "learning_rate": 2.0791450277933322e-05, |
| "loss": 0.2262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21346724033355713, |
| "step": 2780, |
| "valid_targets_mean": 2711.2, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 3.778833107191316, |
| "grad_norm": 0.6921395024706539, |
| "learning_rate": 2.0723835887292334e-05, |
| "loss": 0.232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2142827957868576, |
| "step": 2785, |
| "valid_targets_mean": 2578.4, |
| "valid_targets_min": 1125 |
| }, |
| { |
| "epoch": 3.78561736770692, |
| "grad_norm": 0.7682439574392755, |
| "learning_rate": 2.0656213211850295e-05, |
| "loss": 0.2211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21348156034946442, |
| "step": 2790, |
| "valid_targets_mean": 2177.8, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 3.7924016282225237, |
| "grad_norm": 0.7600371041182261, |
| "learning_rate": 2.058858302559537e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23701968789100647, |
| "step": 2795, |
| "valid_targets_mean": 2633.8, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 3.7991858887381276, |
| "grad_norm": 0.7139158160982614, |
| "learning_rate": 2.05209461026017e-05, |
| "loss": 0.2276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.233786478638649, |
| "step": 2800, |
| "valid_targets_mean": 2587.3, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 3.8059701492537314, |
| "grad_norm": 0.7176024981852444, |
| "learning_rate": 2.045330321702053e-05, |
| "loss": 0.2271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22029541432857513, |
| "step": 2805, |
| "valid_targets_mean": 2586.6, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 3.812754409769335, |
| "grad_norm": 0.6149619152466096, |
| "learning_rate": 2.0385655143071336e-05, |
| "loss": 0.2159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19177527725696564, |
| "step": 2810, |
| "valid_targets_mean": 3115.8, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 3.819538670284939, |
| "grad_norm": 0.6945022382481121, |
| "learning_rate": 2.031800265503299e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2345021814107895, |
| "step": 2815, |
| "valid_targets_mean": 3089.4, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 3.8263229308005426, |
| "grad_norm": 0.718365382422882, |
| "learning_rate": 2.02503465272349e-05, |
| "loss": 0.2186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21639087796211243, |
| "step": 2820, |
| "valid_targets_mean": 2522.1, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 3.8331071913161465, |
| "grad_norm": 0.7049711808427084, |
| "learning_rate": 2.0182687534048107e-05, |
| "loss": 0.2216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24925465881824493, |
| "step": 2825, |
| "valid_targets_mean": 2881.4, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 3.8398914518317504, |
| "grad_norm": 0.7569193242813216, |
| "learning_rate": 2.011502644987646e-05, |
| "loss": 0.2344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2595372796058655, |
| "step": 2830, |
| "valid_targets_mean": 2309.4, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 3.8466757123473543, |
| "grad_norm": 0.6067978450699282, |
| "learning_rate": 2.0047364049147747e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21039123833179474, |
| "step": 2835, |
| "valid_targets_mean": 3391.3, |
| "valid_targets_min": 805 |
| }, |
| { |
| "epoch": 3.853459972862958, |
| "grad_norm": 0.6539018194253448, |
| "learning_rate": 1.9979701106304824e-05, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.241075336933136, |
| "step": 2840, |
| "valid_targets_mean": 2985.6, |
| "valid_targets_min": 1362 |
| }, |
| { |
| "epoch": 3.8602442333785616, |
| "grad_norm": 0.672599881101891, |
| "learning_rate": 1.991203839579674e-05, |
| "loss": 0.2311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2360815405845642, |
| "step": 2845, |
| "valid_targets_mean": 2885.5, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 3.8670284938941655, |
| "grad_norm": 0.7800657928131475, |
| "learning_rate": 1.984437669206989e-05, |
| "loss": 0.2148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20892655849456787, |
| "step": 2850, |
| "valid_targets_mean": 2320.9, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 3.8738127544097694, |
| "grad_norm": 0.6676687527814975, |
| "learning_rate": 1.9776716769559157e-05, |
| "loss": 0.2368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22498619556427002, |
| "step": 2855, |
| "valid_targets_mean": 3164.1, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 3.8805970149253732, |
| "grad_norm": 0.5995122983093996, |
| "learning_rate": 1.970905940267902e-05, |
| "loss": 0.2152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21802213788032532, |
| "step": 2860, |
| "valid_targets_mean": 3898.9, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 3.887381275440977, |
| "grad_norm": 0.647688327782899, |
| "learning_rate": 1.9641405365814717e-05, |
| "loss": 0.2242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21417051553726196, |
| "step": 2865, |
| "valid_targets_mean": 3167.7, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 3.8941655359565805, |
| "grad_norm": 0.6546310967035971, |
| "learning_rate": 1.9573755433313378e-05, |
| "loss": 0.2223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2323242872953415, |
| "step": 2870, |
| "valid_targets_mean": 3041.1, |
| "valid_targets_min": 1319 |
| }, |
| { |
| "epoch": 3.9009497964721844, |
| "grad_norm": 0.7383143695334415, |
| "learning_rate": 1.9506110379475128e-05, |
| "loss": 0.2258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2311961054801941, |
| "step": 2875, |
| "valid_targets_mean": 2362.9, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.9077340569877883, |
| "grad_norm": 0.8430450237904688, |
| "learning_rate": 1.9438470978544287e-05, |
| "loss": 0.2198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21592223644256592, |
| "step": 2880, |
| "valid_targets_mean": 3625.7, |
| "valid_targets_min": 1167 |
| }, |
| { |
| "epoch": 3.914518317503392, |
| "grad_norm": 0.7707831179099163, |
| "learning_rate": 1.9370838004700455e-05, |
| "loss": 0.2287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24675382673740387, |
| "step": 2885, |
| "valid_targets_mean": 2393.0, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 3.921302578018996, |
| "grad_norm": 0.7280249588483818, |
| "learning_rate": 1.930321223204967e-05, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24415768682956696, |
| "step": 2890, |
| "valid_targets_mean": 2570.4, |
| "valid_targets_min": 1242 |
| }, |
| { |
| "epoch": 3.9280868385345995, |
| "grad_norm": 0.7871720247148984, |
| "learning_rate": 1.9235594434615552e-05, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21705761551856995, |
| "step": 2895, |
| "valid_targets_mean": 2329.9, |
| "valid_targets_min": 934 |
| }, |
| { |
| "epoch": 3.9348710990502034, |
| "grad_norm": 0.6824607839533505, |
| "learning_rate": 1.9167985386330435e-05, |
| "loss": 0.2179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2021501511335373, |
| "step": 2900, |
| "valid_targets_mean": 3006.3, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 3.9416553595658073, |
| "grad_norm": 0.580360164037747, |
| "learning_rate": 1.910038586102652e-05, |
| "loss": 0.2063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18379102647304535, |
| "step": 2905, |
| "valid_targets_mean": 2916.4, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 3.948439620081411, |
| "grad_norm": 0.7244276692797579, |
| "learning_rate": 1.9032796632427e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22763890027999878, |
| "step": 2910, |
| "valid_targets_mean": 2483.5, |
| "valid_targets_min": 831 |
| }, |
| { |
| "epoch": 3.955223880597015, |
| "grad_norm": 0.7606015895849964, |
| "learning_rate": 1.896521847413722e-05, |
| "loss": 0.2238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2129872590303421, |
| "step": 2915, |
| "valid_targets_mean": 2604.8, |
| "valid_targets_min": 1424 |
| }, |
| { |
| "epoch": 3.9620081411126185, |
| "grad_norm": 0.7996005811272329, |
| "learning_rate": 1.8897652159635826e-05, |
| "loss": 0.2351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2276165634393692, |
| "step": 2920, |
| "valid_targets_mean": 2545.5, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 3.9687924016282228, |
| "grad_norm": 0.6306491453103433, |
| "learning_rate": 1.8830098462265892e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2229669839143753, |
| "step": 2925, |
| "valid_targets_mean": 3271.3, |
| "valid_targets_min": 1296 |
| }, |
| { |
| "epoch": 3.975576662143826, |
| "grad_norm": 0.7155034374723849, |
| "learning_rate": 1.8762558155226086e-05, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23799753189086914, |
| "step": 2930, |
| "valid_targets_mean": 2748.9, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 3.98236092265943, |
| "grad_norm": 0.8976533438979097, |
| "learning_rate": 1.869503201156181e-05, |
| "loss": 0.212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20464091002941132, |
| "step": 2935, |
| "valid_targets_mean": 1909.6, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 3.989145183175034, |
| "grad_norm": 0.6624349548194711, |
| "learning_rate": 1.8627520804156365e-05, |
| "loss": 0.2258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22667071223258972, |
| "step": 2940, |
| "valid_targets_mean": 3271.6, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 3.995929443690638, |
| "grad_norm": 0.6151495628097419, |
| "learning_rate": 1.856002530572209e-05, |
| "loss": 0.2189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21382832527160645, |
| "step": 2945, |
| "valid_targets_mean": 3332.6, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 4.002713704206242, |
| "grad_norm": 0.615787649304689, |
| "learning_rate": 1.8492546288791518e-05, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19524888694286346, |
| "step": 2950, |
| "valid_targets_mean": 3521.4, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 4.009497964721845, |
| "grad_norm": 0.7774165923273912, |
| "learning_rate": 1.842508452570855e-05, |
| "loss": 0.2003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20001152157783508, |
| "step": 2955, |
| "valid_targets_mean": 2349.4, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 4.0162822252374495, |
| "grad_norm": 0.664596861061304, |
| "learning_rate": 1.8357640788619605e-05, |
| "loss": 0.1992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21963298320770264, |
| "step": 2960, |
| "valid_targets_mean": 3053.3, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 4.023066485753053, |
| "grad_norm": 0.7193062756351686, |
| "learning_rate": 1.8290215849464773e-05, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2050497829914093, |
| "step": 2965, |
| "valid_targets_mean": 2874.3, |
| "valid_targets_min": 1465 |
| }, |
| { |
| "epoch": 4.029850746268656, |
| "grad_norm": 0.7682247189848644, |
| "learning_rate": 1.8222810479969e-05, |
| "loss": 0.1952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20245233178138733, |
| "step": 2970, |
| "valid_targets_mean": 2529.4, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 4.036635006784261, |
| "grad_norm": 0.7099650203393719, |
| "learning_rate": 1.815542545163323e-05, |
| "loss": 0.1908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18782241642475128, |
| "step": 2975, |
| "valid_targets_mean": 2867.7, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 4.043419267299864, |
| "grad_norm": 0.6679826007373775, |
| "learning_rate": 1.808806153572561e-05, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18531766533851624, |
| "step": 2980, |
| "valid_targets_mean": 3430.7, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 4.050203527815468, |
| "grad_norm": 0.6971278596727647, |
| "learning_rate": 1.802071950327261e-05, |
| "loss": 0.189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1951214224100113, |
| "step": 2985, |
| "valid_targets_mean": 2909.7, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 4.056987788331072, |
| "grad_norm": 0.6975225843392714, |
| "learning_rate": 1.7953400125050252e-05, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19596266746520996, |
| "step": 2990, |
| "valid_targets_mean": 3136.7, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 4.063772048846675, |
| "grad_norm": 0.616610532499199, |
| "learning_rate": 1.7886104171575264e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17603719234466553, |
| "step": 2995, |
| "valid_targets_mean": 3788.1, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 4.07055630936228, |
| "grad_norm": 0.8204028517819303, |
| "learning_rate": 1.7818832413096248e-05, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1822405755519867, |
| "step": 3000, |
| "valid_targets_mean": 2084.1, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 4.077340569877883, |
| "grad_norm": 0.8644454831039673, |
| "learning_rate": 1.775158561958489e-05, |
| "loss": 0.208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21637216210365295, |
| "step": 3005, |
| "valid_targets_mean": 2142.1, |
| "valid_targets_min": 1117 |
| }, |
| { |
| "epoch": 4.084124830393487, |
| "grad_norm": 0.6868713845692973, |
| "learning_rate": 1.768436456072713e-05, |
| "loss": 0.1927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17520518600940704, |
| "step": 3010, |
| "valid_targets_mean": 3152.6, |
| "valid_targets_min": 1144 |
| }, |
| { |
| "epoch": 4.090909090909091, |
| "grad_norm": 0.646335349816201, |
| "learning_rate": 1.7617170005914363e-05, |
| "loss": 0.194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18921396136283875, |
| "step": 3015, |
| "valid_targets_mean": 3166.6, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 4.097693351424695, |
| "grad_norm": 0.7095934220573488, |
| "learning_rate": 1.755000272423461e-05, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18535733222961426, |
| "step": 3020, |
| "valid_targets_mean": 2847.2, |
| "valid_targets_min": 1211 |
| }, |
| { |
| "epoch": 4.104477611940299, |
| "grad_norm": 0.7722733457306606, |
| "learning_rate": 1.7482863484463747e-05, |
| "loss": 0.1943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1878623217344284, |
| "step": 3025, |
| "valid_targets_mean": 2357.7, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 4.111261872455902, |
| "grad_norm": 0.7558210158635994, |
| "learning_rate": 1.7415753055056693e-05, |
| "loss": 0.2009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20962506532669067, |
| "step": 3030, |
| "valid_targets_mean": 2774.4, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 4.118046132971506, |
| "grad_norm": 0.7019234157644559, |
| "learning_rate": 1.73486722041386e-05, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17214052379131317, |
| "step": 3035, |
| "valid_targets_mean": 2344.8, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 4.12483039348711, |
| "grad_norm": 0.7056358240413717, |
| "learning_rate": 1.7281621699496086e-05, |
| "loss": 0.1809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18809084594249725, |
| "step": 3040, |
| "valid_targets_mean": 2753.2, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 4.131614654002714, |
| "grad_norm": 0.7928593105079518, |
| "learning_rate": 1.7214602308568426e-05, |
| "loss": 0.1858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16787604987621307, |
| "step": 3045, |
| "valid_targets_mean": 2298.5, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 4.1383989145183175, |
| "grad_norm": 0.7453927190983547, |
| "learning_rate": 1.714761479843879e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2303515374660492, |
| "step": 3050, |
| "valid_targets_mean": 3051.8, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 4.145183175033921, |
| "grad_norm": 0.7004503623184913, |
| "learning_rate": 1.708065993582543e-05, |
| "loss": 0.1842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1861414909362793, |
| "step": 3055, |
| "valid_targets_mean": 2926.8, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 4.151967435549525, |
| "grad_norm": 0.5969912948853561, |
| "learning_rate": 1.701373848707294e-05, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16732157766819, |
| "step": 3060, |
| "valid_targets_mean": 3249.8, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 4.158751696065129, |
| "grad_norm": 0.7889354028527934, |
| "learning_rate": 1.6946851218143464e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2116738259792328, |
| "step": 3065, |
| "valid_targets_mean": 2610.2, |
| "valid_targets_min": 1017 |
| }, |
| { |
| "epoch": 4.165535956580733, |
| "grad_norm": 0.6969382167538735, |
| "learning_rate": 1.6879998894607937e-05, |
| "loss": 0.2062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.184125155210495, |
| "step": 3070, |
| "valid_targets_mean": 2778.3, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 4.1723202170963365, |
| "grad_norm": 0.7661282970421094, |
| "learning_rate": 1.6813182281637318e-05, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18725869059562683, |
| "step": 3075, |
| "valid_targets_mean": 2373.2, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 4.17910447761194, |
| "grad_norm": 0.7127514162035592, |
| "learning_rate": 1.674640214399383e-05, |
| "loss": 0.1981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20451834797859192, |
| "step": 3080, |
| "valid_targets_mean": 3058.9, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 4.185888738127544, |
| "grad_norm": 0.7261600863010719, |
| "learning_rate": 1.6679659246022224e-05, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19646155834197998, |
| "step": 3085, |
| "valid_targets_mean": 2840.0, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 4.192672998643148, |
| "grad_norm": 0.7318920710785716, |
| "learning_rate": 1.6612954351641004e-05, |
| "loss": 0.1871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1673353910446167, |
| "step": 3090, |
| "valid_targets_mean": 2456.0, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 4.199457259158752, |
| "grad_norm": 0.7618896273234488, |
| "learning_rate": 1.65462882243337e-05, |
| "loss": 0.2045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2328355312347412, |
| "step": 3095, |
| "valid_targets_mean": 2732.4, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 4.2062415196743554, |
| "grad_norm": 0.6950613889947367, |
| "learning_rate": 1.6479661627140125e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21082782745361328, |
| "step": 3100, |
| "valid_targets_mean": 3076.4, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 4.213025780189959, |
| "grad_norm": 0.7422212651396944, |
| "learning_rate": 1.6413075322647645e-05, |
| "loss": 0.202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17804861068725586, |
| "step": 3105, |
| "valid_targets_mean": 2741.3, |
| "valid_targets_min": 1230 |
| }, |
| { |
| "epoch": 4.219810040705563, |
| "grad_norm": 0.8313162708546203, |
| "learning_rate": 1.634653007298245e-05, |
| "loss": 0.2025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21381892263889313, |
| "step": 3110, |
| "valid_targets_mean": 2521.1, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 4.226594301221167, |
| "grad_norm": 0.7343807869521366, |
| "learning_rate": 1.628002663980083e-05, |
| "loss": 0.1958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18454739451408386, |
| "step": 3115, |
| "valid_targets_mean": 3389.7, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 4.233378561736771, |
| "grad_norm": 0.7180737684834317, |
| "learning_rate": 1.6213565784280448e-05, |
| "loss": 0.1972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20628373324871063, |
| "step": 3120, |
| "valid_targets_mean": 2695.5, |
| "valid_targets_min": 1330 |
| }, |
| { |
| "epoch": 4.240162822252374, |
| "grad_norm": 0.7446535802715553, |
| "learning_rate": 1.6147148267111648e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20070384442806244, |
| "step": 3125, |
| "valid_targets_mean": 2581.9, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 4.246947082767978, |
| "grad_norm": 0.7867961809991622, |
| "learning_rate": 1.608077484848872e-05, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21188589930534363, |
| "step": 3130, |
| "valid_targets_mean": 2598.0, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 4.253731343283582, |
| "grad_norm": 0.7452760690333677, |
| "learning_rate": 1.601444628810124e-05, |
| "loss": 0.1859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19212831556797028, |
| "step": 3135, |
| "valid_targets_mean": 2548.9, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 4.260515603799186, |
| "grad_norm": 0.640609370408385, |
| "learning_rate": 1.5948163345125322e-05, |
| "loss": 0.1927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1867392212152481, |
| "step": 3140, |
| "valid_targets_mean": 2978.2, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 4.26729986431479, |
| "grad_norm": 0.7904463927412828, |
| "learning_rate": 1.5881926778214985e-05, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18848653137683868, |
| "step": 3145, |
| "valid_targets_mean": 2162.2, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 4.274084124830393, |
| "grad_norm": 0.6862590326254344, |
| "learning_rate": 1.581573734549342e-05, |
| "loss": 0.2075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19391348958015442, |
| "step": 3150, |
| "valid_targets_mean": 2840.2, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 4.280868385345998, |
| "grad_norm": 0.753930226852254, |
| "learning_rate": 1.574959580454435e-05, |
| "loss": 0.2073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2218829095363617, |
| "step": 3155, |
| "valid_targets_mean": 2770.5, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 4.287652645861601, |
| "grad_norm": 0.7173848707428967, |
| "learning_rate": 1.5683502912403334e-05, |
| "loss": 0.19, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18789169192314148, |
| "step": 3160, |
| "valid_targets_mean": 2473.1, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 4.2944369063772045, |
| "grad_norm": 0.6756808344570617, |
| "learning_rate": 1.5617459425549118e-05, |
| "loss": 0.1889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17631642520427704, |
| "step": 3165, |
| "valid_targets_mean": 2783.0, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 4.301221166892809, |
| "grad_norm": 0.7596274040196479, |
| "learning_rate": 1.555146609989496e-05, |
| "loss": 0.1942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19371306896209717, |
| "step": 3170, |
| "valid_targets_mean": 2678.5, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 4.308005427408412, |
| "grad_norm": 0.7950503499609197, |
| "learning_rate": 1.5485523690780003e-05, |
| "loss": 0.2032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20015594363212585, |
| "step": 3175, |
| "valid_targets_mean": 2270.9, |
| "valid_targets_min": 1330 |
| }, |
| { |
| "epoch": 4.314789687924017, |
| "grad_norm": 0.6284596925256105, |
| "learning_rate": 1.5419632952960605e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16846656799316406, |
| "step": 3180, |
| "valid_targets_mean": 3001.5, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 4.32157394843962, |
| "grad_norm": 0.6201630615003697, |
| "learning_rate": 1.5353794640601716e-05, |
| "loss": 0.1971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18524964153766632, |
| "step": 3185, |
| "valid_targets_mean": 3645.7, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 4.3283582089552235, |
| "grad_norm": 0.711809826493421, |
| "learning_rate": 1.5288009507268237e-05, |
| "loss": 0.1998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21540531516075134, |
| "step": 3190, |
| "valid_targets_mean": 3402.2, |
| "valid_targets_min": 1522 |
| }, |
| { |
| "epoch": 4.335142469470828, |
| "grad_norm": 0.6972934803265656, |
| "learning_rate": 1.5222278305916398e-05, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18640825152397156, |
| "step": 3195, |
| "valid_targets_mean": 3293.5, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 4.341926729986431, |
| "grad_norm": 0.6481026199784268, |
| "learning_rate": 1.5156601788885148e-05, |
| "loss": 0.1877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1833941638469696, |
| "step": 3200, |
| "valid_targets_mean": 3167.9, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 4.348710990502036, |
| "grad_norm": 0.8208339691617204, |
| "learning_rate": 1.5090980707887516e-05, |
| "loss": 0.2051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2145204246044159, |
| "step": 3205, |
| "valid_targets_mean": 2193.7, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 4.355495251017639, |
| "grad_norm": 0.6739050449873922, |
| "learning_rate": 1.5025415814002053e-05, |
| "loss": 0.1943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19558805227279663, |
| "step": 3210, |
| "valid_targets_mean": 3247.9, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 4.362279511533243, |
| "grad_norm": 0.7330699785639507, |
| "learning_rate": 1.4959907857664193e-05, |
| "loss": 0.2004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20514100790023804, |
| "step": 3215, |
| "valid_targets_mean": 2830.6, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 4.369063772048847, |
| "grad_norm": 0.7397083988883265, |
| "learning_rate": 1.4894457588657685e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20222502946853638, |
| "step": 3220, |
| "valid_targets_mean": 2764.8, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 4.37584803256445, |
| "grad_norm": 0.8585950766535199, |
| "learning_rate": 1.4829065756106011e-05, |
| "loss": 0.1869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2083539068698883, |
| "step": 3225, |
| "valid_targets_mean": 3063.8, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 4.3826322930800545, |
| "grad_norm": 0.6992154976029811, |
| "learning_rate": 1.47637331084638e-05, |
| "loss": 0.1968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18280436098575592, |
| "step": 3230, |
| "valid_targets_mean": 2991.1, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 4.389416553595658, |
| "grad_norm": 0.7220348383997678, |
| "learning_rate": 1.4698460393508279e-05, |
| "loss": 0.1861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17603710293769836, |
| "step": 3235, |
| "valid_targets_mean": 2676.9, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 4.396200814111262, |
| "grad_norm": 0.6815437556740436, |
| "learning_rate": 1.4633248358330685e-05, |
| "loss": 0.1892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17538878321647644, |
| "step": 3240, |
| "valid_targets_mean": 2802.6, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 4.402985074626866, |
| "grad_norm": 0.7423631904328546, |
| "learning_rate": 1.4568097749327755e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2101781815290451, |
| "step": 3245, |
| "valid_targets_mean": 2564.9, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 4.409769335142469, |
| "grad_norm": 0.6279743544457285, |
| "learning_rate": 1.4503009312193145e-05, |
| "loss": 0.1992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18776188790798187, |
| "step": 3250, |
| "valid_targets_mean": 3485.3, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 4.4165535956580735, |
| "grad_norm": 0.72461497188728, |
| "learning_rate": 1.4437983791908927e-05, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19717328250408173, |
| "step": 3255, |
| "valid_targets_mean": 2907.9, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 4.423337856173677, |
| "grad_norm": 0.8394035988938123, |
| "learning_rate": 1.4373021932737029e-05, |
| "loss": 0.198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2060231864452362, |
| "step": 3260, |
| "valid_targets_mean": 2521.2, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 4.430122116689281, |
| "grad_norm": 0.7846496377698511, |
| "learning_rate": 1.4308124478210743e-05, |
| "loss": 0.1909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18877476453781128, |
| "step": 3265, |
| "valid_targets_mean": 2120.6, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 4.436906377204885, |
| "grad_norm": 0.7718040186575822, |
| "learning_rate": 1.4243292171126206e-05, |
| "loss": 0.189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1813274621963501, |
| "step": 3270, |
| "valid_targets_mean": 2067.4, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 4.443690637720488, |
| "grad_norm": 0.8763562192740045, |
| "learning_rate": 1.4178525753533898e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1990664005279541, |
| "step": 3275, |
| "valid_targets_mean": 1895.3, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 4.450474898236092, |
| "grad_norm": 0.7818367524680697, |
| "learning_rate": 1.4113825966730141e-05, |
| "loss": 0.1987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2248629331588745, |
| "step": 3280, |
| "valid_targets_mean": 2445.3, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 4.457259158751696, |
| "grad_norm": 0.7080706103494964, |
| "learning_rate": 1.4049193551248625e-05, |
| "loss": 0.1931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19344773888587952, |
| "step": 3285, |
| "valid_targets_mean": 2806.9, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 4.4640434192673, |
| "grad_norm": 0.6352432822796971, |
| "learning_rate": 1.3984629246851938e-05, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18108458817005157, |
| "step": 3290, |
| "valid_targets_mean": 3230.6, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 4.470827679782904, |
| "grad_norm": 0.7766733822813426, |
| "learning_rate": 1.3920133792523075e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20187707245349884, |
| "step": 3295, |
| "valid_targets_mean": 2388.1, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 4.477611940298507, |
| "grad_norm": 0.6809158943751472, |
| "learning_rate": 1.3855707926457003e-05, |
| "loss": 0.1904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1838938295841217, |
| "step": 3300, |
| "valid_targets_mean": 2920.3, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 4.484396200814111, |
| "grad_norm": 0.7081716006567864, |
| "learning_rate": 1.3791352386052201e-05, |
| "loss": 0.1895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18974432349205017, |
| "step": 3305, |
| "valid_targets_mean": 2833.9, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 4.491180461329715, |
| "grad_norm": 0.767864152806456, |
| "learning_rate": 1.3727067907902232e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18521273136138916, |
| "step": 3310, |
| "valid_targets_mean": 2255.4, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 4.497964721845319, |
| "grad_norm": 0.688596857727443, |
| "learning_rate": 1.366285522778728e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1874987781047821, |
| "step": 3315, |
| "valid_targets_mean": 2975.4, |
| "valid_targets_min": 1163 |
| }, |
| { |
| "epoch": 4.504748982360923, |
| "grad_norm": 0.7386731368747045, |
| "learning_rate": 1.359871508066577e-05, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20306339859962463, |
| "step": 3320, |
| "valid_targets_mean": 2857.8, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 4.511533242876526, |
| "grad_norm": 0.8257894045478894, |
| "learning_rate": 1.3534648200665933e-05, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18575474619865417, |
| "step": 3325, |
| "valid_targets_mean": 2783.4, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 4.51831750339213, |
| "grad_norm": 0.6867092598234874, |
| "learning_rate": 1.3470655321077403e-05, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18126091361045837, |
| "step": 3330, |
| "valid_targets_mean": 2647.6, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 4.525101763907734, |
| "grad_norm": 0.7798112286441644, |
| "learning_rate": 1.3406737174342834e-05, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23899130523204803, |
| "step": 3335, |
| "valid_targets_mean": 2828.8, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 4.531886024423338, |
| "grad_norm": 0.7069921488313058, |
| "learning_rate": 1.3342894492049504e-05, |
| "loss": 0.2048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20431819558143616, |
| "step": 3340, |
| "valid_targets_mean": 3127.2, |
| "valid_targets_min": 1317 |
| }, |
| { |
| "epoch": 4.5386702849389415, |
| "grad_norm": 0.7506355898759934, |
| "learning_rate": 1.3279128004920958e-05, |
| "loss": 0.1914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1895807385444641, |
| "step": 3345, |
| "valid_targets_mean": 2666.6, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 4.545454545454545, |
| "grad_norm": 0.6725468343286256, |
| "learning_rate": 1.3215438442808624e-05, |
| "loss": 0.1984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2019132673740387, |
| "step": 3350, |
| "valid_targets_mean": 3209.2, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 4.552238805970149, |
| "grad_norm": 0.6889050275687484, |
| "learning_rate": 1.3151826534683474e-05, |
| "loss": 0.1971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1907675564289093, |
| "step": 3355, |
| "valid_targets_mean": 3152.4, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 4.559023066485753, |
| "grad_norm": 0.7190846116998305, |
| "learning_rate": 1.308829300862768e-05, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18840348720550537, |
| "step": 3360, |
| "valid_targets_mean": 2810.2, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 4.565807327001357, |
| "grad_norm": 0.6702795320500231, |
| "learning_rate": 1.3024838591826274e-05, |
| "loss": 0.1987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18903514742851257, |
| "step": 3365, |
| "valid_targets_mean": 3127.1, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 4.5725915875169605, |
| "grad_norm": 0.7488732753982411, |
| "learning_rate": 1.296146401055883e-05, |
| "loss": 0.2061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22193178534507751, |
| "step": 3370, |
| "valid_targets_mean": 3123.5, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 4.579375848032565, |
| "grad_norm": 0.7263613305452004, |
| "learning_rate": 1.2898169990191148e-05, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1917208731174469, |
| "step": 3375, |
| "valid_targets_mean": 2815.2, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.586160108548168, |
| "grad_norm": 0.7868953900274589, |
| "learning_rate": 1.2834957255166948e-05, |
| "loss": 0.1892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17863771319389343, |
| "step": 3380, |
| "valid_targets_mean": 2261.1, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 4.592944369063772, |
| "grad_norm": 0.7888410061782655, |
| "learning_rate": 1.2771826528999602e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20688292384147644, |
| "step": 3385, |
| "valid_targets_mean": 2547.2, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 4.599728629579376, |
| "grad_norm": 0.690580382285912, |
| "learning_rate": 1.2708778534263803e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17476820945739746, |
| "step": 3390, |
| "valid_targets_mean": 2701.8, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 4.606512890094979, |
| "grad_norm": 0.7470662126944148, |
| "learning_rate": 1.2645813992587352e-05, |
| "loss": 0.1908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.187617227435112, |
| "step": 3395, |
| "valid_targets_mean": 2586.8, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 4.613297150610584, |
| "grad_norm": 1.2159270387590686, |
| "learning_rate": 1.258293362464286e-05, |
| "loss": 0.1988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1858140230178833, |
| "step": 3400, |
| "valid_targets_mean": 2249.7, |
| "valid_targets_min": 1083 |
| }, |
| { |
| "epoch": 4.620081411126187, |
| "grad_norm": 0.7718829974398066, |
| "learning_rate": 1.2520138150139515e-05, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.183822900056839, |
| "step": 3405, |
| "valid_targets_mean": 2386.8, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 4.6268656716417915, |
| "grad_norm": 0.7237060148317359, |
| "learning_rate": 1.2457428287814843e-05, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2160126268863678, |
| "step": 3410, |
| "valid_targets_mean": 3024.9, |
| "valid_targets_min": 1350 |
| }, |
| { |
| "epoch": 4.633649932157395, |
| "grad_norm": 0.6970676682341086, |
| "learning_rate": 1.2394804755426478e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19945994019508362, |
| "step": 3415, |
| "valid_targets_mean": 2918.2, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 4.640434192672998, |
| "grad_norm": 0.7002590495581039, |
| "learning_rate": 1.233226826974395e-05, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1719842553138733, |
| "step": 3420, |
| "valid_targets_mean": 2718.7, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 4.647218453188603, |
| "grad_norm": 0.6667044269630936, |
| "learning_rate": 1.2269819546540463e-05, |
| "loss": 0.1948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17064428329467773, |
| "step": 3425, |
| "valid_targets_mean": 2865.0, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 4.654002713704206, |
| "grad_norm": 0.6723526548267423, |
| "learning_rate": 1.2207459300584743e-05, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17956231534481049, |
| "step": 3430, |
| "valid_targets_mean": 2932.9, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 4.6607869742198105, |
| "grad_norm": 0.7597739606585969, |
| "learning_rate": 1.2145188245632825e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2012956440448761, |
| "step": 3435, |
| "valid_targets_mean": 2589.2, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 4.667571234735414, |
| "grad_norm": 0.7411616368636825, |
| "learning_rate": 1.2083007094419883e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20920173823833466, |
| "step": 3440, |
| "valid_targets_mean": 2706.8, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 4.674355495251017, |
| "grad_norm": 0.7282082144235389, |
| "learning_rate": 1.2020916558652089e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19379201531410217, |
| "step": 3445, |
| "valid_targets_mean": 2854.1, |
| "valid_targets_min": 1386 |
| }, |
| { |
| "epoch": 4.681139755766622, |
| "grad_norm": 0.7634331226060735, |
| "learning_rate": 1.195891734899846e-05, |
| "loss": 0.1915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17866259813308716, |
| "step": 3450, |
| "valid_targets_mean": 2573.5, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 4.687924016282225, |
| "grad_norm": 0.7399644965932646, |
| "learning_rate": 1.1897010175082722e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17755639553070068, |
| "step": 3455, |
| "valid_targets_mean": 2317.8, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 4.694708276797829, |
| "grad_norm": 0.6760992330649304, |
| "learning_rate": 1.1835195745475167e-05, |
| "loss": 0.2131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2119104415178299, |
| "step": 3460, |
| "valid_targets_mean": 3410.1, |
| "valid_targets_min": 1576 |
| }, |
| { |
| "epoch": 4.701492537313433, |
| "grad_norm": 0.804513682015714, |
| "learning_rate": 1.17734747676846e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19752076268196106, |
| "step": 3465, |
| "valid_targets_mean": 2760.2, |
| "valid_targets_min": 1040 |
| }, |
| { |
| "epoch": 4.708276797829036, |
| "grad_norm": 0.707949135936285, |
| "learning_rate": 1.1711847948150186e-05, |
| "loss": 0.1997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20585331320762634, |
| "step": 3470, |
| "valid_targets_mean": 3060.6, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 4.715061058344641, |
| "grad_norm": 0.7166396129531338, |
| "learning_rate": 1.1650315992233385e-05, |
| "loss": 0.2016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20005938410758972, |
| "step": 3475, |
| "valid_targets_mean": 2918.9, |
| "valid_targets_min": 1040 |
| }, |
| { |
| "epoch": 4.721845318860244, |
| "grad_norm": 0.7074627055555082, |
| "learning_rate": 1.1588879604209881e-05, |
| "loss": 0.201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19769035279750824, |
| "step": 3480, |
| "valid_targets_mean": 2911.6, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 4.728629579375848, |
| "grad_norm": 0.6735143020870807, |
| "learning_rate": 1.1527539487261506e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22932162880897522, |
| "step": 3485, |
| "valid_targets_mean": 3123.0, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 4.735413839891452, |
| "grad_norm": 0.869273594031702, |
| "learning_rate": 1.1466296343468226e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19944173097610474, |
| "step": 3490, |
| "valid_targets_mean": 3747.2, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 4.742198100407055, |
| "grad_norm": 0.6999556266338184, |
| "learning_rate": 1.1405150873800061e-05, |
| "loss": 0.2049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19584204256534576, |
| "step": 3495, |
| "valid_targets_mean": 2844.7, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 4.74898236092266, |
| "grad_norm": 0.8746934337613864, |
| "learning_rate": 1.1344103778109087e-05, |
| "loss": 0.2027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20564094185829163, |
| "step": 3500, |
| "valid_targets_mean": 2151.8, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 4.755766621438263, |
| "grad_norm": 0.7003484221778359, |
| "learning_rate": 1.1283155755121435e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18846553564071655, |
| "step": 3505, |
| "valid_targets_mean": 3061.2, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.762550881953867, |
| "grad_norm": 0.6735835369736797, |
| "learning_rate": 1.1222307502429263e-05, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19506067037582397, |
| "step": 3510, |
| "valid_targets_mean": 3378.4, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 4.769335142469471, |
| "grad_norm": 0.6771476818137822, |
| "learning_rate": 1.116155971648281e-05, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2082287073135376, |
| "step": 3515, |
| "valid_targets_mean": 3448.1, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 4.776119402985074, |
| "grad_norm": 0.6422854879412622, |
| "learning_rate": 1.1100913092582374e-05, |
| "loss": 0.1898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17519763112068176, |
| "step": 3520, |
| "valid_targets_mean": 3188.4, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 4.7829036635006785, |
| "grad_norm": 0.6470472236301349, |
| "learning_rate": 1.1040368324870423e-05, |
| "loss": 0.1965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18372002243995667, |
| "step": 3525, |
| "valid_targets_mean": 3492.9, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 4.789687924016282, |
| "grad_norm": 0.6869308415003494, |
| "learning_rate": 1.0979926106323573e-05, |
| "loss": 0.197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19661110639572144, |
| "step": 3530, |
| "valid_targets_mean": 2938.6, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 4.796472184531886, |
| "grad_norm": 0.7662043660493066, |
| "learning_rate": 1.0919587128744706e-05, |
| "loss": 0.1965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22166971862316132, |
| "step": 3535, |
| "valid_targets_mean": 2690.3, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 4.80325644504749, |
| "grad_norm": 0.7199094564088079, |
| "learning_rate": 1.0859352082755063e-05, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20869404077529907, |
| "step": 3540, |
| "valid_targets_mean": 2830.1, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 4.810040705563093, |
| "grad_norm": 0.7328326298477729, |
| "learning_rate": 1.0799221657786277e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19416038691997528, |
| "step": 3545, |
| "valid_targets_mean": 2855.2, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 4.8168249660786975, |
| "grad_norm": 0.7338773028161634, |
| "learning_rate": 1.0739196542072554e-05, |
| "loss": 0.1909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18774661421775818, |
| "step": 3550, |
| "valid_targets_mean": 2434.1, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 4.823609226594301, |
| "grad_norm": 0.7453504801028396, |
| "learning_rate": 1.067927742264274e-05, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19881319999694824, |
| "step": 3555, |
| "valid_targets_mean": 2629.6, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 4.830393487109905, |
| "grad_norm": 0.7369431692578411, |
| "learning_rate": 1.0619464985312504e-05, |
| "loss": 0.1935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17585620284080505, |
| "step": 3560, |
| "valid_targets_mean": 2719.1, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 4.837177747625509, |
| "grad_norm": 0.9297708502664351, |
| "learning_rate": 1.0559759914676446e-05, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22836661338806152, |
| "step": 3565, |
| "valid_targets_mean": 2168.1, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 4.843962008141113, |
| "grad_norm": 0.6894574277930866, |
| "learning_rate": 1.0500162894100274e-05, |
| "loss": 0.2012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19786593317985535, |
| "step": 3570, |
| "valid_targets_mean": 3260.4, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 4.850746268656716, |
| "grad_norm": 0.8540680237621792, |
| "learning_rate": 1.0440674605713017e-05, |
| "loss": 0.1912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18931138515472412, |
| "step": 3575, |
| "valid_targets_mean": 2123.2, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 4.85753052917232, |
| "grad_norm": 0.7445669474855375, |
| "learning_rate": 1.0381295730399156e-05, |
| "loss": 0.1927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.191728413105011, |
| "step": 3580, |
| "valid_targets_mean": 2410.1, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 4.864314789687924, |
| "grad_norm": 0.7329229972435735, |
| "learning_rate": 1.03220269477909e-05, |
| "loss": 0.2127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22075408697128296, |
| "step": 3585, |
| "valid_targets_mean": 2925.0, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 4.871099050203528, |
| "grad_norm": 0.6758139766478201, |
| "learning_rate": 1.026286893626033e-05, |
| "loss": 0.1927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19056375324726105, |
| "step": 3590, |
| "valid_targets_mean": 3506.6, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 4.877883310719132, |
| "grad_norm": 0.7551370606263685, |
| "learning_rate": 1.0203822372911714e-05, |
| "loss": 0.2036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2027992308139801, |
| "step": 3595, |
| "valid_targets_mean": 2676.6, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 4.884667571234735, |
| "grad_norm": 0.7381200265506531, |
| "learning_rate": 1.0144887933573686e-05, |
| "loss": 0.186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18408526480197906, |
| "step": 3600, |
| "valid_targets_mean": 2631.5, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 4.89145183175034, |
| "grad_norm": 0.7270532833777729, |
| "learning_rate": 1.0086066292791573e-05, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17591014504432678, |
| "step": 3605, |
| "valid_targets_mean": 2436.2, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 4.898236092265943, |
| "grad_norm": 0.7296787884141677, |
| "learning_rate": 1.0027358123819625e-05, |
| "loss": 0.1968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1968274563550949, |
| "step": 3610, |
| "valid_targets_mean": 2829.1, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 4.905020352781547, |
| "grad_norm": 0.6735262562716569, |
| "learning_rate": 9.968764098613329e-06, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.178671196103096, |
| "step": 3615, |
| "valid_targets_mean": 2898.8, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 4.911804613297151, |
| "grad_norm": 0.7274784816663047, |
| "learning_rate": 9.910284887821733e-06, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20386825501918793, |
| "step": 3620, |
| "valid_targets_mean": 2990.9, |
| "valid_targets_min": 1363 |
| }, |
| { |
| "epoch": 4.918588873812754, |
| "grad_norm": 0.8018638530971335, |
| "learning_rate": 9.851921160779729e-06, |
| "loss": 0.192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19886431097984314, |
| "step": 3625, |
| "valid_targets_mean": 2382.4, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 4.925373134328359, |
| "grad_norm": 0.8315431805467934, |
| "learning_rate": 9.793673585500454e-06, |
| "loss": 0.1842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18963271379470825, |
| "step": 3630, |
| "valid_targets_mean": 2400.6, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 4.932157394843962, |
| "grad_norm": 0.7403065285740312, |
| "learning_rate": 9.73554282866757e-06, |
| "loss": 0.1961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1916884034872055, |
| "step": 3635, |
| "valid_targets_mean": 2484.9, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 4.9389416553595655, |
| "grad_norm": 0.8056592037843991, |
| "learning_rate": 9.677529555627705e-06, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1968856304883957, |
| "step": 3640, |
| "valid_targets_mean": 2373.9, |
| "valid_targets_min": 1222 |
| }, |
| { |
| "epoch": 4.94572591587517, |
| "grad_norm": 0.6847276217753911, |
| "learning_rate": 9.61963443038278e-06, |
| "loss": 0.1993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19165253639221191, |
| "step": 3645, |
| "valid_targets_mean": 3296.9, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 4.952510176390773, |
| "grad_norm": 0.7481331426159193, |
| "learning_rate": 9.561858115582432e-06, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1881834864616394, |
| "step": 3650, |
| "valid_targets_mean": 2459.1, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 4.959294436906378, |
| "grad_norm": 0.7380750762114332, |
| "learning_rate": 9.504201272516456e-06, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18983861804008484, |
| "step": 3655, |
| "valid_targets_mean": 2577.3, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 4.966078697421981, |
| "grad_norm": 0.7036147611876263, |
| "learning_rate": 9.44666456110718e-06, |
| "loss": 0.1896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19570358097553253, |
| "step": 3660, |
| "valid_targets_mean": 3040.5, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 4.9728629579375845, |
| "grad_norm": 0.7932038159884709, |
| "learning_rate": 9.38924863990197e-06, |
| "loss": 0.198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1836714744567871, |
| "step": 3665, |
| "valid_targets_mean": 2151.7, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 4.979647218453189, |
| "grad_norm": 0.6964386837916756, |
| "learning_rate": 9.331954166065635e-06, |
| "loss": 0.1952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18505831062793732, |
| "step": 3670, |
| "valid_targets_mean": 2731.6, |
| "valid_targets_min": 1165 |
| }, |
| { |
| "epoch": 4.986431478968792, |
| "grad_norm": 0.7601196537242972, |
| "learning_rate": 9.27478179537297e-06, |
| "loss": 0.1947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19253486394882202, |
| "step": 3675, |
| "valid_targets_mean": 2509.4, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 4.993215739484397, |
| "grad_norm": 0.8155086323774635, |
| "learning_rate": 9.217732182201184e-06, |
| "loss": 0.1946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19509343802928925, |
| "step": 3680, |
| "valid_targets_mean": 2026.9, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.7646808703457486, |
| "learning_rate": 9.160805979522452e-06, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18792404234409332, |
| "step": 3685, |
| "valid_targets_mean": 2684.2, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 5.006784260515603, |
| "grad_norm": 0.6860326719249955, |
| "learning_rate": 9.104003838896445e-06, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1950758993625641, |
| "step": 3690, |
| "valid_targets_mean": 3155.7, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 5.013568521031208, |
| "grad_norm": 0.8441160581115864, |
| "learning_rate": 9.047326410462829e-06, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.161452516913414, |
| "step": 3695, |
| "valid_targets_mean": 1863.4, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 5.020352781546811, |
| "grad_norm": 0.7067203784439574, |
| "learning_rate": 8.990774342933888e-06, |
| "loss": 0.1871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1699763685464859, |
| "step": 3700, |
| "valid_targets_mean": 3295.1, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 5.0271370420624155, |
| "grad_norm": 0.7615352549068712, |
| "learning_rate": 8.934348283587029e-06, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1905319094657898, |
| "step": 3705, |
| "valid_targets_mean": 2832.2, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 5.033921302578019, |
| "grad_norm": 0.7103293756116349, |
| "learning_rate": 8.878048878257443e-06, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1622033417224884, |
| "step": 3710, |
| "valid_targets_mean": 2561.1, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 5.040705563093622, |
| "grad_norm": 0.6718184525017369, |
| "learning_rate": 8.82187677133065e-06, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16609933972358704, |
| "step": 3715, |
| "valid_targets_mean": 3126.9, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 5.047489823609227, |
| "grad_norm": 0.7837080600442082, |
| "learning_rate": 8.765832605735159e-06, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19446608424186707, |
| "step": 3720, |
| "valid_targets_mean": 2856.1, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 5.05427408412483, |
| "grad_norm": 0.6563421792158702, |
| "learning_rate": 8.709917022935117e-06, |
| "loss": 0.1711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14738069474697113, |
| "step": 3725, |
| "valid_targets_mean": 2943.3, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 5.0610583446404345, |
| "grad_norm": 0.8034887747351711, |
| "learning_rate": 8.654130662922927e-06, |
| "loss": 0.1875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18572455644607544, |
| "step": 3730, |
| "valid_targets_mean": 3047.0, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 5.067842605156038, |
| "grad_norm": 0.7592407786525501, |
| "learning_rate": 8.59847416421198e-06, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18500494956970215, |
| "step": 3735, |
| "valid_targets_mean": 2576.2, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 5.074626865671641, |
| "grad_norm": 0.7045855658185989, |
| "learning_rate": 8.542948163829281e-06, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16853509843349457, |
| "step": 3740, |
| "valid_targets_mean": 3002.3, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 5.081411126187246, |
| "grad_norm": 0.7766566314367146, |
| "learning_rate": 8.48755329730822e-06, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1695399284362793, |
| "step": 3745, |
| "valid_targets_mean": 3074.8, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 5.088195386702849, |
| "grad_norm": 0.7988370685668423, |
| "learning_rate": 8.432290198681252e-06, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2006351202726364, |
| "step": 3750, |
| "valid_targets_mean": 2525.8, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 5.094979647218453, |
| "grad_norm": 0.7054424649548406, |
| "learning_rate": 8.377159500472655e-06, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17677809298038483, |
| "step": 3755, |
| "valid_targets_mean": 3203.8, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 5.101763907734057, |
| "grad_norm": 0.713725738511338, |
| "learning_rate": 8.322161833691314e-06, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16771814227104187, |
| "step": 3760, |
| "valid_targets_mean": 2823.8, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 5.108548168249661, |
| "grad_norm": 0.8555144387463031, |
| "learning_rate": 8.267297827823451e-06, |
| "loss": 0.185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18097899854183197, |
| "step": 3765, |
| "valid_targets_mean": 2239.5, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 5.115332428765265, |
| "grad_norm": 0.6934604273299277, |
| "learning_rate": 8.212568110825475e-06, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15618851780891418, |
| "step": 3770, |
| "valid_targets_mean": 2868.4, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 5.122116689280868, |
| "grad_norm": 0.7648492466356746, |
| "learning_rate": 8.157973309116734e-06, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17531245946884155, |
| "step": 3775, |
| "valid_targets_mean": 2618.1, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 5.128900949796472, |
| "grad_norm": 0.7285693028786157, |
| "learning_rate": 8.103514047572409e-06, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17099301517009735, |
| "step": 3780, |
| "valid_targets_mean": 3425.1, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 5.135685210312076, |
| "grad_norm": 0.8202795361017104, |
| "learning_rate": 8.049190949516312e-06, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1414903700351715, |
| "step": 3785, |
| "valid_targets_mean": 1912.8, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 5.14246947082768, |
| "grad_norm": 0.8263248998725861, |
| "learning_rate": 7.995004636713763e-06, |
| "loss": 0.189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19762666523456573, |
| "step": 3790, |
| "valid_targets_mean": 2408.8, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 5.149253731343284, |
| "grad_norm": 0.7393185445325677, |
| "learning_rate": 7.940955729364508e-06, |
| "loss": 0.1819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1720680445432663, |
| "step": 3795, |
| "valid_targets_mean": 2906.4, |
| "valid_targets_min": 1179 |
| }, |
| { |
| "epoch": 5.156037991858887, |
| "grad_norm": 0.803370399333462, |
| "learning_rate": 7.88704484609556e-06, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17175140976905823, |
| "step": 3800, |
| "valid_targets_mean": 2323.2, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 5.162822252374491, |
| "grad_norm": 0.6536820438575788, |
| "learning_rate": 7.83327260395418e-06, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15294823050498962, |
| "step": 3805, |
| "valid_targets_mean": 3594.9, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 5.169606512890095, |
| "grad_norm": 1.122135081296357, |
| "learning_rate": 7.779639618400761e-06, |
| "loss": 0.1765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16186411678791046, |
| "step": 3810, |
| "valid_targets_mean": 2047.9, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 5.176390773405699, |
| "grad_norm": 0.8371034996880778, |
| "learning_rate": 7.726146503301835e-06, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18086284399032593, |
| "step": 3815, |
| "valid_targets_mean": 2635.9, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 5.1831750339213025, |
| "grad_norm": 0.8310613229880927, |
| "learning_rate": 7.672793870922988e-06, |
| "loss": 0.1842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1729108989238739, |
| "step": 3820, |
| "valid_targets_mean": 2154.4, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 5.189959294436906, |
| "grad_norm": 0.7736398422191684, |
| "learning_rate": 7.619582331921918e-06, |
| "loss": 0.1821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19843143224716187, |
| "step": 3825, |
| "valid_targets_mean": 3357.2, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 5.19674355495251, |
| "grad_norm": 0.7257509154939583, |
| "learning_rate": 7.566512495341387e-06, |
| "loss": 0.1812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17544004321098328, |
| "step": 3830, |
| "valid_targets_mean": 2957.9, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 5.203527815468114, |
| "grad_norm": 0.7915636689184143, |
| "learning_rate": 7.513584968602279e-06, |
| "loss": 0.1721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17739593982696533, |
| "step": 3835, |
| "valid_targets_mean": 3008.4, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 5.210312075983718, |
| "grad_norm": 0.7239442896123227, |
| "learning_rate": 7.4608003574966604e-06, |
| "loss": 0.1728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15659013390541077, |
| "step": 3840, |
| "valid_targets_mean": 2958.6, |
| "valid_targets_min": 1152 |
| }, |
| { |
| "epoch": 5.2170963364993215, |
| "grad_norm": 0.8396562792144856, |
| "learning_rate": 7.408159266180803e-06, |
| "loss": 0.1713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17542997002601624, |
| "step": 3845, |
| "valid_targets_mean": 2428.6, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 5.223880597014926, |
| "grad_norm": 0.7134303390915493, |
| "learning_rate": 7.3556622971683246e-06, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1654246747493744, |
| "step": 3850, |
| "valid_targets_mean": 3071.6, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 5.230664857530529, |
| "grad_norm": 0.8451388168730941, |
| "learning_rate": 7.3033100513232356e-06, |
| "loss": 0.1836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1715916395187378, |
| "step": 3855, |
| "valid_targets_mean": 2175.2, |
| "valid_targets_min": 1131 |
| }, |
| { |
| "epoch": 5.237449118046133, |
| "grad_norm": 0.717910328678344, |
| "learning_rate": 7.251103127853119e-06, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17889514565467834, |
| "step": 3860, |
| "valid_targets_mean": 2811.1, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 5.244233378561737, |
| "grad_norm": 0.6701275306479537, |
| "learning_rate": 7.199042124302218e-06, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15984272956848145, |
| "step": 3865, |
| "valid_targets_mean": 3448.8, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 5.25101763907734, |
| "grad_norm": 0.7396236758430029, |
| "learning_rate": 7.1471276365446265e-06, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16578418016433716, |
| "step": 3870, |
| "valid_targets_mean": 2790.6, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 5.257801899592945, |
| "grad_norm": 0.7761448636163958, |
| "learning_rate": 7.095360258777479e-06, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16495108604431152, |
| "step": 3875, |
| "valid_targets_mean": 2547.1, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 5.264586160108548, |
| "grad_norm": 0.7169834901617055, |
| "learning_rate": 7.043740583514116e-06, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16059651970863342, |
| "step": 3880, |
| "valid_targets_mean": 2682.7, |
| "valid_targets_min": 1125 |
| }, |
| { |
| "epoch": 5.271370420624152, |
| "grad_norm": 0.937784973378471, |
| "learning_rate": 6.99226920157734e-06, |
| "loss": 0.1759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15862375497817993, |
| "step": 3885, |
| "valid_targets_mean": 2327.4, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 5.278154681139756, |
| "grad_norm": 0.7636077182810278, |
| "learning_rate": 6.9409467020926105e-06, |
| "loss": 0.1692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15665987133979797, |
| "step": 3890, |
| "valid_targets_mean": 2581.5, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 5.284938941655359, |
| "grad_norm": 0.8082211996097235, |
| "learning_rate": 6.88977367248135e-06, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17556774616241455, |
| "step": 3895, |
| "valid_targets_mean": 2410.4, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 5.291723202170964, |
| "grad_norm": 0.7855611135912653, |
| "learning_rate": 6.838750698454179e-06, |
| "loss": 0.1823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19265274703502655, |
| "step": 3900, |
| "valid_targets_mean": 2630.9, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 5.298507462686567, |
| "grad_norm": 0.773979909790802, |
| "learning_rate": 6.787878364004223e-06, |
| "loss": 0.1805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1742939054965973, |
| "step": 3905, |
| "valid_targets_mean": 2754.6, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 5.305291723202171, |
| "grad_norm": 0.7045798341954811, |
| "learning_rate": 6.7371572514004565e-06, |
| "loss": 0.1759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1639530062675476, |
| "step": 3910, |
| "valid_targets_mean": 3152.7, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 5.312075983717775, |
| "grad_norm": 0.7118839049525844, |
| "learning_rate": 6.6865879411809905e-06, |
| "loss": 0.1702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1681211143732071, |
| "step": 3915, |
| "valid_targets_mean": 3016.1, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 5.318860244233378, |
| "grad_norm": 0.7619077612605996, |
| "learning_rate": 6.636171012146475e-06, |
| "loss": 0.1774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1695559173822403, |
| "step": 3920, |
| "valid_targets_mean": 2828.6, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 5.325644504748983, |
| "grad_norm": 0.704742231689896, |
| "learning_rate": 6.58590704135343e-06, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15426993370056152, |
| "step": 3925, |
| "valid_targets_mean": 2844.4, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 5.332428765264586, |
| "grad_norm": 1.083531396358083, |
| "learning_rate": 6.535796604107689e-06, |
| "loss": 0.1759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15194523334503174, |
| "step": 3930, |
| "valid_targets_mean": 2859.6, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 5.3392130257801895, |
| "grad_norm": 0.7267810541836737, |
| "learning_rate": 6.485840273957764e-06, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18725672364234924, |
| "step": 3935, |
| "valid_targets_mean": 3104.9, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 5.345997286295794, |
| "grad_norm": 0.7803241832429276, |
| "learning_rate": 6.4360386226883096e-06, |
| "loss": 0.1762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18757139146327972, |
| "step": 3940, |
| "valid_targets_mean": 2826.7, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 5.352781546811397, |
| "grad_norm": 0.7469635091923277, |
| "learning_rate": 6.386392220313595e-06, |
| "loss": 0.1844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1943964660167694, |
| "step": 3945, |
| "valid_targets_mean": 2944.8, |
| "valid_targets_min": 1105 |
| }, |
| { |
| "epoch": 5.359565807327002, |
| "grad_norm": 0.7710548111024483, |
| "learning_rate": 6.336901635070924e-06, |
| "loss": 0.1837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18395206332206726, |
| "step": 3950, |
| "valid_targets_mean": 2640.2, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 5.366350067842605, |
| "grad_norm": 0.7839171636791334, |
| "learning_rate": 6.287567433414203e-06, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18562139570713043, |
| "step": 3955, |
| "valid_targets_mean": 2582.2, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 5.373134328358209, |
| "grad_norm": 0.7856837884639124, |
| "learning_rate": 6.238390180007388e-06, |
| "loss": 0.1809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1797139048576355, |
| "step": 3960, |
| "valid_targets_mean": 2337.2, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 5.379918588873813, |
| "grad_norm": 0.7809120404347694, |
| "learning_rate": 6.189370437718076e-06, |
| "loss": 0.1708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17183539271354675, |
| "step": 3965, |
| "valid_targets_mean": 2353.1, |
| "valid_targets_min": 894 |
| }, |
| { |
| "epoch": 5.386702849389416, |
| "grad_norm": 0.7115407389633623, |
| "learning_rate": 6.140508767611031e-06, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17769712209701538, |
| "step": 3970, |
| "valid_targets_mean": 3229.7, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 5.393487109905021, |
| "grad_norm": 0.9077544313783328, |
| "learning_rate": 6.091805728941766e-06, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19499380886554718, |
| "step": 3975, |
| "valid_targets_mean": 3067.6, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 5.400271370420624, |
| "grad_norm": 0.8077064097851708, |
| "learning_rate": 6.0432618791501685e-06, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1870405375957489, |
| "step": 3980, |
| "valid_targets_mean": 2559.1, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 5.407055630936228, |
| "grad_norm": 0.6398380496001846, |
| "learning_rate": 5.994877773854073e-06, |
| "loss": 0.1702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15979993343353271, |
| "step": 3985, |
| "valid_targets_mean": 3374.1, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 5.413839891451832, |
| "grad_norm": 0.7502361275025041, |
| "learning_rate": 5.946653966842952e-06, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17689886689186096, |
| "step": 3990, |
| "valid_targets_mean": 2697.2, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 5.420624151967435, |
| "grad_norm": 0.7109443485696391, |
| "learning_rate": 5.89859101007153e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19721101224422455, |
| "step": 3995, |
| "valid_targets_mean": 3432.0, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 5.4274084124830395, |
| "grad_norm": 0.7778834659042302, |
| "learning_rate": 5.850689453653519e-06, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.176166370511055, |
| "step": 4000, |
| "valid_targets_mean": 2819.3, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 5.434192672998643, |
| "grad_norm": 0.7986804713666946, |
| "learning_rate": 5.802949845855268e-06, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17381024360656738, |
| "step": 4005, |
| "valid_targets_mean": 2511.1, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 5.440976933514247, |
| "grad_norm": 0.74764269275807, |
| "learning_rate": 5.75537273308951e-06, |
| "loss": 0.1694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1764945685863495, |
| "step": 4010, |
| "valid_targets_mean": 3111.7, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 5.447761194029851, |
| "grad_norm": 0.7387352711479095, |
| "learning_rate": 5.7079586599091386e-06, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1689624935388565, |
| "step": 4015, |
| "valid_targets_mean": 2689.8, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 5.454545454545454, |
| "grad_norm": 0.6334842178503496, |
| "learning_rate": 5.660708169000915e-06, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1706801950931549, |
| "step": 4020, |
| "valid_targets_mean": 4078.6, |
| "valid_targets_min": 1344 |
| }, |
| { |
| "epoch": 5.4613297150610585, |
| "grad_norm": 0.7687849593222028, |
| "learning_rate": 5.61362180117931e-06, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.180070698261261, |
| "step": 4025, |
| "valid_targets_mean": 2676.0, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 5.468113975576662, |
| "grad_norm": 0.730085829715646, |
| "learning_rate": 5.566700095380278e-06, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17584823071956635, |
| "step": 4030, |
| "valid_targets_mean": 3169.8, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 5.474898236092266, |
| "grad_norm": 0.7919939571403866, |
| "learning_rate": 5.519943588655119e-06, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16983819007873535, |
| "step": 4035, |
| "valid_targets_mean": 2544.8, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 5.48168249660787, |
| "grad_norm": 0.7573834464121695, |
| "learning_rate": 5.473352816164297e-06, |
| "loss": 0.1774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18410179018974304, |
| "step": 4040, |
| "valid_targets_mean": 2772.2, |
| "valid_targets_min": 1090 |
| }, |
| { |
| "epoch": 5.488466757123474, |
| "grad_norm": 0.8466367207178821, |
| "learning_rate": 5.426928311171349e-06, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1880597323179245, |
| "step": 4045, |
| "valid_targets_mean": 2396.6, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 5.495251017639077, |
| "grad_norm": 0.7284020341330157, |
| "learning_rate": 5.3806706050367595e-06, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1683264523744583, |
| "step": 4050, |
| "valid_targets_mean": 2992.8, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 5.502035278154681, |
| "grad_norm": 0.7784161722246488, |
| "learning_rate": 5.334580227211876e-06, |
| "loss": 0.1792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1845816969871521, |
| "step": 4055, |
| "valid_targets_mean": 2580.1, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 5.508819538670285, |
| "grad_norm": 0.8548009473097017, |
| "learning_rate": 5.28865770523288e-06, |
| "loss": 0.1802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17506195604801178, |
| "step": 4060, |
| "valid_targets_mean": 2178.6, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 5.515603799185889, |
| "grad_norm": 0.7774055293795816, |
| "learning_rate": 5.242903564714703e-06, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16525691747665405, |
| "step": 4065, |
| "valid_targets_mean": 2520.9, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 5.522388059701493, |
| "grad_norm": 0.796456602697807, |
| "learning_rate": 5.197318329345053e-06, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1665637195110321, |
| "step": 4070, |
| "valid_targets_mean": 2367.8, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 5.529172320217096, |
| "grad_norm": 0.646421264270265, |
| "learning_rate": 5.151902520878389e-06, |
| "loss": 0.1733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15533316135406494, |
| "step": 4075, |
| "valid_targets_mean": 2986.1, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 5.5359565807327, |
| "grad_norm": 0.7819970698101568, |
| "learning_rate": 5.106656659129976e-06, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20608392357826233, |
| "step": 4080, |
| "valid_targets_mean": 2478.6, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 5.542740841248304, |
| "grad_norm": 0.7853975289145698, |
| "learning_rate": 5.061581261969908e-06, |
| "loss": 0.1796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17922022938728333, |
| "step": 4085, |
| "valid_targets_mean": 2634.1, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 5.549525101763908, |
| "grad_norm": 0.7225473013309462, |
| "learning_rate": 5.016676845317195e-06, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1765461564064026, |
| "step": 4090, |
| "valid_targets_mean": 3014.4, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 5.556309362279512, |
| "grad_norm": 0.7295640966157877, |
| "learning_rate": 4.971943923133871e-06, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17156416177749634, |
| "step": 4095, |
| "valid_targets_mean": 3041.5, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 5.563093622795115, |
| "grad_norm": 0.9219762006603129, |
| "learning_rate": 4.9273830074190775e-06, |
| "loss": 0.1765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18373648822307587, |
| "step": 4100, |
| "valid_targets_mean": 2428.7, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 5.569877883310719, |
| "grad_norm": 0.702767206840844, |
| "learning_rate": 4.8829946082032485e-06, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13803914189338684, |
| "step": 4105, |
| "valid_targets_mean": 2718.2, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 5.576662143826323, |
| "grad_norm": 0.7199250201736765, |
| "learning_rate": 4.838779233542219e-06, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18196873366832733, |
| "step": 4110, |
| "valid_targets_mean": 3093.8, |
| "valid_targets_min": 1395 |
| }, |
| { |
| "epoch": 5.5834464043419265, |
| "grad_norm": 0.702683524158407, |
| "learning_rate": 4.794737389511466e-06, |
| "loss": 0.1667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15686261653900146, |
| "step": 4115, |
| "valid_targets_mean": 2956.6, |
| "valid_targets_min": 1365 |
| }, |
| { |
| "epoch": 5.590230664857531, |
| "grad_norm": 0.8226186328669812, |
| "learning_rate": 4.750869580200268e-06, |
| "loss": 0.1713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18233484029769897, |
| "step": 4120, |
| "valid_targets_mean": 2818.7, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 5.597014925373134, |
| "grad_norm": 0.757006026009914, |
| "learning_rate": 4.707176307705958e-06, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17816491425037384, |
| "step": 4125, |
| "valid_targets_mean": 2692.9, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 5.603799185888738, |
| "grad_norm": 0.7711809358808944, |
| "learning_rate": 4.6636580721281945e-06, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1927419900894165, |
| "step": 4130, |
| "valid_targets_mean": 2813.9, |
| "valid_targets_min": 1322 |
| }, |
| { |
| "epoch": 5.610583446404342, |
| "grad_norm": 0.8362493387614779, |
| "learning_rate": 4.620315371563188e-06, |
| "loss": 0.1812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16866496205329895, |
| "step": 4135, |
| "valid_targets_mean": 2549.8, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 5.6173677069199455, |
| "grad_norm": 0.7202504972034123, |
| "learning_rate": 4.577148702098064e-06, |
| "loss": 0.1708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18742281198501587, |
| "step": 4140, |
| "valid_targets_mean": 3108.2, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 5.62415196743555, |
| "grad_norm": 0.7230613052656376, |
| "learning_rate": 4.5341585578051125e-06, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1717241406440735, |
| "step": 4145, |
| "valid_targets_mean": 2795.6, |
| "valid_targets_min": 955 |
| }, |
| { |
| "epoch": 5.630936227951153, |
| "grad_norm": 0.7394571746760491, |
| "learning_rate": 4.491345430736207e-06, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17502638697624207, |
| "step": 4150, |
| "valid_targets_mean": 2911.4, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 5.637720488466757, |
| "grad_norm": 1.1380143885731062, |
| "learning_rate": 4.4487098109171115e-06, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16936932504177094, |
| "step": 4155, |
| "valid_targets_mean": 2618.9, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 5.644504748982361, |
| "grad_norm": 0.880683030604768, |
| "learning_rate": 4.406252186341904e-06, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1713424026966095, |
| "step": 4160, |
| "valid_targets_mean": 2082.8, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 5.651289009497964, |
| "grad_norm": 0.8944130226850632, |
| "learning_rate": 4.363973042967393e-06, |
| "loss": 0.1892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2198825478553772, |
| "step": 4165, |
| "valid_targets_mean": 2161.4, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 5.658073270013569, |
| "grad_norm": 0.7666908944066096, |
| "learning_rate": 4.3218728647075324e-06, |
| "loss": 0.1646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16684460639953613, |
| "step": 4170, |
| "valid_targets_mean": 2747.1, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 5.664857530529172, |
| "grad_norm": 1.1331036484064003, |
| "learning_rate": 4.2799521334279155e-06, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16542381048202515, |
| "step": 4175, |
| "valid_targets_mean": 2846.9, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 5.6716417910447765, |
| "grad_norm": 0.7113624200207286, |
| "learning_rate": 4.238211328940214e-06, |
| "loss": 0.175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15958712995052338, |
| "step": 4180, |
| "valid_targets_mean": 2826.9, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 5.67842605156038, |
| "grad_norm": 0.7443765505636735, |
| "learning_rate": 4.196650928996744e-06, |
| "loss": 0.1792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17205163836479187, |
| "step": 4185, |
| "valid_targets_mean": 2878.1, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 5.685210312075983, |
| "grad_norm": 0.765002712688627, |
| "learning_rate": 4.155271409284947e-06, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17750981450080872, |
| "step": 4190, |
| "valid_targets_mean": 2678.2, |
| "valid_targets_min": 1337 |
| }, |
| { |
| "epoch": 5.691994572591588, |
| "grad_norm": 0.7973473759974611, |
| "learning_rate": 4.114073243421964e-06, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18639904260635376, |
| "step": 4195, |
| "valid_targets_mean": 2673.8, |
| "valid_targets_min": 1544 |
| }, |
| { |
| "epoch": 5.698778833107191, |
| "grad_norm": 0.8006125558694456, |
| "learning_rate": 4.073056902949233e-06, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.181000754237175, |
| "step": 4200, |
| "valid_targets_mean": 2716.2, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 5.7055630936227955, |
| "grad_norm": 0.7771322898882181, |
| "learning_rate": 4.032222857327055e-06, |
| "loss": 0.1837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1973440945148468, |
| "step": 4205, |
| "valid_targets_mean": 3029.1, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 5.712347354138399, |
| "grad_norm": 0.7542045578109661, |
| "learning_rate": 3.991571573929263e-06, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16543592512607574, |
| "step": 4210, |
| "valid_targets_mean": 2804.5, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 5.719131614654002, |
| "grad_norm": 0.6746826061759319, |
| "learning_rate": 3.951103518037822e-06, |
| "loss": 0.1694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17549774050712585, |
| "step": 4215, |
| "valid_targets_mean": 3377.5, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 5.725915875169607, |
| "grad_norm": 0.7884807830662328, |
| "learning_rate": 3.910819152837564e-06, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19728972017765045, |
| "step": 4220, |
| "valid_targets_mean": 2609.3, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 5.73270013568521, |
| "grad_norm": 0.6844292385894344, |
| "learning_rate": 3.870718939410829e-06, |
| "loss": 0.1858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2012067437171936, |
| "step": 4225, |
| "valid_targets_mean": 3169.2, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 5.739484396200814, |
| "grad_norm": 0.6779140929423958, |
| "learning_rate": 3.8308033367322185e-06, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16013997793197632, |
| "step": 4230, |
| "valid_targets_mean": 3190.8, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 5.746268656716418, |
| "grad_norm": 0.7186843297493842, |
| "learning_rate": 3.791072801663349e-06, |
| "loss": 0.1858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17085684835910797, |
| "step": 4235, |
| "valid_targets_mean": 3101.9, |
| "valid_targets_min": 964 |
| }, |
| { |
| "epoch": 5.753052917232022, |
| "grad_norm": 0.773844588416225, |
| "learning_rate": 3.751527788947593e-06, |
| "loss": 0.1782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18918392062187195, |
| "step": 4240, |
| "valid_targets_mean": 2950.2, |
| "valid_targets_min": 1426 |
| }, |
| { |
| "epoch": 5.759837177747626, |
| "grad_norm": 0.8943301985541035, |
| "learning_rate": 3.7121687512049075e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1794520914554596, |
| "step": 4245, |
| "valid_targets_mean": 3305.4, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 5.766621438263229, |
| "grad_norm": 0.71555932932248, |
| "learning_rate": 3.672996138926623e-06, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1853591352701187, |
| "step": 4250, |
| "valid_targets_mean": 3303.0, |
| "valid_targets_min": 1317 |
| }, |
| { |
| "epoch": 5.773405698778833, |
| "grad_norm": 0.7600028735931071, |
| "learning_rate": 3.634010400470318e-06, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15217794477939606, |
| "step": 4255, |
| "valid_targets_mean": 2485.2, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 5.780189959294437, |
| "grad_norm": 0.6651550656338701, |
| "learning_rate": 3.595211982054652e-06, |
| "loss": 0.1807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15896007418632507, |
| "step": 4260, |
| "valid_targets_mean": 3312.4, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 5.786974219810041, |
| "grad_norm": 0.793423124225591, |
| "learning_rate": 3.5566013277542987e-06, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1872842162847519, |
| "step": 4265, |
| "valid_targets_mean": 2579.4, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 5.7937584803256446, |
| "grad_norm": 0.7190178787946112, |
| "learning_rate": 3.5181788794948267e-06, |
| "loss": 0.1739, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1685473471879959, |
| "step": 4270, |
| "valid_targets_mean": 2938.9, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 5.800542740841248, |
| "grad_norm": 0.7427543324860382, |
| "learning_rate": 3.479945077047655e-06, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18788832426071167, |
| "step": 4275, |
| "valid_targets_mean": 3514.1, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 5.807327001356852, |
| "grad_norm": 0.7301184905700668, |
| "learning_rate": 3.4419003580250386e-06, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1724769026041031, |
| "step": 4280, |
| "valid_targets_mean": 2761.8, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 5.814111261872456, |
| "grad_norm": 0.6996558660986915, |
| "learning_rate": 3.40404515787502e-06, |
| "loss": 0.1775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17133083939552307, |
| "step": 4285, |
| "valid_targets_mean": 3322.6, |
| "valid_targets_min": 1164 |
| }, |
| { |
| "epoch": 5.82089552238806, |
| "grad_norm": 0.7470138239152765, |
| "learning_rate": 3.366379909876487e-06, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1647733896970749, |
| "step": 4290, |
| "valid_targets_mean": 2699.9, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 5.8276797829036635, |
| "grad_norm": 0.8027648641349744, |
| "learning_rate": 3.3289050451341785e-06, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17798423767089844, |
| "step": 4295, |
| "valid_targets_mean": 2830.8, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 5.834464043419267, |
| "grad_norm": 0.6833745641979659, |
| "learning_rate": 3.291620992573781e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1725693941116333, |
| "step": 4300, |
| "valid_targets_mean": 3136.2, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 5.841248303934871, |
| "grad_norm": 0.7632930036843467, |
| "learning_rate": 3.254528178936991e-06, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1607835590839386, |
| "step": 4305, |
| "valid_targets_mean": 2220.1, |
| "valid_targets_min": 1083 |
| }, |
| { |
| "epoch": 5.848032564450475, |
| "grad_norm": 0.7766685814823788, |
| "learning_rate": 3.217627028776642e-06, |
| "loss": 0.1711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17807729542255402, |
| "step": 4310, |
| "valid_targets_mean": 3144.8, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 5.854816824966079, |
| "grad_norm": 0.7615851643722991, |
| "learning_rate": 3.180917964451864e-06, |
| "loss": 0.177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18378789722919464, |
| "step": 4315, |
| "valid_targets_mean": 2792.7, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 5.8616010854816825, |
| "grad_norm": 0.7720381142011892, |
| "learning_rate": 3.1444014061232096e-06, |
| "loss": 0.1774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19216835498809814, |
| "step": 4320, |
| "valid_targets_mean": 2816.5, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 5.868385345997286, |
| "grad_norm": 0.7413182551927285, |
| "learning_rate": 3.1080777717478906e-06, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17600227892398834, |
| "step": 4325, |
| "valid_targets_mean": 2807.1, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 5.87516960651289, |
| "grad_norm": 0.830639238497367, |
| "learning_rate": 3.071947477074948e-06, |
| "loss": 0.1744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20260506868362427, |
| "step": 4330, |
| "valid_targets_mean": 3276.9, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 5.881953867028494, |
| "grad_norm": 0.7247615457982057, |
| "learning_rate": 3.036010935640541e-06, |
| "loss": 0.1807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1745220124721527, |
| "step": 4335, |
| "valid_targets_mean": 3025.8, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 5.888738127544098, |
| "grad_norm": 0.7666810644080457, |
| "learning_rate": 3.0002685587631665e-06, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19823196530342102, |
| "step": 4340, |
| "valid_targets_mean": 2815.8, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 5.895522388059701, |
| "grad_norm": 0.6891577535572125, |
| "learning_rate": 2.9647207555389833e-06, |
| "loss": 0.1752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1756839156150818, |
| "step": 4345, |
| "valid_targets_mean": 3165.6, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 5.902306648575305, |
| "grad_norm": 0.6280441768186072, |
| "learning_rate": 2.929367932837128e-06, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16393789649009705, |
| "step": 4350, |
| "valid_targets_mean": 3511.4, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 5.909090909090909, |
| "grad_norm": 0.7212401001251478, |
| "learning_rate": 2.8942104952950358e-06, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1590360701084137, |
| "step": 4355, |
| "valid_targets_mean": 2814.4, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 5.915875169606513, |
| "grad_norm": 0.7587496985425881, |
| "learning_rate": 2.8592488453138402e-06, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18076002597808838, |
| "step": 4360, |
| "valid_targets_mean": 2772.0, |
| "valid_targets_min": 1406 |
| }, |
| { |
| "epoch": 5.922659430122117, |
| "grad_norm": 0.7026766056453736, |
| "learning_rate": 2.8244833830537334e-06, |
| "loss": 0.1775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16852641105651855, |
| "step": 4365, |
| "valid_targets_mean": 3198.9, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 5.92944369063772, |
| "grad_norm": 0.7591755791375419, |
| "learning_rate": 2.789914506429423e-06, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18854087591171265, |
| "step": 4370, |
| "valid_targets_mean": 3410.3, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 5.936227951153324, |
| "grad_norm": 0.7317196861574712, |
| "learning_rate": 2.755542611105544e-06, |
| "loss": 0.175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17983709275722504, |
| "step": 4375, |
| "valid_targets_mean": 2910.4, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 5.943012211668928, |
| "grad_norm": 0.7873291444565179, |
| "learning_rate": 2.7213680904921426e-06, |
| "loss": 0.1713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15739159286022186, |
| "step": 4380, |
| "valid_targets_mean": 2447.4, |
| "valid_targets_min": 1274 |
| }, |
| { |
| "epoch": 5.949796472184532, |
| "grad_norm": 0.783627540382998, |
| "learning_rate": 2.687391335740195e-06, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18448659777641296, |
| "step": 4385, |
| "valid_targets_mean": 2981.9, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 5.956580732700136, |
| "grad_norm": 0.8163415230485238, |
| "learning_rate": 2.6536127357370834e-06, |
| "loss": 0.1802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17967082560062408, |
| "step": 4390, |
| "valid_targets_mean": 2268.2, |
| "valid_targets_min": 1087 |
| }, |
| { |
| "epoch": 5.963364993215739, |
| "grad_norm": 0.6972529066512584, |
| "learning_rate": 2.6200326771021977e-06, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17101269960403442, |
| "step": 4395, |
| "valid_targets_mean": 3305.3, |
| "valid_targets_min": 1304 |
| }, |
| { |
| "epoch": 5.970149253731344, |
| "grad_norm": 0.7444293238213098, |
| "learning_rate": 2.5866515441824637e-06, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16424033045768738, |
| "step": 4400, |
| "valid_targets_mean": 2531.2, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 5.976933514246947, |
| "grad_norm": 0.7787083692853177, |
| "learning_rate": 2.553469719047983e-06, |
| "loss": 0.1827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18210354447364807, |
| "step": 4405, |
| "valid_targets_mean": 3141.8, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 5.9837177747625505, |
| "grad_norm": 0.7791998751111936, |
| "learning_rate": 2.5204875814876318e-06, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19235186278820038, |
| "step": 4410, |
| "valid_targets_mean": 2803.9, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 5.990502035278155, |
| "grad_norm": 0.7009703971990965, |
| "learning_rate": 2.487705509004721e-06, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18249055743217468, |
| "step": 4415, |
| "valid_targets_mean": 3232.0, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 5.997286295793758, |
| "grad_norm": 0.7781270453801223, |
| "learning_rate": 2.4551238768126906e-06, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16195908188819885, |
| "step": 4420, |
| "valid_targets_mean": 2633.4, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 6.004070556309363, |
| "grad_norm": 0.7415388448727406, |
| "learning_rate": 2.422743057830792e-06, |
| "loss": 0.1743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19907845556735992, |
| "step": 4425, |
| "valid_targets_mean": 2871.6, |
| "valid_targets_min": 690 |
| }, |
| { |
| "epoch": 6.010854816824966, |
| "grad_norm": 0.742053212238427, |
| "learning_rate": 2.3905634226798415e-06, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18320277333259583, |
| "step": 4430, |
| "valid_targets_mean": 3028.6, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 6.0176390773405695, |
| "grad_norm": 0.8079591238507426, |
| "learning_rate": 2.3585853396779546e-06, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17492371797561646, |
| "step": 4435, |
| "valid_targets_mean": 2414.6, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 6.024423337856174, |
| "grad_norm": 0.7245282326645127, |
| "learning_rate": 2.326809174836355e-06, |
| "loss": 0.1639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16501660645008087, |
| "step": 4440, |
| "valid_targets_mean": 2658.6, |
| "valid_targets_min": 805 |
| }, |
| { |
| "epoch": 6.031207598371777, |
| "grad_norm": 0.7529821726671959, |
| "learning_rate": 2.295235291855171e-06, |
| "loss": 0.1621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16563096642494202, |
| "step": 4445, |
| "valid_targets_mean": 2985.2, |
| "valid_targets_min": 1155 |
| }, |
| { |
| "epoch": 6.0379918588873815, |
| "grad_norm": 0.7218429838629064, |
| "learning_rate": 2.2638640521192666e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16327796876430511, |
| "step": 4450, |
| "valid_targets_mean": 2918.9, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 6.044776119402985, |
| "grad_norm": 0.7670474706596653, |
| "learning_rate": 2.23269581469413e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17224714159965515, |
| "step": 4455, |
| "valid_targets_mean": 2854.1, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 6.051560379918589, |
| "grad_norm": 0.85371010583432, |
| "learning_rate": 2.201730936321731e-06, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18799713253974915, |
| "step": 4460, |
| "valid_targets_mean": 2257.5, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 6.058344640434193, |
| "grad_norm": 0.8581102151455461, |
| "learning_rate": 2.170969771416471e-06, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19284003973007202, |
| "step": 4465, |
| "valid_targets_mean": 2541.4, |
| "valid_targets_min": 903 |
| }, |
| { |
| "epoch": 6.065128900949796, |
| "grad_norm": 0.7082075259100371, |
| "learning_rate": 2.140412672061094e-06, |
| "loss": 0.1696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14846593141555786, |
| "step": 4470, |
| "valid_targets_mean": 2874.5, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 6.0719131614654005, |
| "grad_norm": 0.6593303484533789, |
| "learning_rate": 2.1100599880026885e-06, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17295196652412415, |
| "step": 4475, |
| "valid_targets_mean": 3751.6, |
| "valid_targets_min": 1730 |
| }, |
| { |
| "epoch": 6.078697421981004, |
| "grad_norm": 0.7194386838659942, |
| "learning_rate": 2.079912066648655e-06, |
| "loss": 0.1669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14499616622924805, |
| "step": 4480, |
| "valid_targets_mean": 2578.9, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 6.085481682496608, |
| "grad_norm": 0.7703414212546942, |
| "learning_rate": 2.049969253062758e-06, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17155641317367554, |
| "step": 4485, |
| "valid_targets_mean": 2867.4, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 6.092265943012212, |
| "grad_norm": 0.7581834478927615, |
| "learning_rate": 2.0202318899611483e-06, |
| "loss": 0.1596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14970597624778748, |
| "step": 4490, |
| "valid_targets_mean": 2776.1, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 6.099050203527815, |
| "grad_norm": 0.8858694998395675, |
| "learning_rate": 1.9907003177084605e-06, |
| "loss": 0.1717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19518548250198364, |
| "step": 4495, |
| "valid_targets_mean": 2301.6, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 6.1058344640434195, |
| "grad_norm": 0.7698959242156672, |
| "learning_rate": 1.9613748743139126e-06, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18513622879981995, |
| "step": 4500, |
| "valid_targets_mean": 3196.8, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 6.112618724559023, |
| "grad_norm": 0.9050028409977037, |
| "learning_rate": 1.9322558954274305e-06, |
| "loss": 0.1693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17871133983135223, |
| "step": 4505, |
| "valid_targets_mean": 2160.6, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 6.119402985074627, |
| "grad_norm": 0.7740731558411673, |
| "learning_rate": 1.9033437143358213e-06, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16579106450080872, |
| "step": 4510, |
| "valid_targets_mean": 2948.0, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 6.126187245590231, |
| "grad_norm": 0.8348067497419805, |
| "learning_rate": 1.874638661958934e-06, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16571199893951416, |
| "step": 4515, |
| "valid_targets_mean": 2415.9, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 6.132971506105834, |
| "grad_norm": 0.7256235619648512, |
| "learning_rate": 1.8461410668459035e-06, |
| "loss": 0.1567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14996132254600525, |
| "step": 4520, |
| "valid_targets_mean": 2668.2, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 6.139755766621438, |
| "grad_norm": 0.7614175427466571, |
| "learning_rate": 1.8178512551713568e-06, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15067064762115479, |
| "step": 4525, |
| "valid_targets_mean": 3234.1, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 6.146540027137042, |
| "grad_norm": 0.7569505883546243, |
| "learning_rate": 1.7897695507317036e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17070305347442627, |
| "step": 4530, |
| "valid_targets_mean": 2981.2, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 6.153324287652646, |
| "grad_norm": 0.715139884326026, |
| "learning_rate": 1.761896274941426e-06, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1826499104499817, |
| "step": 4535, |
| "valid_targets_mean": 3501.9, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 6.16010854816825, |
| "grad_norm": 0.7854237661191246, |
| "learning_rate": 1.7342317468293912e-06, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16877636313438416, |
| "step": 4540, |
| "valid_targets_mean": 2512.0, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 6.166892808683853, |
| "grad_norm": 0.8303757582473726, |
| "learning_rate": 1.7067762830352096e-06, |
| "loss": 0.1728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17255139350891113, |
| "step": 4545, |
| "valid_targets_mean": 2534.2, |
| "valid_targets_min": 942 |
| }, |
| { |
| "epoch": 6.173677069199457, |
| "grad_norm": 0.7385224765472438, |
| "learning_rate": 1.679530197805599e-06, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15643605589866638, |
| "step": 4550, |
| "valid_targets_mean": 2944.8, |
| "valid_targets_min": 1366 |
| }, |
| { |
| "epoch": 6.180461329715061, |
| "grad_norm": 0.7564443718183899, |
| "learning_rate": 1.652493802990811e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17550310492515564, |
| "step": 4555, |
| "valid_targets_mean": 3110.1, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 6.187245590230665, |
| "grad_norm": 1.71255016027657, |
| "learning_rate": 1.6256674080410185e-06, |
| "loss": 0.1628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15688160061836243, |
| "step": 4560, |
| "valid_targets_mean": 3095.8, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 6.1940298507462686, |
| "grad_norm": 0.8040556589037928, |
| "learning_rate": 1.5990513200028269e-06, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1727936565876007, |
| "step": 4565, |
| "valid_targets_mean": 2527.2, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 6.200814111261873, |
| "grad_norm": 0.7945263075310672, |
| "learning_rate": 1.5726458435157255e-06, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18288177251815796, |
| "step": 4570, |
| "valid_targets_mean": 3045.4, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 6.207598371777476, |
| "grad_norm": 0.7545719664187707, |
| "learning_rate": 1.5464512808086008e-06, |
| "loss": 0.1694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17064568400382996, |
| "step": 4575, |
| "valid_targets_mean": 3098.4, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 6.21438263229308, |
| "grad_norm": 0.747591105064271, |
| "learning_rate": 1.5204679316963012e-06, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1849783957004547, |
| "step": 4580, |
| "valid_targets_mean": 3041.9, |
| "valid_targets_min": 1643 |
| }, |
| { |
| "epoch": 6.221166892808684, |
| "grad_norm": 0.7177247952162282, |
| "learning_rate": 1.4946960935761734e-06, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17120692133903503, |
| "step": 4585, |
| "valid_targets_mean": 3201.8, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 6.2279511533242875, |
| "grad_norm": 0.8094458246760512, |
| "learning_rate": 1.4691360614246897e-06, |
| "loss": 0.1692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16246119141578674, |
| "step": 4590, |
| "valid_targets_mean": 2322.5, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 6.234735413839892, |
| "grad_norm": 0.7798473673390547, |
| "learning_rate": 1.443788127794048e-06, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17415021359920502, |
| "step": 4595, |
| "valid_targets_mean": 2854.2, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 6.241519674355495, |
| "grad_norm": 0.7946140484277268, |
| "learning_rate": 1.4186525828088282e-06, |
| "loss": 0.1709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15857259929180145, |
| "step": 4600, |
| "valid_targets_mean": 2525.8, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 6.248303934871099, |
| "grad_norm": 0.7801428383995377, |
| "learning_rate": 1.3937297141626904e-06, |
| "loss": 0.1726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1684061586856842, |
| "step": 4605, |
| "valid_targets_mean": 2809.8, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 6.255088195386703, |
| "grad_norm": 0.6643638326526149, |
| "learning_rate": 1.3690198071150528e-06, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15296955406665802, |
| "step": 4610, |
| "valid_targets_mean": 3476.2, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 6.2618724559023065, |
| "grad_norm": 0.7686142175477614, |
| "learning_rate": 1.3445231444878504e-06, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17054758965969086, |
| "step": 4615, |
| "valid_targets_mean": 2753.3, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 6.268656716417911, |
| "grad_norm": 0.8432191119730226, |
| "learning_rate": 1.3202400066622834e-06, |
| "loss": 0.1713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17865519225597382, |
| "step": 4620, |
| "valid_targets_mean": 2344.4, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 6.275440976933514, |
| "grad_norm": 0.6339497035055569, |
| "learning_rate": 1.2961706715756184e-06, |
| "loss": 0.1587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1531352996826172, |
| "step": 4625, |
| "valid_targets_mean": 3586.7, |
| "valid_targets_min": 2054 |
| }, |
| { |
| "epoch": 6.282225237449118, |
| "grad_norm": 0.8544021195040931, |
| "learning_rate": 1.2723154147179973e-06, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1579844206571579, |
| "step": 4630, |
| "valid_targets_mean": 3154.9, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 6.289009497964722, |
| "grad_norm": 0.8007481753817313, |
| "learning_rate": 1.2486745091292862e-06, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1802925169467926, |
| "step": 4635, |
| "valid_targets_mean": 2729.8, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 6.295793758480325, |
| "grad_norm": 0.8142132607230317, |
| "learning_rate": 1.2252482253959653e-06, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18052034080028534, |
| "step": 4640, |
| "valid_targets_mean": 2541.6, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 6.30257801899593, |
| "grad_norm": 0.6774345228089872, |
| "learning_rate": 1.202036831648008e-06, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.150282084941864, |
| "step": 4645, |
| "valid_targets_mean": 3526.9, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 6.309362279511533, |
| "grad_norm": 0.7516698326728172, |
| "learning_rate": 1.1790405935558292e-06, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16584287583827972, |
| "step": 4650, |
| "valid_targets_mean": 2976.7, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 6.3161465400271375, |
| "grad_norm": 0.7046916433526038, |
| "learning_rate": 1.156259774327233e-06, |
| "loss": 0.1654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16168582439422607, |
| "step": 4655, |
| "valid_targets_mean": 3335.2, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 6.322930800542741, |
| "grad_norm": 0.767262026885646, |
| "learning_rate": 1.1336946347044164e-06, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15575771033763885, |
| "step": 4660, |
| "valid_targets_mean": 2716.2, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 6.329715061058344, |
| "grad_norm": 0.792890542631687, |
| "learning_rate": 1.111345432960964e-06, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16956427693367004, |
| "step": 4665, |
| "valid_targets_mean": 2624.8, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 6.336499321573949, |
| "grad_norm": 0.7772682272896229, |
| "learning_rate": 1.089212424898909e-06, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16567683219909668, |
| "step": 4670, |
| "valid_targets_mean": 2692.4, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 6.343283582089552, |
| "grad_norm": 0.7218817470491743, |
| "learning_rate": 1.0672958638457963e-06, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1656082570552826, |
| "step": 4675, |
| "valid_targets_mean": 3137.2, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 6.350067842605156, |
| "grad_norm": 0.7660758671491292, |
| "learning_rate": 1.0455960006517828e-06, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16689500212669373, |
| "step": 4680, |
| "valid_targets_mean": 2776.9, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 6.35685210312076, |
| "grad_norm": 0.7614176463332171, |
| "learning_rate": 1.0241130836867775e-06, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1655552089214325, |
| "step": 4685, |
| "valid_targets_mean": 2639.2, |
| "valid_targets_min": 1340 |
| }, |
| { |
| "epoch": 6.363636363636363, |
| "grad_norm": 0.731905552102256, |
| "learning_rate": 1.0028473588375775e-06, |
| "loss": 0.1613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15648706257343292, |
| "step": 4690, |
| "valid_targets_mean": 2678.6, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 6.370420624151968, |
| "grad_norm": 0.7374044504633019, |
| "learning_rate": 9.817990695050804e-07, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17541341483592987, |
| "step": 4695, |
| "valid_targets_mean": 3396.6, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 6.377204884667571, |
| "grad_norm": 0.8070797537585928, |
| "learning_rate": 9.60968456601472e-07, |
| "loss": 0.1721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17572826147079468, |
| "step": 4700, |
| "valid_targets_mean": 2604.2, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 6.383989145183175, |
| "grad_norm": 0.7275287979567348, |
| "learning_rate": 9.403557585474954e-07, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15313151478767395, |
| "step": 4705, |
| "valid_targets_mean": 2704.1, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 6.390773405698779, |
| "grad_norm": 0.8970798559467905, |
| "learning_rate": 9.199612112696843e-07, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1705400049686432, |
| "step": 4710, |
| "valid_targets_mean": 2101.6, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 6.397557666214382, |
| "grad_norm": 0.7536549104416713, |
| "learning_rate": 8.9978504819771e-07, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1547962725162506, |
| "step": 4715, |
| "valid_targets_mean": 2824.7, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 6.404341926729987, |
| "grad_norm": 0.8045187393820044, |
| "learning_rate": 8.798275002616785e-07, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17857302725315094, |
| "step": 4720, |
| "valid_targets_mean": 2904.6, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 6.41112618724559, |
| "grad_norm": 0.8644670987087135, |
| "learning_rate": 8.600887958894866e-07, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18547791242599487, |
| "step": 4725, |
| "valid_targets_mean": 2751.9, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 6.417910447761194, |
| "grad_norm": 0.8231644619228083, |
| "learning_rate": 8.4056916100423e-07, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16595998406410217, |
| "step": 4730, |
| "valid_targets_mean": 2423.4, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 6.424694708276798, |
| "grad_norm": 0.7911518564082718, |
| "learning_rate": 8.212688190215879e-07, |
| "loss": 0.1667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17415902018547058, |
| "step": 4735, |
| "valid_targets_mean": 2703.4, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 6.431478968792401, |
| "grad_norm": 0.8160726715736674, |
| "learning_rate": 8.021879908472962e-07, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18597552180290222, |
| "step": 4740, |
| "valid_targets_mean": 2784.6, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 6.4382632293080055, |
| "grad_norm": 0.7067244227602366, |
| "learning_rate": 7.833268948745854e-07, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16125139594078064, |
| "step": 4745, |
| "valid_targets_mean": 3260.1, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 6.445047489823609, |
| "grad_norm": 0.7408785373138851, |
| "learning_rate": 7.646857469817148e-07, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15260982513427734, |
| "step": 4750, |
| "valid_targets_mean": 2774.1, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 6.451831750339213, |
| "grad_norm": 0.6966270003794208, |
| "learning_rate": 7.462647605294849e-07, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.148808091878891, |
| "step": 4755, |
| "valid_targets_mean": 2975.9, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 6.458616010854817, |
| "grad_norm": 0.7126074027304123, |
| "learning_rate": 7.28064146358789e-07, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15134704113006592, |
| "step": 4760, |
| "valid_targets_mean": 3576.7, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 6.46540027137042, |
| "grad_norm": 0.8135549579243775, |
| "learning_rate": 7.100841127882119e-07, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1627068817615509, |
| "step": 4765, |
| "valid_targets_mean": 2379.0, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 6.4721845318860245, |
| "grad_norm": 0.6946858722656691, |
| "learning_rate": 6.9232486561164e-07, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15446284413337708, |
| "step": 4770, |
| "valid_targets_mean": 3180.2, |
| "valid_targets_min": 1145 |
| }, |
| { |
| "epoch": 6.478968792401628, |
| "grad_norm": 0.8707673966033334, |
| "learning_rate": 6.74786608095912e-07, |
| "loss": 0.1638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17315858602523804, |
| "step": 4775, |
| "valid_targets_mean": 2392.1, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 6.485753052917232, |
| "grad_norm": 0.7302574945303589, |
| "learning_rate": 6.574695409784792e-07, |
| "loss": 0.1674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1769123077392578, |
| "step": 4780, |
| "valid_targets_mean": 3501.0, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 6.492537313432836, |
| "grad_norm": 0.8695981905879026, |
| "learning_rate": 6.403738624651201e-07, |
| "loss": 0.1702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1758110076189041, |
| "step": 4785, |
| "valid_targets_mean": 2153.2, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 6.49932157394844, |
| "grad_norm": 0.6446530009894795, |
| "learning_rate": 6.234997682276711e-07, |
| "loss": 0.161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1484566032886505, |
| "step": 4790, |
| "valid_targets_mean": 3468.8, |
| "valid_targets_min": 1345 |
| }, |
| { |
| "epoch": 6.5061058344640434, |
| "grad_norm": 0.7063043963291199, |
| "learning_rate": 6.068474514017797e-07, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1765894889831543, |
| "step": 4795, |
| "valid_targets_mean": 3490.4, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 6.512890094979647, |
| "grad_norm": 0.8151482914810542, |
| "learning_rate": 5.904171025847016e-07, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16545557975769043, |
| "step": 4800, |
| "valid_targets_mean": 2565.6, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 6.519674355495251, |
| "grad_norm": 0.7173252334227114, |
| "learning_rate": 5.742089098331094e-07, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15513482689857483, |
| "step": 4805, |
| "valid_targets_mean": 3147.9, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 6.526458616010855, |
| "grad_norm": 0.744561572381357, |
| "learning_rate": 5.582230586609538e-07, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1628095507621765, |
| "step": 4810, |
| "valid_targets_mean": 2782.1, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 6.533242876526459, |
| "grad_norm": 0.9358406796473209, |
| "learning_rate": 5.424597320373259e-07, |
| "loss": 0.1728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18553614616394043, |
| "step": 4815, |
| "valid_targets_mean": 2122.8, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 6.540027137042062, |
| "grad_norm": 0.7762174577670051, |
| "learning_rate": 5.269191103843719e-07, |
| "loss": 0.1638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16511686146259308, |
| "step": 4820, |
| "valid_targets_mean": 2672.0, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 6.546811397557666, |
| "grad_norm": 0.683256793284698, |
| "learning_rate": 5.116013715752299e-07, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17595712840557098, |
| "step": 4825, |
| "valid_targets_mean": 3763.1, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 6.55359565807327, |
| "grad_norm": 0.7956506160614817, |
| "learning_rate": 4.965066909319837e-07, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17820480465888977, |
| "step": 4830, |
| "valid_targets_mean": 2759.7, |
| "valid_targets_min": 1292 |
| }, |
| { |
| "epoch": 6.560379918588874, |
| "grad_norm": 0.7587179233666759, |
| "learning_rate": 4.816352412236702e-07, |
| "loss": 0.1685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17972393333911896, |
| "step": 4835, |
| "valid_targets_mean": 2840.0, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 6.567164179104478, |
| "grad_norm": 0.7306219090534811, |
| "learning_rate": 4.669871926642877e-07, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15142644941806793, |
| "step": 4840, |
| "valid_targets_mean": 3011.1, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 6.573948439620081, |
| "grad_norm": 0.8468764362506153, |
| "learning_rate": 4.5256271291085785e-07, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16415920853614807, |
| "step": 4845, |
| "valid_targets_mean": 2226.1, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 6.580732700135686, |
| "grad_norm": 0.7218042166118971, |
| "learning_rate": 4.3836196706150026e-07, |
| "loss": 0.1591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14739587903022766, |
| "step": 4850, |
| "valid_targets_mean": 3025.1, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 6.587516960651289, |
| "grad_norm": 0.7548311142057721, |
| "learning_rate": 4.243851176535474e-07, |
| "loss": 0.1685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1665259748697281, |
| "step": 4855, |
| "valid_targets_mean": 2818.0, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 6.5943012211668925, |
| "grad_norm": 0.7611024739102207, |
| "learning_rate": 4.106323246616817e-07, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15098467469215393, |
| "step": 4860, |
| "valid_targets_mean": 3311.1, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 6.601085481682497, |
| "grad_norm": 0.8170024951749895, |
| "learning_rate": 3.971037454961058e-07, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1671171486377716, |
| "step": 4865, |
| "valid_targets_mean": 2565.4, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 6.6078697421981, |
| "grad_norm": 0.7074879855210716, |
| "learning_rate": 3.8379953500074617e-07, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1538231521844864, |
| "step": 4870, |
| "valid_targets_mean": 3038.6, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 6.614654002713705, |
| "grad_norm": 0.7784406456308786, |
| "learning_rate": 3.7071984545146157e-07, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17332404851913452, |
| "step": 4875, |
| "valid_targets_mean": 2704.2, |
| "valid_targets_min": 1374 |
| }, |
| { |
| "epoch": 6.621438263229308, |
| "grad_norm": 0.7707976870962088, |
| "learning_rate": 3.578648265543261e-07, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15194040536880493, |
| "step": 4880, |
| "valid_targets_mean": 2598.7, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 6.6282225237449115, |
| "grad_norm": 0.7794811748817996, |
| "learning_rate": 3.4523462544389987e-07, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1765557825565338, |
| "step": 4885, |
| "valid_targets_mean": 2984.3, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 6.635006784260516, |
| "grad_norm": 0.7299801758059727, |
| "learning_rate": 3.328293866815435e-07, |
| "loss": 0.1591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16560907661914825, |
| "step": 4890, |
| "valid_targets_mean": 3176.7, |
| "valid_targets_min": 1444 |
| }, |
| { |
| "epoch": 6.641791044776119, |
| "grad_norm": 0.8430277934827622, |
| "learning_rate": 3.2064925225377297e-07, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1819601058959961, |
| "step": 4895, |
| "valid_targets_mean": 2420.4, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 6.648575305291724, |
| "grad_norm": 0.8143191944576621, |
| "learning_rate": 3.086943615706295e-07, |
| "loss": 0.1743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18464431166648865, |
| "step": 4900, |
| "valid_targets_mean": 2860.9, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 6.655359565807327, |
| "grad_norm": 0.7808926512242406, |
| "learning_rate": 2.969648514640855e-07, |
| "loss": 0.1637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17209918797016144, |
| "step": 4905, |
| "valid_targets_mean": 2871.8, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 6.6621438263229305, |
| "grad_norm": 0.7932529850799425, |
| "learning_rate": 2.854608561864702e-07, |
| "loss": 0.1641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17645207047462463, |
| "step": 4910, |
| "valid_targets_mean": 2660.2, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 6.668928086838535, |
| "grad_norm": 0.92065568822347, |
| "learning_rate": 2.7418250740895325e-07, |
| "loss": 0.1685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19371803104877472, |
| "step": 4915, |
| "valid_targets_mean": 2207.4, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 6.675712347354138, |
| "grad_norm": 0.6839393586837104, |
| "learning_rate": 2.6312993422001e-07, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17107108235359192, |
| "step": 4920, |
| "valid_targets_mean": 3477.2, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 6.6824966078697425, |
| "grad_norm": 0.710980917983464, |
| "learning_rate": 2.5230326312397193e-07, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1745888739824295, |
| "step": 4925, |
| "valid_targets_mean": 3478.5, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 6.689280868385346, |
| "grad_norm": 0.7823508117950982, |
| "learning_rate": 2.417026180395476e-07, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15715618431568146, |
| "step": 4930, |
| "valid_targets_mean": 2545.1, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 6.696065128900949, |
| "grad_norm": 0.7659619371709346, |
| "learning_rate": 2.3132812029844187e-07, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14484542608261108, |
| "step": 4935, |
| "valid_targets_mean": 2404.1, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 6.702849389416554, |
| "grad_norm": 0.7229493539815992, |
| "learning_rate": 2.2117988864393424e-07, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15829598903656006, |
| "step": 4940, |
| "valid_targets_mean": 3077.1, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 6.709633649932157, |
| "grad_norm": 0.7896285355647491, |
| "learning_rate": 2.112580392295338e-07, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17784717679023743, |
| "step": 4945, |
| "valid_targets_mean": 2630.4, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 6.7164179104477615, |
| "grad_norm": 0.9253668056101276, |
| "learning_rate": 2.015626856176578e-07, |
| "loss": 0.1674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16507627069950104, |
| "step": 4950, |
| "valid_targets_mean": 2150.9, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 6.723202170963365, |
| "grad_norm": 0.8173264202820435, |
| "learning_rate": 1.9209393877831273e-07, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18161508440971375, |
| "step": 4955, |
| "valid_targets_mean": 2604.2, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 6.729986431478968, |
| "grad_norm": 0.7523430361745242, |
| "learning_rate": 1.8285190708783984e-07, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1569797694683075, |
| "step": 4960, |
| "valid_targets_mean": 2848.9, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 6.736770691994573, |
| "grad_norm": 0.7772846302429779, |
| "learning_rate": 1.7383669632766276e-07, |
| "loss": 0.1725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17585310339927673, |
| "step": 4965, |
| "valid_targets_mean": 2752.7, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 6.743554952510176, |
| "grad_norm": 0.9312669800652025, |
| "learning_rate": 1.6504840968309288e-07, |
| "loss": 0.1774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16369280219078064, |
| "step": 4970, |
| "valid_targets_mean": 2244.8, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 6.75033921302578, |
| "grad_norm": 0.740973564771969, |
| "learning_rate": 1.5648714774213037e-07, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16859431564807892, |
| "step": 4975, |
| "valid_targets_mean": 3112.4, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 6.757123473541384, |
| "grad_norm": 0.800910909512139, |
| "learning_rate": 1.4815300849432278e-07, |
| "loss": 0.1645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1737082302570343, |
| "step": 4980, |
| "valid_targets_mean": 2754.4, |
| "valid_targets_min": 1617 |
| }, |
| { |
| "epoch": 6.763907734056987, |
| "grad_norm": 0.725161307786821, |
| "learning_rate": 1.400460873296461e-07, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16292381286621094, |
| "step": 4985, |
| "valid_targets_mean": 3145.3, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 6.770691994572592, |
| "grad_norm": 0.8381499766215631, |
| "learning_rate": 1.3216647703740315e-07, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18227586150169373, |
| "step": 4990, |
| "valid_targets_mean": 2443.8, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 6.777476255088195, |
| "grad_norm": 0.8004952099912124, |
| "learning_rate": 1.2451426780517363e-07, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17602723836898804, |
| "step": 4995, |
| "valid_targets_mean": 2544.9, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 6.784260515603799, |
| "grad_norm": 0.8175798384888614, |
| "learning_rate": 1.1708954721776355e-07, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15319892764091492, |
| "step": 5000, |
| "valid_targets_mean": 3087.2, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 6.791044776119403, |
| "grad_norm": 0.8311080394214818, |
| "learning_rate": 1.0989240025622627e-07, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1745099425315857, |
| "step": 5005, |
| "valid_targets_mean": 2356.4, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 6.797829036635007, |
| "grad_norm": 0.765582281484442, |
| "learning_rate": 1.0292290929687421e-07, |
| "loss": 0.1598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15547017753124237, |
| "step": 5010, |
| "valid_targets_mean": 2607.4, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 6.804613297150611, |
| "grad_norm": 0.8814252430063856, |
| "learning_rate": 9.618115411033524e-08, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16623856127262115, |
| "step": 5015, |
| "valid_targets_mean": 2101.0, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 6.811397557666214, |
| "grad_norm": 0.7599170245144763, |
| "learning_rate": 8.966721186065341e-08, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1648900806903839, |
| "step": 5020, |
| "valid_targets_mean": 2629.4, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 6.818181818181818, |
| "grad_norm": 0.6566181393738637, |
| "learning_rate": 8.338115710438744e-08, |
| "loss": 0.1743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1621677428483963, |
| "step": 5025, |
| "valid_targets_mean": 3358.0, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 6.824966078697422, |
| "grad_norm": 0.7442894660376455, |
| "learning_rate": 7.732306178977134e-08, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1600368767976761, |
| "step": 5030, |
| "valid_targets_mean": 3117.9, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 6.831750339213026, |
| "grad_norm": 0.7314337251400312, |
| "learning_rate": 7.149299525588405e-08, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1598661243915558, |
| "step": 5035, |
| "valid_targets_mean": 2865.1, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 6.8385345997286295, |
| "grad_norm": 0.712971911902212, |
| "learning_rate": 6.58910242318611e-08, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1687866449356079, |
| "step": 5040, |
| "valid_targets_mean": 3268.2, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 6.845318860244234, |
| "grad_norm": 0.7170233413590963, |
| "learning_rate": 6.051721283612422e-08, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16001065075397491, |
| "step": 5045, |
| "valid_targets_mean": 3043.4, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 6.852103120759837, |
| "grad_norm": 0.8748422499637547, |
| "learning_rate": 5.537162257565065e-08, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17490287125110626, |
| "step": 5050, |
| "valid_targets_mean": 2234.8, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 6.858887381275441, |
| "grad_norm": 0.7527414733725077, |
| "learning_rate": 5.045431234527165e-08, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17598162591457367, |
| "step": 5055, |
| "valid_targets_mean": 3049.6, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 6.865671641791045, |
| "grad_norm": 0.750418327168722, |
| "learning_rate": 4.576533842699294e-08, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1612885594367981, |
| "step": 5060, |
| "valid_targets_mean": 2946.2, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 6.8724559023066485, |
| "grad_norm": 0.8234037034287423, |
| "learning_rate": 4.1304754489359666e-08, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15995310246944427, |
| "step": 5065, |
| "valid_targets_mean": 2353.8, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 6.879240162822253, |
| "grad_norm": 0.8151052308072695, |
| "learning_rate": 3.707261158682807e-08, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16730859875679016, |
| "step": 5070, |
| "valid_targets_mean": 2366.6, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 6.886024423337856, |
| "grad_norm": 0.794569340466791, |
| "learning_rate": 3.306895815919475e-08, |
| "loss": 0.1614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17812877893447876, |
| "step": 5075, |
| "valid_targets_mean": 2787.9, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 6.89280868385346, |
| "grad_norm": 0.6779205812201277, |
| "learning_rate": 2.929384003103497e-08, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1553945243358612, |
| "step": 5080, |
| "valid_targets_mean": 3201.9, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 6.899592944369064, |
| "grad_norm": 0.7802177039337713, |
| "learning_rate": 2.5747300411180787e-08, |
| "loss": 0.1687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16561156511306763, |
| "step": 5085, |
| "valid_targets_mean": 2595.4, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 6.906377204884667, |
| "grad_norm": 0.811535089999137, |
| "learning_rate": 2.2429379892221493e-08, |
| "loss": 0.1713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1710594892501831, |
| "step": 5090, |
| "valid_targets_mean": 2819.6, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 6.913161465400272, |
| "grad_norm": 0.7976488997817401, |
| "learning_rate": 1.9340116450050628e-08, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1631883978843689, |
| "step": 5095, |
| "valid_targets_mean": 2428.8, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 6.919945725915875, |
| "grad_norm": 0.8090475833391716, |
| "learning_rate": 1.6479545443415236e-08, |
| "loss": 0.1643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1432981789112091, |
| "step": 5100, |
| "valid_targets_mean": 2219.2, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 6.926729986431479, |
| "grad_norm": 0.682864252053581, |
| "learning_rate": 1.3847699613527276e-08, |
| "loss": 0.1572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1406230330467224, |
| "step": 5105, |
| "valid_targets_mean": 2982.7, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 6.933514246947083, |
| "grad_norm": 0.6898488676376657, |
| "learning_rate": 1.1444609083675062e-08, |
| "loss": 0.1682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1759582757949829, |
| "step": 5110, |
| "valid_targets_mean": 3367.1, |
| "valid_targets_min": 1487 |
| }, |
| { |
| "epoch": 6.940298507462686, |
| "grad_norm": 0.7796796211939258, |
| "learning_rate": 9.270301358890177e-09, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1705056130886078, |
| "step": 5115, |
| "valid_targets_mean": 2493.1, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 6.947082767978291, |
| "grad_norm": 1.019436094106403, |
| "learning_rate": 7.324801325621078e-09, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1720581352710724, |
| "step": 5120, |
| "valid_targets_mean": 2621.9, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 6.953867028493894, |
| "grad_norm": 0.7032830768741243, |
| "learning_rate": 5.6081312514599805e-09, |
| "loss": 0.1614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14902475476264954, |
| "step": 5125, |
| "valid_targets_mean": 3147.9, |
| "valid_targets_min": 1474 |
| }, |
| { |
| "epoch": 6.960651289009498, |
| "grad_norm": 0.7432217757535253, |
| "learning_rate": 4.120310784878623e-09, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1647299975156784, |
| "step": 5130, |
| "valid_targets_mean": 2841.1, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 6.967435549525102, |
| "grad_norm": 0.7089666153527104, |
| "learning_rate": 2.861356955008443e-09, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19622814655303955, |
| "step": 5135, |
| "valid_targets_mean": 3448.8, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 6.974219810040705, |
| "grad_norm": 0.9344960536682286, |
| "learning_rate": 1.8312841714474005e-09, |
| "loss": 0.1624, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16499242186546326, |
| "step": 5140, |
| "valid_targets_mean": 2747.8, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 6.98100407055631, |
| "grad_norm": 0.7980431188161958, |
| "learning_rate": 1.030104224086781e-09, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15351396799087524, |
| "step": 5145, |
| "valid_targets_mean": 2372.8, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 6.987788331071913, |
| "grad_norm": 0.6998390532387075, |
| "learning_rate": 4.578262829846303e-10, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1696673333644867, |
| "step": 5150, |
| "valid_targets_mean": 3469.1, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 6.9945725915875165, |
| "grad_norm": 0.7592131753298821, |
| "learning_rate": 1.1445689825473339e-10, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16776353120803833, |
| "step": 5155, |
| "valid_targets_mean": 2719.2, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16736872494220734, |
| "step": 5159, |
| "total_flos": 1027340714311680.0, |
| "train_loss": 0.24267188053672734, |
| "train_runtime": 23911.9379, |
| "train_samples_per_second": 3.449, |
| "train_steps_per_second": 0.216, |
| "valid_targets_mean": 2441.9, |
| "valid_targets_min": 1168 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 5159, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 200, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1027340714311680.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|