| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4389, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.007974481658692184, |
| "grad_norm": 19.08310269585043, |
| "learning_rate": 3.644646924829157e-07, |
| "loss": 0.7989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.8064001798629761, |
| "step": 5, |
| "valid_targets_mean": 3405.2, |
| "valid_targets_min": 1804 |
| }, |
| { |
| "epoch": 0.01594896331738437, |
| "grad_norm": 18.15244545055453, |
| "learning_rate": 8.200455580865605e-07, |
| "loss": 0.7787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7641298174858093, |
| "step": 10, |
| "valid_targets_mean": 2772.0, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 0.023923444976076555, |
| "grad_norm": 13.672484690698322, |
| "learning_rate": 1.2756264236902052e-06, |
| "loss": 0.7357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6846181154251099, |
| "step": 15, |
| "valid_targets_mean": 3543.5, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 0.03189792663476874, |
| "grad_norm": 12.741705912118789, |
| "learning_rate": 1.7312072892938498e-06, |
| "loss": 0.7002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6495967507362366, |
| "step": 20, |
| "valid_targets_mean": 3172.8, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 0.03987240829346093, |
| "grad_norm": 8.796778470910523, |
| "learning_rate": 2.1867881548974945e-06, |
| "loss": 0.6617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5894312262535095, |
| "step": 25, |
| "valid_targets_mean": 3213.4, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 0.04784688995215311, |
| "grad_norm": 5.349177988575253, |
| "learning_rate": 2.642369020501139e-06, |
| "loss": 0.6311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6095372438430786, |
| "step": 30, |
| "valid_targets_mean": 3185.8, |
| "valid_targets_min": 1198 |
| }, |
| { |
| "epoch": 0.05582137161084529, |
| "grad_norm": 3.3314893539168238, |
| "learning_rate": 3.0979498861047843e-06, |
| "loss": 0.5367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4944782853126526, |
| "step": 35, |
| "valid_targets_mean": 2579.5, |
| "valid_targets_min": 376 |
| }, |
| { |
| "epoch": 0.06379585326953748, |
| "grad_norm": 2.4005782583446984, |
| "learning_rate": 3.5535307517084285e-06, |
| "loss": 0.5448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5224937200546265, |
| "step": 40, |
| "valid_targets_mean": 2636.4, |
| "valid_targets_min": 1297 |
| }, |
| { |
| "epoch": 0.07177033492822966, |
| "grad_norm": 1.3723814844051554, |
| "learning_rate": 4.009111617312073e-06, |
| "loss": 0.478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4328991770744324, |
| "step": 45, |
| "valid_targets_mean": 3519.6, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 0.07974481658692185, |
| "grad_norm": 1.3026590573106005, |
| "learning_rate": 4.464692482915718e-06, |
| "loss": 0.5271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4638175070285797, |
| "step": 50, |
| "valid_targets_mean": 2428.6, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 0.08771929824561403, |
| "grad_norm": 1.2999173286453858, |
| "learning_rate": 4.920273348519363e-06, |
| "loss": 0.4904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5091861486434937, |
| "step": 55, |
| "valid_targets_mean": 2451.5, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 0.09569377990430622, |
| "grad_norm": 0.911171533209259, |
| "learning_rate": 5.375854214123008e-06, |
| "loss": 0.4631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4018824100494385, |
| "step": 60, |
| "valid_targets_mean": 2899.0, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 0.10366826156299841, |
| "grad_norm": 0.9137218681759303, |
| "learning_rate": 5.831435079726651e-06, |
| "loss": 0.4235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4257986545562744, |
| "step": 65, |
| "valid_targets_mean": 2692.9, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 0.11164274322169059, |
| "grad_norm": 0.7940217799338982, |
| "learning_rate": 6.287015945330297e-06, |
| "loss": 0.3964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3876068592071533, |
| "step": 70, |
| "valid_targets_mean": 2944.8, |
| "valid_targets_min": 986 |
| }, |
| { |
| "epoch": 0.11961722488038277, |
| "grad_norm": 0.8646607237411834, |
| "learning_rate": 6.742596810933942e-06, |
| "loss": 0.4214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3561863303184509, |
| "step": 75, |
| "valid_targets_mean": 2176.2, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 0.12759170653907495, |
| "grad_norm": 0.7019349077333937, |
| "learning_rate": 7.1981776765375854e-06, |
| "loss": 0.3958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36579617857933044, |
| "step": 80, |
| "valid_targets_mean": 3109.9, |
| "valid_targets_min": 1427 |
| }, |
| { |
| "epoch": 0.13556618819776714, |
| "grad_norm": 0.776844100371323, |
| "learning_rate": 7.65375854214123e-06, |
| "loss": 0.4248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3523101508617401, |
| "step": 85, |
| "valid_targets_mean": 2283.4, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 0.14354066985645933, |
| "grad_norm": 0.7814197273845711, |
| "learning_rate": 8.109339407744875e-06, |
| "loss": 0.3677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36872315406799316, |
| "step": 90, |
| "valid_targets_mean": 2170.3, |
| "valid_targets_min": 1321 |
| }, |
| { |
| "epoch": 0.15151515151515152, |
| "grad_norm": 0.6933045488358227, |
| "learning_rate": 8.564920273348521e-06, |
| "loss": 0.3791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3503817319869995, |
| "step": 95, |
| "valid_targets_mean": 2544.8, |
| "valid_targets_min": 1054 |
| }, |
| { |
| "epoch": 0.1594896331738437, |
| "grad_norm": 0.7344042311376202, |
| "learning_rate": 9.020501138952164e-06, |
| "loss": 0.4041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36823010444641113, |
| "step": 100, |
| "valid_targets_mean": 2677.9, |
| "valid_targets_min": 1397 |
| }, |
| { |
| "epoch": 0.1674641148325359, |
| "grad_norm": 0.8885061382631938, |
| "learning_rate": 9.47608200455581e-06, |
| "loss": 0.3574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37888795137405396, |
| "step": 105, |
| "valid_targets_mean": 2963.9, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 0.17543859649122806, |
| "grad_norm": 0.7040180595260014, |
| "learning_rate": 9.931662870159453e-06, |
| "loss": 0.3907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4308871626853943, |
| "step": 110, |
| "valid_targets_mean": 2947.4, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 0.18341307814992025, |
| "grad_norm": 0.6704086894938297, |
| "learning_rate": 1.03872437357631e-05, |
| "loss": 0.3819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.374492347240448, |
| "step": 115, |
| "valid_targets_mean": 2938.1, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 0.19138755980861244, |
| "grad_norm": 0.7460794224492051, |
| "learning_rate": 1.0842824601366744e-05, |
| "loss": 0.3688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3808710277080536, |
| "step": 120, |
| "valid_targets_mean": 2539.7, |
| "valid_targets_min": 862 |
| }, |
| { |
| "epoch": 0.19936204146730463, |
| "grad_norm": 0.7530056967637131, |
| "learning_rate": 1.1298405466970387e-05, |
| "loss": 0.3658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38335102796554565, |
| "step": 125, |
| "valid_targets_mean": 2847.5, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 0.20733652312599682, |
| "grad_norm": 0.6712559232045431, |
| "learning_rate": 1.1753986332574032e-05, |
| "loss": 0.3667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37891942262649536, |
| "step": 130, |
| "valid_targets_mean": 3401.6, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 0.215311004784689, |
| "grad_norm": 0.6836972272176005, |
| "learning_rate": 1.2209567198177677e-05, |
| "loss": 0.3686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41928017139434814, |
| "step": 135, |
| "valid_targets_mean": 3157.6, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 0.22328548644338117, |
| "grad_norm": 0.6997393115915425, |
| "learning_rate": 1.2665148063781323e-05, |
| "loss": 0.3738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34178513288497925, |
| "step": 140, |
| "valid_targets_mean": 2723.2, |
| "valid_targets_min": 1371 |
| }, |
| { |
| "epoch": 0.23125996810207336, |
| "grad_norm": 0.7360428127205939, |
| "learning_rate": 1.3120728929384968e-05, |
| "loss": 0.3395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.336765855550766, |
| "step": 145, |
| "valid_targets_mean": 2483.8, |
| "valid_targets_min": 1296 |
| }, |
| { |
| "epoch": 0.23923444976076555, |
| "grad_norm": 0.6300114527878021, |
| "learning_rate": 1.357630979498861e-05, |
| "loss": 0.3264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3560517430305481, |
| "step": 150, |
| "valid_targets_mean": 3368.4, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 0.24720893141945774, |
| "grad_norm": 0.7089495360173708, |
| "learning_rate": 1.4031890660592255e-05, |
| "loss": 0.3514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37352272868156433, |
| "step": 155, |
| "valid_targets_mean": 3006.2, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 0.2551834130781499, |
| "grad_norm": 0.6816824704537204, |
| "learning_rate": 1.4487471526195902e-05, |
| "loss": 0.3268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31338217854499817, |
| "step": 160, |
| "valid_targets_mean": 2765.8, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 0.2631578947368421, |
| "grad_norm": 0.6672669398637605, |
| "learning_rate": 1.4943052391799546e-05, |
| "loss": 0.3408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3209226131439209, |
| "step": 165, |
| "valid_targets_mean": 3222.7, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 0.2711323763955343, |
| "grad_norm": 0.7103134650450313, |
| "learning_rate": 1.539863325740319e-05, |
| "loss": 0.3101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3130913972854614, |
| "step": 170, |
| "valid_targets_mean": 2424.1, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 0.27910685805422647, |
| "grad_norm": 0.8003799128827424, |
| "learning_rate": 1.5854214123006836e-05, |
| "loss": 0.293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27181631326675415, |
| "step": 175, |
| "valid_targets_mean": 2400.7, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 0.28708133971291866, |
| "grad_norm": 0.6232480405624014, |
| "learning_rate": 1.630979498861048e-05, |
| "loss": 0.3295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3603177070617676, |
| "step": 180, |
| "valid_targets_mean": 3960.4, |
| "valid_targets_min": 1658 |
| }, |
| { |
| "epoch": 0.29505582137161085, |
| "grad_norm": 0.7699746809628365, |
| "learning_rate": 1.6765375854214125e-05, |
| "loss": 0.3568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31741786003112793, |
| "step": 185, |
| "valid_targets_mean": 2706.6, |
| "valid_targets_min": 1017 |
| }, |
| { |
| "epoch": 0.30303030303030304, |
| "grad_norm": 0.6458959798755932, |
| "learning_rate": 1.722095671981777e-05, |
| "loss": 0.301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3305377960205078, |
| "step": 190, |
| "valid_targets_mean": 3139.9, |
| "valid_targets_min": 1204 |
| }, |
| { |
| "epoch": 0.31100478468899523, |
| "grad_norm": 0.716800670588027, |
| "learning_rate": 1.7676537585421415e-05, |
| "loss": 0.3094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34545591473579407, |
| "step": 195, |
| "valid_targets_mean": 2778.2, |
| "valid_targets_min": 1294 |
| }, |
| { |
| "epoch": 0.3189792663476874, |
| "grad_norm": 0.7022017213023772, |
| "learning_rate": 1.813211845102506e-05, |
| "loss": 0.3211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39925310015678406, |
| "step": 200, |
| "valid_targets_mean": 3597.8, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 0.3269537480063796, |
| "grad_norm": 0.6415795025905041, |
| "learning_rate": 1.8587699316628704e-05, |
| "loss": 0.3136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29438742995262146, |
| "step": 205, |
| "valid_targets_mean": 3129.2, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 0.3349282296650718, |
| "grad_norm": 0.7778916243584333, |
| "learning_rate": 1.904328018223235e-05, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26425981521606445, |
| "step": 210, |
| "valid_targets_mean": 2129.7, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 0.34290271132376393, |
| "grad_norm": 0.6219565329305242, |
| "learning_rate": 1.9498861047835993e-05, |
| "loss": 0.3174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4421326518058777, |
| "step": 215, |
| "valid_targets_mean": 3950.2, |
| "valid_targets_min": 1277 |
| }, |
| { |
| "epoch": 0.3508771929824561, |
| "grad_norm": 0.785836372040567, |
| "learning_rate": 1.9954441913439638e-05, |
| "loss": 0.29, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34666532278060913, |
| "step": 220, |
| "valid_targets_mean": 2993.6, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 0.3588516746411483, |
| "grad_norm": 0.746881160297121, |
| "learning_rate": 2.0410022779043283e-05, |
| "loss": 0.3313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.286319375038147, |
| "step": 225, |
| "valid_targets_mean": 2257.7, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 0.3668261562998405, |
| "grad_norm": 0.7507845800604592, |
| "learning_rate": 2.0865603644646927e-05, |
| "loss": 0.3111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33375227451324463, |
| "step": 230, |
| "valid_targets_mean": 2517.9, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 0.3748006379585327, |
| "grad_norm": 0.6392812481173415, |
| "learning_rate": 2.1321184510250572e-05, |
| "loss": 0.298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36269882321357727, |
| "step": 235, |
| "valid_targets_mean": 3927.3, |
| "valid_targets_min": 1231 |
| }, |
| { |
| "epoch": 0.3827751196172249, |
| "grad_norm": 0.7350944642779489, |
| "learning_rate": 2.1776765375854217e-05, |
| "loss": 0.2944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2749019265174866, |
| "step": 240, |
| "valid_targets_mean": 2795.9, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 0.39074960127591707, |
| "grad_norm": 0.6799973116920671, |
| "learning_rate": 2.223234624145786e-05, |
| "loss": 0.328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3284507989883423, |
| "step": 245, |
| "valid_targets_mean": 3278.3, |
| "valid_targets_min": 1179 |
| }, |
| { |
| "epoch": 0.39872408293460926, |
| "grad_norm": 0.6937881723620776, |
| "learning_rate": 2.2687927107061506e-05, |
| "loss": 0.2755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26359331607818604, |
| "step": 250, |
| "valid_targets_mean": 2635.9, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 0.40669856459330145, |
| "grad_norm": 0.6768083264850395, |
| "learning_rate": 2.314350797266515e-05, |
| "loss": 0.3128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2547405958175659, |
| "step": 255, |
| "valid_targets_mean": 2782.8, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 0.41467304625199364, |
| "grad_norm": 0.6577985129097631, |
| "learning_rate": 2.3599088838268792e-05, |
| "loss": 0.273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27426400780677795, |
| "step": 260, |
| "valid_targets_mean": 2750.0, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 0.4226475279106858, |
| "grad_norm": 0.682947460712769, |
| "learning_rate": 2.4054669703872436e-05, |
| "loss": 0.285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30281588435173035, |
| "step": 265, |
| "valid_targets_mean": 3342.2, |
| "valid_targets_min": 1294 |
| }, |
| { |
| "epoch": 0.430622009569378, |
| "grad_norm": 0.746329268810735, |
| "learning_rate": 2.4510250569476085e-05, |
| "loss": 0.285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27677425742149353, |
| "step": 270, |
| "valid_targets_mean": 2662.0, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 0.43859649122807015, |
| "grad_norm": 0.6987593054550297, |
| "learning_rate": 2.496583143507973e-05, |
| "loss": 0.3044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29885128140449524, |
| "step": 275, |
| "valid_targets_mean": 2668.7, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 0.44657097288676234, |
| "grad_norm": 0.7260544620953092, |
| "learning_rate": 2.5421412300683374e-05, |
| "loss": 0.2868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29124659299850464, |
| "step": 280, |
| "valid_targets_mean": 2561.8, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 0.45454545454545453, |
| "grad_norm": 0.7281604766084092, |
| "learning_rate": 2.587699316628702e-05, |
| "loss": 0.2721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2808125615119934, |
| "step": 285, |
| "valid_targets_mean": 2608.4, |
| "valid_targets_min": 1218 |
| }, |
| { |
| "epoch": 0.4625199362041467, |
| "grad_norm": 0.7025214327060316, |
| "learning_rate": 2.6332574031890663e-05, |
| "loss": 0.2878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31319329142570496, |
| "step": 290, |
| "valid_targets_mean": 2582.1, |
| "valid_targets_min": 1187 |
| }, |
| { |
| "epoch": 0.4704944178628389, |
| "grad_norm": 0.7856192992209702, |
| "learning_rate": 2.6788154897494308e-05, |
| "loss": 0.2823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27091526985168457, |
| "step": 295, |
| "valid_targets_mean": 2811.6, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 0.4784688995215311, |
| "grad_norm": 0.7108315007493442, |
| "learning_rate": 2.7243735763097953e-05, |
| "loss": 0.3031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3215833902359009, |
| "step": 300, |
| "valid_targets_mean": 2883.8, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 0.4864433811802233, |
| "grad_norm": 0.7748559874677846, |
| "learning_rate": 2.7699316628701597e-05, |
| "loss": 0.2579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22398757934570312, |
| "step": 305, |
| "valid_targets_mean": 2005.8, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 0.4944178628389155, |
| "grad_norm": 0.7462878729201242, |
| "learning_rate": 2.815489749430524e-05, |
| "loss": 0.3319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33022865653038025, |
| "step": 310, |
| "valid_targets_mean": 2705.2, |
| "valid_targets_min": 248 |
| }, |
| { |
| "epoch": 0.5023923444976076, |
| "grad_norm": 0.7802542037539941, |
| "learning_rate": 2.8610478359908883e-05, |
| "loss": 0.2839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23213829100131989, |
| "step": 315, |
| "valid_targets_mean": 2407.5, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 0.5103668261562998, |
| "grad_norm": 0.7649747995292412, |
| "learning_rate": 2.906605922551253e-05, |
| "loss": 0.2961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3233932852745056, |
| "step": 320, |
| "valid_targets_mean": 2915.9, |
| "valid_targets_min": 1207 |
| }, |
| { |
| "epoch": 0.518341307814992, |
| "grad_norm": 0.7978888829804283, |
| "learning_rate": 2.9521640091116176e-05, |
| "loss": 0.276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22950753569602966, |
| "step": 325, |
| "valid_targets_mean": 2392.1, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 0.5263157894736842, |
| "grad_norm": 0.7437520517670876, |
| "learning_rate": 2.997722095671982e-05, |
| "loss": 0.2964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2997945249080658, |
| "step": 330, |
| "valid_targets_mean": 3249.1, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 0.5342902711323764, |
| "grad_norm": 0.6657204266063321, |
| "learning_rate": 3.0432801822323465e-05, |
| "loss": 0.2606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29147499799728394, |
| "step": 335, |
| "valid_targets_mean": 3084.5, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 0.5422647527910686, |
| "grad_norm": 0.605457899238917, |
| "learning_rate": 3.088838268792711e-05, |
| "loss": 0.2629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23867332935333252, |
| "step": 340, |
| "valid_targets_mean": 3086.1, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 0.5502392344497608, |
| "grad_norm": 0.677848238624908, |
| "learning_rate": 3.1343963553530755e-05, |
| "loss": 0.2957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3328245282173157, |
| "step": 345, |
| "valid_targets_mean": 2985.1, |
| "valid_targets_min": 1422 |
| }, |
| { |
| "epoch": 0.5582137161084529, |
| "grad_norm": 0.6938963916271617, |
| "learning_rate": 3.17995444191344e-05, |
| "loss": 0.2893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2992449998855591, |
| "step": 350, |
| "valid_targets_mean": 3391.4, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 0.5661881977671451, |
| "grad_norm": 0.6671036083494569, |
| "learning_rate": 3.2255125284738044e-05, |
| "loss": 0.2639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.261359304189682, |
| "step": 355, |
| "valid_targets_mean": 2705.2, |
| "valid_targets_min": 1199 |
| }, |
| { |
| "epoch": 0.5741626794258373, |
| "grad_norm": 0.641793075175834, |
| "learning_rate": 3.271070615034169e-05, |
| "loss": 0.2563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2564861476421356, |
| "step": 360, |
| "valid_targets_mean": 3231.8, |
| "valid_targets_min": 1258 |
| }, |
| { |
| "epoch": 0.5821371610845295, |
| "grad_norm": 0.6260519357718421, |
| "learning_rate": 3.316628701594533e-05, |
| "loss": 0.2795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29788124561309814, |
| "step": 365, |
| "valid_targets_mean": 3343.8, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 0.5901116427432217, |
| "grad_norm": 0.7016875050444317, |
| "learning_rate": 3.362186788154898e-05, |
| "loss": 0.2625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23810943961143494, |
| "step": 370, |
| "valid_targets_mean": 2345.8, |
| "valid_targets_min": 1102 |
| }, |
| { |
| "epoch": 0.5980861244019139, |
| "grad_norm": 0.6940263992622621, |
| "learning_rate": 3.407744874715262e-05, |
| "loss": 0.2589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.239394873380661, |
| "step": 375, |
| "valid_targets_mean": 2608.0, |
| "valid_targets_min": 1286 |
| }, |
| { |
| "epoch": 0.6060606060606061, |
| "grad_norm": 0.7346814637270078, |
| "learning_rate": 3.453302961275627e-05, |
| "loss": 0.2878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3815971612930298, |
| "step": 380, |
| "valid_targets_mean": 3218.8, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 0.6140350877192983, |
| "grad_norm": 0.6058315721294318, |
| "learning_rate": 3.498861047835991e-05, |
| "loss": 0.2755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2890080213546753, |
| "step": 385, |
| "valid_targets_mean": 3851.6, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 0.6220095693779905, |
| "grad_norm": 0.7023734773136625, |
| "learning_rate": 3.5444191343963557e-05, |
| "loss": 0.2706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30273354053497314, |
| "step": 390, |
| "valid_targets_mean": 2969.1, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 0.6299840510366826, |
| "grad_norm": 1.4920526075234164, |
| "learning_rate": 3.58997722095672e-05, |
| "loss": 0.2762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22971850633621216, |
| "step": 395, |
| "valid_targets_mean": 2233.4, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 0.6379585326953748, |
| "grad_norm": 0.6703882371109363, |
| "learning_rate": 3.6355353075170846e-05, |
| "loss": 0.2807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30465108156204224, |
| "step": 400, |
| "valid_targets_mean": 2949.6, |
| "valid_targets_min": 1207 |
| }, |
| { |
| "epoch": 0.645933014354067, |
| "grad_norm": 0.6301067583808945, |
| "learning_rate": 3.681093394077449e-05, |
| "loss": 0.2557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2273084968328476, |
| "step": 405, |
| "valid_targets_mean": 2778.0, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 0.6539074960127592, |
| "grad_norm": 0.7296897171202118, |
| "learning_rate": 3.7266514806378135e-05, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27479881048202515, |
| "step": 410, |
| "valid_targets_mean": 2959.2, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 0.6618819776714514, |
| "grad_norm": 0.6281384576410912, |
| "learning_rate": 3.772209567198178e-05, |
| "loss": 0.2755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25720399618148804, |
| "step": 415, |
| "valid_targets_mean": 3779.6, |
| "valid_targets_min": 1287 |
| }, |
| { |
| "epoch": 0.6698564593301436, |
| "grad_norm": 0.5853097243857709, |
| "learning_rate": 3.8177676537585425e-05, |
| "loss": 0.258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3213130533695221, |
| "step": 420, |
| "valid_targets_mean": 4250.0, |
| "valid_targets_min": 1513 |
| }, |
| { |
| "epoch": 0.6778309409888357, |
| "grad_norm": 0.7301060156034734, |
| "learning_rate": 3.863325740318907e-05, |
| "loss": 0.251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26980870962142944, |
| "step": 425, |
| "valid_targets_mean": 2502.8, |
| "valid_targets_min": 1158 |
| }, |
| { |
| "epoch": 0.6858054226475279, |
| "grad_norm": 0.5832615343218808, |
| "learning_rate": 3.9088838268792714e-05, |
| "loss": 0.2594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2549774646759033, |
| "step": 430, |
| "valid_targets_mean": 3444.6, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 0.69377990430622, |
| "grad_norm": 0.749747412812053, |
| "learning_rate": 3.954441913439636e-05, |
| "loss": 0.2566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2809187173843384, |
| "step": 435, |
| "valid_targets_mean": 2738.5, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 0.7017543859649122, |
| "grad_norm": 0.6682751126395767, |
| "learning_rate": 4e-05, |
| "loss": 0.247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24001020193099976, |
| "step": 440, |
| "valid_targets_mean": 2767.5, |
| "valid_targets_min": 1374 |
| }, |
| { |
| "epoch": 0.7097288676236044, |
| "grad_norm": 0.647984542933624, |
| "learning_rate": 3.9999841858814384e-05, |
| "loss": 0.3028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29405590891838074, |
| "step": 445, |
| "valid_targets_mean": 3640.1, |
| "valid_targets_min": 1438 |
| }, |
| { |
| "epoch": 0.7177033492822966, |
| "grad_norm": 0.6803155407263939, |
| "learning_rate": 3.999936743775839e-05, |
| "loss": 0.283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2493191361427307, |
| "step": 450, |
| "valid_targets_mean": 2872.7, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 0.7256778309409888, |
| "grad_norm": 0.5860939981094048, |
| "learning_rate": 3.9998576744334574e-05, |
| "loss": 0.2728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31388020515441895, |
| "step": 455, |
| "valid_targets_mean": 4003.9, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 0.733652312599681, |
| "grad_norm": 0.7082359097380168, |
| "learning_rate": 3.999746979104705e-05, |
| "loss": 0.2537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.265491247177124, |
| "step": 460, |
| "valid_targets_mean": 2565.0, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 0.7416267942583732, |
| "grad_norm": 0.7642274897132844, |
| "learning_rate": 3.999604659540131e-05, |
| "loss": 0.2751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.284295916557312, |
| "step": 465, |
| "valid_targets_mean": 3430.8, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 0.7496012759170654, |
| "grad_norm": 0.5893515909471992, |
| "learning_rate": 3.999430717990395e-05, |
| "loss": 0.2728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2829861640930176, |
| "step": 470, |
| "valid_targets_mean": 3407.2, |
| "valid_targets_min": 1353 |
| }, |
| { |
| "epoch": 0.7575757575757576, |
| "grad_norm": 0.8136772121235736, |
| "learning_rate": 3.999225157206228e-05, |
| "loss": 0.2526, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23452086746692657, |
| "step": 475, |
| "valid_targets_mean": 1940.5, |
| "valid_targets_min": 1060 |
| }, |
| { |
| "epoch": 0.7655502392344498, |
| "grad_norm": 0.7188632991013135, |
| "learning_rate": 3.998987980438393e-05, |
| "loss": 0.251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19779305160045624, |
| "step": 480, |
| "valid_targets_mean": 2111.4, |
| "valid_targets_min": 1441 |
| }, |
| { |
| "epoch": 0.773524720893142, |
| "grad_norm": 0.5775811168461635, |
| "learning_rate": 3.9987191914376306e-05, |
| "loss": 0.262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2576785683631897, |
| "step": 485, |
| "valid_targets_mean": 3279.2, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 0.7814992025518341, |
| "grad_norm": 0.7007873699634931, |
| "learning_rate": 3.998418794454604e-05, |
| "loss": 0.2439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2803601920604706, |
| "step": 490, |
| "valid_targets_mean": 3080.1, |
| "valid_targets_min": 1657 |
| }, |
| { |
| "epoch": 0.7894736842105263, |
| "grad_norm": 0.6007025928633855, |
| "learning_rate": 3.998086794239825e-05, |
| "loss": 0.2829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32280203700065613, |
| "step": 495, |
| "valid_targets_mean": 4255.9, |
| "valid_targets_min": 1680 |
| }, |
| { |
| "epoch": 0.7974481658692185, |
| "grad_norm": 0.6880645344758224, |
| "learning_rate": 3.997723196043585e-05, |
| "loss": 0.2605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24724368751049042, |
| "step": 500, |
| "valid_targets_mean": 2747.2, |
| "valid_targets_min": 1084 |
| }, |
| { |
| "epoch": 0.8054226475279107, |
| "grad_norm": 0.6773462313419402, |
| "learning_rate": 3.9973280056158695e-05, |
| "loss": 0.2426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2253529280424118, |
| "step": 505, |
| "valid_targets_mean": 2516.2, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 0.8133971291866029, |
| "grad_norm": 0.7173069626107433, |
| "learning_rate": 3.9969012292062655e-05, |
| "loss": 0.2671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27754151821136475, |
| "step": 510, |
| "valid_targets_mean": 2236.1, |
| "valid_targets_min": 269 |
| }, |
| { |
| "epoch": 0.8213716108452951, |
| "grad_norm": 0.6542849868717581, |
| "learning_rate": 3.996442873563866e-05, |
| "loss": 0.2611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24865597486495972, |
| "step": 515, |
| "valid_targets_mean": 2807.8, |
| "valid_targets_min": 1347 |
| }, |
| { |
| "epoch": 0.8293460925039873, |
| "grad_norm": 0.6023761211547769, |
| "learning_rate": 3.9959529459371624e-05, |
| "loss": 0.2549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24921664595603943, |
| "step": 520, |
| "valid_targets_mean": 2813.4, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 0.8373205741626795, |
| "grad_norm": 0.688792403344696, |
| "learning_rate": 3.9954314540739284e-05, |
| "loss": 0.2577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2918543219566345, |
| "step": 525, |
| "valid_targets_mean": 2673.4, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 0.8452950558213717, |
| "grad_norm": 0.5571463923330057, |
| "learning_rate": 3.994878406221097e-05, |
| "loss": 0.2576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31798291206359863, |
| "step": 530, |
| "valid_targets_mean": 3787.4, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 0.8532695374800638, |
| "grad_norm": 0.5343440337170275, |
| "learning_rate": 3.994293811124632e-05, |
| "loss": 0.2699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3140130043029785, |
| "step": 535, |
| "valid_targets_mean": 4513.2, |
| "valid_targets_min": 1192 |
| }, |
| { |
| "epoch": 0.861244019138756, |
| "grad_norm": 0.6667148523666464, |
| "learning_rate": 3.993677678029392e-05, |
| "loss": 0.2883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2631716728210449, |
| "step": 540, |
| "valid_targets_mean": 2576.0, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 0.8692185007974481, |
| "grad_norm": 0.621797201029701, |
| "learning_rate": 3.9930300166789765e-05, |
| "loss": 0.2529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23845577239990234, |
| "step": 545, |
| "valid_targets_mean": 2497.0, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 0.8771929824561403, |
| "grad_norm": 0.5849281982647846, |
| "learning_rate": 3.992350837315581e-05, |
| "loss": 0.2403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24086298048496246, |
| "step": 550, |
| "valid_targets_mean": 2936.5, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 0.8851674641148325, |
| "grad_norm": 0.6100603750245858, |
| "learning_rate": 3.991640150679826e-05, |
| "loss": 0.2442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2142607867717743, |
| "step": 555, |
| "valid_targets_mean": 2693.3, |
| "valid_targets_min": 996 |
| }, |
| { |
| "epoch": 0.8931419457735247, |
| "grad_norm": 0.679595548377651, |
| "learning_rate": 3.990897968010596e-05, |
| "loss": 0.2551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23986729979515076, |
| "step": 560, |
| "valid_targets_mean": 2657.9, |
| "valid_targets_min": 1230 |
| }, |
| { |
| "epoch": 0.9011164274322169, |
| "grad_norm": 0.5714798003175021, |
| "learning_rate": 3.990124301044855e-05, |
| "loss": 0.2359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22235023975372314, |
| "step": 565, |
| "valid_targets_mean": 3395.3, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 0.9090909090909091, |
| "grad_norm": 0.6184667605667801, |
| "learning_rate": 3.989319162017465e-05, |
| "loss": 0.2446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22823108732700348, |
| "step": 570, |
| "valid_targets_mean": 2967.4, |
| "valid_targets_min": 1564 |
| }, |
| { |
| "epoch": 0.9170653907496013, |
| "grad_norm": 0.7112571643134058, |
| "learning_rate": 3.988482563660989e-05, |
| "loss": 0.2718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30855730175971985, |
| "step": 575, |
| "valid_targets_mean": 2733.8, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 0.9250398724082934, |
| "grad_norm": 0.5409940557899795, |
| "learning_rate": 3.987614519205493e-05, |
| "loss": 0.2587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2341741919517517, |
| "step": 580, |
| "valid_targets_mean": 3420.3, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 0.9330143540669856, |
| "grad_norm": 0.6283821372972509, |
| "learning_rate": 3.986715042378334e-05, |
| "loss": 0.2549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26625967025756836, |
| "step": 585, |
| "valid_targets_mean": 2681.2, |
| "valid_targets_min": 1477 |
| }, |
| { |
| "epoch": 0.9409888357256778, |
| "grad_norm": 0.5958617621432479, |
| "learning_rate": 3.985784147403947e-05, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2559368312358856, |
| "step": 590, |
| "valid_targets_mean": 2903.1, |
| "valid_targets_min": 1321 |
| }, |
| { |
| "epoch": 0.94896331738437, |
| "grad_norm": 0.5949783472882877, |
| "learning_rate": 3.9848218490036144e-05, |
| "loss": 0.2478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2529694437980652, |
| "step": 595, |
| "valid_targets_mean": 3612.6, |
| "valid_targets_min": 1114 |
| }, |
| { |
| "epoch": 0.9569377990430622, |
| "grad_norm": 0.5701025918722548, |
| "learning_rate": 3.983828162395238e-05, |
| "loss": 0.2505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24346418678760529, |
| "step": 600, |
| "valid_targets_mean": 3209.6, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 0.9649122807017544, |
| "grad_norm": 1.3475027154750536, |
| "learning_rate": 3.9828031032930944e-05, |
| "loss": 0.2693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23624694347381592, |
| "step": 605, |
| "valid_targets_mean": 2403.8, |
| "valid_targets_min": 1275 |
| }, |
| { |
| "epoch": 0.9728867623604466, |
| "grad_norm": 0.6783942654321022, |
| "learning_rate": 3.98174668790759e-05, |
| "loss": 0.2531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28323280811309814, |
| "step": 610, |
| "valid_targets_mean": 3008.2, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 0.9808612440191388, |
| "grad_norm": 0.7285748900158596, |
| "learning_rate": 3.9806589329450045e-05, |
| "loss": 0.2336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23608598113059998, |
| "step": 615, |
| "valid_targets_mean": 1979.1, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 0.988835725677831, |
| "grad_norm": 0.5779028885760018, |
| "learning_rate": 3.979539855607222e-05, |
| "loss": 0.2514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22704467177391052, |
| "step": 620, |
| "valid_targets_mean": 2778.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 0.9968102073365231, |
| "grad_norm": 0.53910671747115, |
| "learning_rate": 3.9783894735914646e-05, |
| "loss": 0.2609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24189332127571106, |
| "step": 625, |
| "valid_targets_mean": 3171.7, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 1.0047846889952152, |
| "grad_norm": 0.5590992427797843, |
| "learning_rate": 3.9772078050900105e-05, |
| "loss": 0.2519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.267245352268219, |
| "step": 630, |
| "valid_targets_mean": 3224.1, |
| "valid_targets_min": 1330 |
| }, |
| { |
| "epoch": 1.0127591706539074, |
| "grad_norm": 0.5412219374722034, |
| "learning_rate": 3.9759948687899055e-05, |
| "loss": 0.2367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2462998479604721, |
| "step": 635, |
| "valid_targets_mean": 3618.4, |
| "valid_targets_min": 1397 |
| }, |
| { |
| "epoch": 1.0207336523125996, |
| "grad_norm": 0.6043980742100203, |
| "learning_rate": 3.974750683872667e-05, |
| "loss": 0.2515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24493081867694855, |
| "step": 640, |
| "valid_targets_mean": 2639.1, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 1.0287081339712918, |
| "grad_norm": 0.7096444272979168, |
| "learning_rate": 3.973475270013984e-05, |
| "loss": 0.2498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33669358491897583, |
| "step": 645, |
| "valid_targets_mean": 2667.2, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 1.036682615629984, |
| "grad_norm": 0.5889749694176992, |
| "learning_rate": 3.972168647383402e-05, |
| "loss": 0.2135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20457293093204498, |
| "step": 650, |
| "valid_targets_mean": 2950.1, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 1.0446570972886762, |
| "grad_norm": 0.545750879813732, |
| "learning_rate": 3.970830836644006e-05, |
| "loss": 0.2317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23334968090057373, |
| "step": 655, |
| "valid_targets_mean": 3426.9, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 1.0526315789473684, |
| "grad_norm": 0.6522530149915291, |
| "learning_rate": 3.9694618589520945e-05, |
| "loss": 0.202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21202175319194794, |
| "step": 660, |
| "valid_targets_mean": 2608.2, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 1.0606060606060606, |
| "grad_norm": 0.6005460698394031, |
| "learning_rate": 3.9680617359568414e-05, |
| "loss": 0.2469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2296278476715088, |
| "step": 665, |
| "valid_targets_mean": 2712.1, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 1.0685805422647527, |
| "grad_norm": 0.6017327323981438, |
| "learning_rate": 3.966630489799959e-05, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21935969591140747, |
| "step": 670, |
| "valid_targets_mean": 2787.2, |
| "valid_targets_min": 1514 |
| }, |
| { |
| "epoch": 1.076555023923445, |
| "grad_norm": 0.6150691268319541, |
| "learning_rate": 3.9651681431153445e-05, |
| "loss": 0.236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22077104449272156, |
| "step": 675, |
| "valid_targets_mean": 2930.1, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 1.0845295055821371, |
| "grad_norm": 0.6200136891990149, |
| "learning_rate": 3.96367471902872e-05, |
| "loss": 0.2118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19286946952342987, |
| "step": 680, |
| "valid_targets_mean": 2750.2, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 1.0925039872408293, |
| "grad_norm": 0.5655815816732179, |
| "learning_rate": 3.9621502411572705e-05, |
| "loss": 0.2595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24388240277767181, |
| "step": 685, |
| "valid_targets_mean": 3086.5, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 1.1004784688995215, |
| "grad_norm": 0.5885904619456156, |
| "learning_rate": 3.960594733609273e-05, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2468026876449585, |
| "step": 690, |
| "valid_targets_mean": 3201.1, |
| "valid_targets_min": 948 |
| }, |
| { |
| "epoch": 1.1084529505582137, |
| "grad_norm": 0.5232919415905639, |
| "learning_rate": 3.9590082209837054e-05, |
| "loss": 0.2231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22746863961219788, |
| "step": 695, |
| "valid_targets_mean": 3608.3, |
| "valid_targets_min": 1395 |
| }, |
| { |
| "epoch": 1.1164274322169059, |
| "grad_norm": 0.5795983343051004, |
| "learning_rate": 3.957390728369867e-05, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21875368058681488, |
| "step": 700, |
| "valid_targets_mean": 2985.8, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 1.124401913875598, |
| "grad_norm": 0.6474674101877196, |
| "learning_rate": 3.955742281346979e-05, |
| "loss": 0.2168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24110597372055054, |
| "step": 705, |
| "valid_targets_mean": 2594.4, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 1.1323763955342903, |
| "grad_norm": 0.6120178805218351, |
| "learning_rate": 3.9540629059837767e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2766246795654297, |
| "step": 710, |
| "valid_targets_mean": 2957.4, |
| "valid_targets_min": 1321 |
| }, |
| { |
| "epoch": 1.1403508771929824, |
| "grad_norm": 0.6448170583460983, |
| "learning_rate": 3.952352628838102e-05, |
| "loss": 0.2222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19483381509780884, |
| "step": 715, |
| "valid_targets_mean": 2121.1, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 1.1483253588516746, |
| "grad_norm": 0.6548168327201195, |
| "learning_rate": 3.95061147695648e-05, |
| "loss": 0.2324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21812087297439575, |
| "step": 720, |
| "valid_targets_mean": 2455.1, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 1.1562998405103668, |
| "grad_norm": 0.6190274225455182, |
| "learning_rate": 3.9488394778736935e-05, |
| "loss": 0.2746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22314514219760895, |
| "step": 725, |
| "valid_targets_mean": 2731.3, |
| "valid_targets_min": 1342 |
| }, |
| { |
| "epoch": 1.164274322169059, |
| "grad_norm": 0.6010823414002561, |
| "learning_rate": 3.947036659612345e-05, |
| "loss": 0.2324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2784811854362488, |
| "step": 730, |
| "valid_targets_mean": 3532.8, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 1.1722488038277512, |
| "grad_norm": 0.6149720156451945, |
| "learning_rate": 3.945203050682418e-05, |
| "loss": 0.2362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2704809308052063, |
| "step": 735, |
| "valid_targets_mean": 3149.3, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 1.1802232854864434, |
| "grad_norm": 0.510802694097458, |
| "learning_rate": 3.94333868008082e-05, |
| "loss": 0.2161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2353009134531021, |
| "step": 740, |
| "valid_targets_mean": 3687.4, |
| "valid_targets_min": 1494 |
| }, |
| { |
| "epoch": 1.1881977671451356, |
| "grad_norm": 0.6004191651529056, |
| "learning_rate": 3.94144357729093e-05, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27018919587135315, |
| "step": 745, |
| "valid_targets_mean": 3065.2, |
| "valid_targets_min": 1087 |
| }, |
| { |
| "epoch": 1.1961722488038278, |
| "grad_norm": 0.5173197330016904, |
| "learning_rate": 3.939517772282127e-05, |
| "loss": 0.2183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19749709963798523, |
| "step": 750, |
| "valid_targets_mean": 3088.0, |
| "valid_targets_min": 1262 |
| }, |
| { |
| "epoch": 1.20414673046252, |
| "grad_norm": 0.5989450936696408, |
| "learning_rate": 3.93756129550932e-05, |
| "loss": 0.2236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22018079459667206, |
| "step": 755, |
| "valid_targets_mean": 2998.4, |
| "valid_targets_min": 1572 |
| }, |
| { |
| "epoch": 1.2121212121212122, |
| "grad_norm": 0.570268839573639, |
| "learning_rate": 3.935574177912465e-05, |
| "loss": 0.2564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2346849888563156, |
| "step": 760, |
| "valid_targets_mean": 3287.2, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 1.2200956937799043, |
| "grad_norm": 0.601105124747731, |
| "learning_rate": 3.9335564509160746e-05, |
| "loss": 0.2372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2528783977031708, |
| "step": 765, |
| "valid_targets_mean": 3077.8, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 1.2280701754385965, |
| "grad_norm": 0.6142966339382259, |
| "learning_rate": 3.931508146428724e-05, |
| "loss": 0.223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22747379541397095, |
| "step": 770, |
| "valid_targets_mean": 2825.7, |
| "valid_targets_min": 1102 |
| }, |
| { |
| "epoch": 1.2360446570972887, |
| "grad_norm": 0.5087997480632052, |
| "learning_rate": 3.929429296842542e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23831650614738464, |
| "step": 775, |
| "valid_targets_mean": 3389.8, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 1.244019138755981, |
| "grad_norm": 0.5239878661727811, |
| "learning_rate": 3.927319935032703e-05, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2023959755897522, |
| "step": 780, |
| "valid_targets_mean": 3227.9, |
| "valid_targets_min": 1260 |
| }, |
| { |
| "epoch": 1.251993620414673, |
| "grad_norm": 0.6968846240351381, |
| "learning_rate": 3.925180094356905e-05, |
| "loss": 0.2242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20895949006080627, |
| "step": 785, |
| "valid_targets_mean": 2142.9, |
| "valid_targets_min": 1298 |
| }, |
| { |
| "epoch": 1.2599681020733653, |
| "grad_norm": 0.6041827706842907, |
| "learning_rate": 3.9230098086548414e-05, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19941559433937073, |
| "step": 790, |
| "valid_targets_mean": 2695.4, |
| "valid_targets_min": 1440 |
| }, |
| { |
| "epoch": 1.2679425837320575, |
| "grad_norm": 0.5775916446397974, |
| "learning_rate": 3.920809112247668e-05, |
| "loss": 0.216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21255138516426086, |
| "step": 795, |
| "valid_targets_mean": 2856.7, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 1.2759170653907497, |
| "grad_norm": 0.5543005602140678, |
| "learning_rate": 3.918578039937459e-05, |
| "loss": 0.2442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2445598691701889, |
| "step": 800, |
| "valid_targets_mean": 3451.8, |
| "valid_targets_min": 1607 |
| }, |
| { |
| "epoch": 1.2838915470494419, |
| "grad_norm": 0.560785534024231, |
| "learning_rate": 3.916316627006656e-05, |
| "loss": 0.2197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19521670043468475, |
| "step": 805, |
| "valid_targets_mean": 3096.6, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 1.291866028708134, |
| "grad_norm": 0.5767637988086921, |
| "learning_rate": 3.914024909217511e-05, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2539677619934082, |
| "step": 810, |
| "valid_targets_mean": 3374.2, |
| "valid_targets_min": 1374 |
| }, |
| { |
| "epoch": 1.2998405103668262, |
| "grad_norm": 0.6209716508260346, |
| "learning_rate": 3.911702922811522e-05, |
| "loss": 0.2388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19697776436805725, |
| "step": 815, |
| "valid_targets_mean": 2215.6, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 1.3078149920255182, |
| "grad_norm": 0.6291469867776873, |
| "learning_rate": 3.909350704508856e-05, |
| "loss": 0.2348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23938624560832977, |
| "step": 820, |
| "valid_targets_mean": 2760.1, |
| "valid_targets_min": 1112 |
| }, |
| { |
| "epoch": 1.3157894736842106, |
| "grad_norm": 0.5575921172983946, |
| "learning_rate": 3.906968291507773e-05, |
| "loss": 0.2158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2400011122226715, |
| "step": 825, |
| "valid_targets_mean": 3671.2, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 1.3237639553429026, |
| "grad_norm": 0.6345082402652992, |
| "learning_rate": 3.904555721484034e-05, |
| "loss": 0.2426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24229951202869415, |
| "step": 830, |
| "valid_targets_mean": 2401.9, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 1.331738437001595, |
| "grad_norm": 0.6195684041173591, |
| "learning_rate": 3.9021130325903076e-05, |
| "loss": 0.2487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3127402663230896, |
| "step": 835, |
| "valid_targets_mean": 3132.9, |
| "valid_targets_min": 1253 |
| }, |
| { |
| "epoch": 1.339712918660287, |
| "grad_norm": 0.6563542216109102, |
| "learning_rate": 3.899640263455566e-05, |
| "loss": 0.2349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2351498007774353, |
| "step": 840, |
| "valid_targets_mean": 2515.1, |
| "valid_targets_min": 1464 |
| }, |
| { |
| "epoch": 1.3476874003189794, |
| "grad_norm": 0.64783568591679, |
| "learning_rate": 3.897137453184472e-05, |
| "loss": 0.2372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22898787260055542, |
| "step": 845, |
| "valid_targets_mean": 2141.3, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 1.3556618819776713, |
| "grad_norm": 0.5823873984785253, |
| "learning_rate": 3.894604641356767e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19752237200737, |
| "step": 850, |
| "valid_targets_mean": 2627.8, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 1.3636363636363638, |
| "grad_norm": 0.5757894549438445, |
| "learning_rate": 3.8920418680266346e-05, |
| "loss": 0.2167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1831761598587036, |
| "step": 855, |
| "valid_targets_mean": 2389.3, |
| "valid_targets_min": 1272 |
| }, |
| { |
| "epoch": 1.3716108452950557, |
| "grad_norm": 0.49327863847117276, |
| "learning_rate": 3.889449173722077e-05, |
| "loss": 0.2172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20380468666553497, |
| "step": 860, |
| "valid_targets_mean": 3471.6, |
| "valid_targets_min": 1488 |
| }, |
| { |
| "epoch": 1.3795853269537481, |
| "grad_norm": 0.6307638441078381, |
| "learning_rate": 3.8868265994442694e-05, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21134331822395325, |
| "step": 865, |
| "valid_targets_mean": 2447.6, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 1.38755980861244, |
| "grad_norm": 0.5265701690721363, |
| "learning_rate": 3.8841741866669126e-05, |
| "loss": 0.2454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21514572203159332, |
| "step": 870, |
| "valid_targets_mean": 3132.0, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 1.3955342902711323, |
| "grad_norm": 0.6272683045446587, |
| "learning_rate": 3.881491977335577e-05, |
| "loss": 0.2304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2270197570323944, |
| "step": 875, |
| "valid_targets_mean": 2979.2, |
| "valid_targets_min": 1335 |
| }, |
| { |
| "epoch": 1.4035087719298245, |
| "grad_norm": 0.5125155204565588, |
| "learning_rate": 3.878780013867038e-05, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.211686909198761, |
| "step": 880, |
| "valid_targets_mean": 3388.2, |
| "valid_targets_min": 1407 |
| }, |
| { |
| "epoch": 1.4114832535885167, |
| "grad_norm": 0.5884010149005009, |
| "learning_rate": 3.8760383391486074e-05, |
| "loss": 0.2428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21981844305992126, |
| "step": 885, |
| "valid_targets_mean": 2581.7, |
| "valid_targets_min": 1090 |
| }, |
| { |
| "epoch": 1.4194577352472089, |
| "grad_norm": 0.5864469022550587, |
| "learning_rate": 3.873266996537456e-05, |
| "loss": 0.2394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2843884825706482, |
| "step": 890, |
| "valid_targets_mean": 3282.1, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 1.427432216905901, |
| "grad_norm": 0.6407016912115063, |
| "learning_rate": 3.8704660298599225e-05, |
| "loss": 0.2586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3323836922645569, |
| "step": 895, |
| "valid_targets_mean": 3613.4, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 1.4354066985645932, |
| "grad_norm": 0.548542676602486, |
| "learning_rate": 3.867635483410827e-05, |
| "loss": 0.2219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2041669636964798, |
| "step": 900, |
| "valid_targets_mean": 2906.9, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 1.4433811802232854, |
| "grad_norm": 0.5135362865237451, |
| "learning_rate": 3.864775401952767e-05, |
| "loss": 0.2504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.236622616648674, |
| "step": 905, |
| "valid_targets_mean": 3590.2, |
| "valid_targets_min": 1038 |
| }, |
| { |
| "epoch": 1.4513556618819776, |
| "grad_norm": 0.5695703284047577, |
| "learning_rate": 3.8618858307154085e-05, |
| "loss": 0.2381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31914830207824707, |
| "step": 910, |
| "valid_targets_mean": 3563.1, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 1.4593301435406698, |
| "grad_norm": 0.6066778005066594, |
| "learning_rate": 3.8589668153947743e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16905300319194794, |
| "step": 915, |
| "valid_targets_mean": 2114.1, |
| "valid_targets_min": 1312 |
| }, |
| { |
| "epoch": 1.467304625199362, |
| "grad_norm": 0.5937089594035688, |
| "learning_rate": 3.8560184021525194e-05, |
| "loss": 0.2306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2555321455001831, |
| "step": 920, |
| "valid_targets_mean": 2893.0, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 1.4752791068580542, |
| "grad_norm": 0.6283464141673474, |
| "learning_rate": 3.853040637615199e-05, |
| "loss": 0.2278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.195700004696846, |
| "step": 925, |
| "valid_targets_mean": 2522.1, |
| "valid_targets_min": 1232 |
| }, |
| { |
| "epoch": 1.4832535885167464, |
| "grad_norm": 0.5723038985943404, |
| "learning_rate": 3.850033568873536e-05, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19896413385868073, |
| "step": 930, |
| "valid_targets_mean": 2328.2, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 1.4912280701754386, |
| "grad_norm": 0.6164522031974263, |
| "learning_rate": 3.8469972434816706e-05, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18973922729492188, |
| "step": 935, |
| "valid_targets_mean": 2312.7, |
| "valid_targets_min": 1280 |
| }, |
| { |
| "epoch": 1.4992025518341308, |
| "grad_norm": 0.6086637262441689, |
| "learning_rate": 3.843931709456414e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24724075198173523, |
| "step": 940, |
| "valid_targets_mean": 2995.4, |
| "valid_targets_min": 1567 |
| }, |
| { |
| "epoch": 1.507177033492823, |
| "grad_norm": 0.6483381919678638, |
| "learning_rate": 3.840837015276483e-05, |
| "loss": 0.2483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3337307572364807, |
| "step": 945, |
| "valid_targets_mean": 2911.9, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 1.5151515151515151, |
| "grad_norm": 0.5855323586411422, |
| "learning_rate": 3.83771320988174e-05, |
| "loss": 0.2305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17903995513916016, |
| "step": 950, |
| "valid_targets_mean": 2291.5, |
| "valid_targets_min": 1377 |
| }, |
| { |
| "epoch": 1.5231259968102073, |
| "grad_norm": 0.584270941139963, |
| "learning_rate": 3.834560342672413e-05, |
| "loss": 0.2357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21279588341712952, |
| "step": 955, |
| "valid_targets_mean": 2610.5, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 1.5311004784688995, |
| "grad_norm": 0.5503620072606771, |
| "learning_rate": 3.831378463508318e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2559887170791626, |
| "step": 960, |
| "valid_targets_mean": 3138.2, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 1.5390749601275917, |
| "grad_norm": 0.6001392975485096, |
| "learning_rate": 3.8281676227080694e-05, |
| "loss": 0.2222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2329024225473404, |
| "step": 965, |
| "valid_targets_mean": 2648.9, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 1.547049441786284, |
| "grad_norm": 0.5346724503885805, |
| "learning_rate": 3.824927871048284e-05, |
| "loss": 0.2146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19294703006744385, |
| "step": 970, |
| "valid_targets_mean": 2822.2, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 1.555023923444976, |
| "grad_norm": 0.49919442227666905, |
| "learning_rate": 3.8216592597627797e-05, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2007545828819275, |
| "step": 975, |
| "valid_targets_mean": 3116.3, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 1.5629984051036683, |
| "grad_norm": 0.5982205761118605, |
| "learning_rate": 3.818361840541761e-05, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18389758467674255, |
| "step": 980, |
| "valid_targets_mean": 2047.2, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 1.5709728867623605, |
| "grad_norm": 0.5512917759429814, |
| "learning_rate": 3.815035665531008e-05, |
| "loss": 0.2115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1839146614074707, |
| "step": 985, |
| "valid_targets_mean": 2353.8, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 1.5789473684210527, |
| "grad_norm": 0.6223649318682416, |
| "learning_rate": 3.811680787331047e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18036724627017975, |
| "step": 990, |
| "valid_targets_mean": 2156.6, |
| "valid_targets_min": 1002 |
| }, |
| { |
| "epoch": 1.5869218500797448, |
| "grad_norm": 0.6352872088960317, |
| "learning_rate": 3.8082972589963175e-05, |
| "loss": 0.2359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2819938361644745, |
| "step": 995, |
| "valid_targets_mean": 2302.4, |
| "valid_targets_min": 894 |
| }, |
| { |
| "epoch": 1.594896331738437, |
| "grad_norm": 0.6242377091078459, |
| "learning_rate": 3.80488513403434e-05, |
| "loss": 0.2396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.289346307516098, |
| "step": 1000, |
| "valid_targets_mean": 2421.4, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 1.6028708133971292, |
| "grad_norm": 0.5826983613530846, |
| "learning_rate": 3.8014444664048616e-05, |
| "loss": 0.2144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25043565034866333, |
| "step": 1005, |
| "valid_targets_mean": 2823.9, |
| "valid_targets_min": 1114 |
| }, |
| { |
| "epoch": 1.6108452950558214, |
| "grad_norm": 0.5546186494842212, |
| "learning_rate": 3.797975310519009e-05, |
| "loss": 0.2145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21974100172519684, |
| "step": 1010, |
| "valid_targets_mean": 3072.6, |
| "valid_targets_min": 1653 |
| }, |
| { |
| "epoch": 1.6188197767145136, |
| "grad_norm": 0.4632694182062778, |
| "learning_rate": 3.794477721238425e-05, |
| "loss": 0.2261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21472452580928802, |
| "step": 1015, |
| "valid_targets_mean": 3615.5, |
| "valid_targets_min": 1532 |
| }, |
| { |
| "epoch": 1.6267942583732058, |
| "grad_norm": 0.5830152765455087, |
| "learning_rate": 3.7909517538744e-05, |
| "loss": 0.2408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2194686233997345, |
| "step": 1020, |
| "valid_targets_mean": 2642.8, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 1.6347687400318978, |
| "grad_norm": 0.6151873688159493, |
| "learning_rate": 3.7873974641870006e-05, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1882760226726532, |
| "step": 1025, |
| "valid_targets_mean": 2297.1, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 1.6427432216905902, |
| "grad_norm": 2.140862445980475, |
| "learning_rate": 3.7838149083841856e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23605549335479736, |
| "step": 1030, |
| "valid_targets_mean": 2535.2, |
| "valid_targets_min": 1069 |
| }, |
| { |
| "epoch": 1.6507177033492821, |
| "grad_norm": 0.6528803837865146, |
| "learning_rate": 3.7802041431209166e-05, |
| "loss": 0.2556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2378740757703781, |
| "step": 1035, |
| "valid_targets_mean": 2299.6, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 1.6586921850079746, |
| "grad_norm": 0.6191369201573628, |
| "learning_rate": 3.776565225498264e-05, |
| "loss": 0.2877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24140696227550507, |
| "step": 1040, |
| "valid_targets_mean": 2222.6, |
| "valid_targets_min": 1094 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.6498039390645324, |
| "learning_rate": 3.7728982130625025e-05, |
| "loss": 0.2179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2488032430410385, |
| "step": 1045, |
| "valid_targets_mean": 2576.2, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 1.674641148325359, |
| "grad_norm": 0.6375130250679868, |
| "learning_rate": 3.769203163804202e-05, |
| "loss": 0.2556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2386590838432312, |
| "step": 1050, |
| "valid_targets_mean": 2930.1, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 1.682615629984051, |
| "grad_norm": 0.5527652926140382, |
| "learning_rate": 3.7654801361573076e-05, |
| "loss": 0.2367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.264995276927948, |
| "step": 1055, |
| "valid_targets_mean": 3239.4, |
| "valid_targets_min": 1355 |
| }, |
| { |
| "epoch": 1.6905901116427433, |
| "grad_norm": 0.5370865034755017, |
| "learning_rate": 3.761729188998222e-05, |
| "loss": 0.2418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28277504444122314, |
| "step": 1060, |
| "valid_targets_mean": 3348.9, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 1.6985645933014353, |
| "grad_norm": 0.5747670458007346, |
| "learning_rate": 3.757950381644868e-05, |
| "loss": 0.2282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20245248079299927, |
| "step": 1065, |
| "valid_targets_mean": 2440.8, |
| "valid_targets_min": 1309 |
| }, |
| { |
| "epoch": 1.7065390749601277, |
| "grad_norm": 0.6094654650302161, |
| "learning_rate": 3.7541437738557524e-05, |
| "loss": 0.2247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20767079293727875, |
| "step": 1070, |
| "valid_targets_mean": 2374.6, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 1.7145135566188197, |
| "grad_norm": 0.5569861380782473, |
| "learning_rate": 3.750309425829022e-05, |
| "loss": 0.2408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24564585089683533, |
| "step": 1075, |
| "valid_targets_mean": 3401.3, |
| "valid_targets_min": 1262 |
| }, |
| { |
| "epoch": 1.722488038277512, |
| "grad_norm": 0.613745920593988, |
| "learning_rate": 3.746447398201512e-05, |
| "loss": 0.2132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2049260288476944, |
| "step": 1080, |
| "valid_targets_mean": 2619.6, |
| "valid_targets_min": 1067 |
| }, |
| { |
| "epoch": 1.730462519936204, |
| "grad_norm": 0.5548189655462026, |
| "learning_rate": 3.7425577520477846e-05, |
| "loss": 0.2516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23266099393367767, |
| "step": 1085, |
| "valid_targets_mean": 2925.9, |
| "valid_targets_min": 1192 |
| }, |
| { |
| "epoch": 1.7384370015948964, |
| "grad_norm": 0.5254275868939079, |
| "learning_rate": 3.738640548879166e-05, |
| "loss": 0.2263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18870019912719727, |
| "step": 1090, |
| "valid_targets_mean": 2759.0, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 1.7464114832535884, |
| "grad_norm": 0.5020906772682225, |
| "learning_rate": 3.7346958506427696e-05, |
| "loss": 0.2434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25047755241394043, |
| "step": 1095, |
| "valid_targets_mean": 3543.0, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 1.7543859649122808, |
| "grad_norm": 0.6019040221940559, |
| "learning_rate": 3.730723719720523e-05, |
| "loss": 0.2188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21497926115989685, |
| "step": 1100, |
| "valid_targets_mean": 2993.9, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 1.7623604465709728, |
| "grad_norm": 0.5134617499391168, |
| "learning_rate": 3.7267242189281746e-05, |
| "loss": 0.217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23121070861816406, |
| "step": 1105, |
| "valid_targets_mean": 3359.8, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 1.7703349282296652, |
| "grad_norm": 0.555534809215992, |
| "learning_rate": 3.722697411514305e-05, |
| "loss": 0.223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2400152087211609, |
| "step": 1110, |
| "valid_targets_mean": 2866.0, |
| "valid_targets_min": 1332 |
| }, |
| { |
| "epoch": 1.7783094098883572, |
| "grad_norm": 0.6105348331308175, |
| "learning_rate": 3.7186433611593225e-05, |
| "loss": 0.2265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30984336137771606, |
| "step": 1115, |
| "valid_targets_mean": 3165.9, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 1.7862838915470496, |
| "grad_norm": 0.5761430256224706, |
| "learning_rate": 3.7145621319744614e-05, |
| "loss": 0.2334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26511406898498535, |
| "step": 1120, |
| "valid_targets_mean": 3365.7, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 1.7942583732057416, |
| "grad_norm": 0.5782063968492165, |
| "learning_rate": 3.7104537885007635e-05, |
| "loss": 0.2262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21325793862342834, |
| "step": 1125, |
| "valid_targets_mean": 2586.2, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 1.802232854864434, |
| "grad_norm": 0.6766750855241791, |
| "learning_rate": 3.7063183957080594e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19376319646835327, |
| "step": 1130, |
| "valid_targets_mean": 2382.9, |
| "valid_targets_min": 1198 |
| }, |
| { |
| "epoch": 1.810207336523126, |
| "grad_norm": 0.47421899311917426, |
| "learning_rate": 3.7021560189939416e-05, |
| "loss": 0.2425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21126791834831238, |
| "step": 1135, |
| "valid_targets_mean": 3506.8, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 1.8181818181818183, |
| "grad_norm": 0.5034779048358913, |
| "learning_rate": 3.697966724182729e-05, |
| "loss": 0.2013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19855384528636932, |
| "step": 1140, |
| "valid_targets_mean": 3456.3, |
| "valid_targets_min": 1199 |
| }, |
| { |
| "epoch": 1.8261562998405103, |
| "grad_norm": 0.6337585629876568, |
| "learning_rate": 3.6937505775244246e-05, |
| "loss": 0.2078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22304585576057434, |
| "step": 1145, |
| "valid_targets_mean": 2685.5, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 1.8341307814992025, |
| "grad_norm": 0.5610178719430047, |
| "learning_rate": 3.689507645693674e-05, |
| "loss": 0.2166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2178836166858673, |
| "step": 1150, |
| "valid_targets_mean": 3309.5, |
| "valid_targets_min": 1342 |
| }, |
| { |
| "epoch": 1.8421052631578947, |
| "grad_norm": 0.5239047956067104, |
| "learning_rate": 3.6852379957887025e-05, |
| "loss": 0.2129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1819612830877304, |
| "step": 1155, |
| "valid_targets_mean": 2517.4, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 1.8500797448165869, |
| "grad_norm": 0.5749497640819529, |
| "learning_rate": 3.6809416953302606e-05, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1893683671951294, |
| "step": 1160, |
| "valid_targets_mean": 2465.4, |
| "valid_targets_min": 1262 |
| }, |
| { |
| "epoch": 1.858054226475279, |
| "grad_norm": 0.5625715315011639, |
| "learning_rate": 3.676618812260553e-05, |
| "loss": 0.2083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18896302580833435, |
| "step": 1165, |
| "valid_targets_mean": 2504.8, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 1.8660287081339713, |
| "grad_norm": 0.5196211344002306, |
| "learning_rate": 3.672269414942166e-05, |
| "loss": 0.2349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18706221878528595, |
| "step": 1170, |
| "valid_targets_mean": 2709.4, |
| "valid_targets_min": 1589 |
| }, |
| { |
| "epoch": 1.8740031897926634, |
| "grad_norm": 0.5409333832286379, |
| "learning_rate": 3.6678935721569825e-05, |
| "loss": 0.2275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18008098006248474, |
| "step": 1175, |
| "valid_targets_mean": 2698.2, |
| "valid_targets_min": 1756 |
| }, |
| { |
| "epoch": 1.8819776714513556, |
| "grad_norm": 0.5215242217921682, |
| "learning_rate": 3.663491353105101e-05, |
| "loss": 0.2165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23432385921478271, |
| "step": 1180, |
| "valid_targets_mean": 3169.7, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 1.8899521531100478, |
| "grad_norm": 0.4659554830522906, |
| "learning_rate": 3.659062827403735e-05, |
| "loss": 0.1949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18295270204544067, |
| "step": 1185, |
| "valid_targets_mean": 3136.5, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 1.89792663476874, |
| "grad_norm": 0.5834321903658111, |
| "learning_rate": 3.654608065086115e-05, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1885906457901001, |
| "step": 1190, |
| "valid_targets_mean": 2347.2, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 1.9059011164274322, |
| "grad_norm": 0.4892253621146179, |
| "learning_rate": 3.650127136600379e-05, |
| "loss": 0.2282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25364458560943604, |
| "step": 1195, |
| "valid_targets_mean": 4085.2, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 1.9138755980861244, |
| "grad_norm": 0.5076087679251333, |
| "learning_rate": 3.645620112808464e-05, |
| "loss": 0.216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20003008842468262, |
| "step": 1200, |
| "valid_targets_mean": 3066.7, |
| "valid_targets_min": 1299 |
| }, |
| { |
| "epoch": 1.9218500797448166, |
| "grad_norm": 0.5335946413112277, |
| "learning_rate": 3.641087064984977e-05, |
| "loss": 0.2257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2127196490764618, |
| "step": 1205, |
| "valid_targets_mean": 2720.1, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 1.9298245614035088, |
| "grad_norm": 0.6361693621882534, |
| "learning_rate": 3.636528064816073e-05, |
| "loss": 0.2213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19323310256004333, |
| "step": 1210, |
| "valid_targets_mean": 2129.1, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 1.937799043062201, |
| "grad_norm": 0.5843343837357229, |
| "learning_rate": 3.6319431843983223e-05, |
| "loss": 0.2507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2852637767791748, |
| "step": 1215, |
| "valid_targets_mean": 3620.1, |
| "valid_targets_min": 1158 |
| }, |
| { |
| "epoch": 1.9457735247208932, |
| "grad_norm": 0.5951676671617808, |
| "learning_rate": 3.6273324962375676e-05, |
| "loss": 0.2073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2468632161617279, |
| "step": 1220, |
| "valid_targets_mean": 2911.6, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 1.9537480063795853, |
| "grad_norm": 0.6569118735077601, |
| "learning_rate": 3.622696073247777e-05, |
| "loss": 0.2117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24635280668735504, |
| "step": 1225, |
| "valid_targets_mean": 3458.5, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 1.9617224880382775, |
| "grad_norm": 0.5437346633446027, |
| "learning_rate": 3.6180339887498953e-05, |
| "loss": 0.2272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2951074540615082, |
| "step": 1230, |
| "valid_targets_mean": 3982.8, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 1.9696969696969697, |
| "grad_norm": 0.4940449249242946, |
| "learning_rate": 3.613346316470678e-05, |
| "loss": 0.2376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23175011575222015, |
| "step": 1235, |
| "valid_targets_mean": 3729.4, |
| "valid_targets_min": 1226 |
| }, |
| { |
| "epoch": 1.977671451355662, |
| "grad_norm": 0.5477246251152017, |
| "learning_rate": 3.60863313054153e-05, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18664443492889404, |
| "step": 1240, |
| "valid_targets_mean": 2555.5, |
| "valid_targets_min": 1347 |
| }, |
| { |
| "epoch": 1.985645933014354, |
| "grad_norm": 0.5424225434810162, |
| "learning_rate": 3.6038945054973334e-05, |
| "loss": 0.2151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21529079973697662, |
| "step": 1245, |
| "valid_targets_mean": 3182.9, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 1.9936204146730463, |
| "grad_norm": 0.5309854104241837, |
| "learning_rate": 3.599130516275266e-05, |
| "loss": 0.2126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21649429202079773, |
| "step": 1250, |
| "valid_targets_mean": 2814.7, |
| "valid_targets_min": 976 |
| }, |
| { |
| "epoch": 2.0015948963317385, |
| "grad_norm": 0.6830016071881365, |
| "learning_rate": 3.594341238213618e-05, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2428247332572937, |
| "step": 1255, |
| "valid_targets_mean": 2230.6, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 2.0095693779904304, |
| "grad_norm": 0.583613177123442, |
| "learning_rate": 3.589526747050601e-05, |
| "loss": 0.1952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1945180892944336, |
| "step": 1260, |
| "valid_targets_mean": 2468.8, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 2.017543859649123, |
| "grad_norm": 0.5249288021444334, |
| "learning_rate": 3.584687118923149e-05, |
| "loss": 0.1905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1898598074913025, |
| "step": 1265, |
| "valid_targets_mean": 2771.9, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 2.025518341307815, |
| "grad_norm": 0.6525341636876454, |
| "learning_rate": 3.579822430365714e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22228668630123138, |
| "step": 1270, |
| "valid_targets_mean": 3191.8, |
| "valid_targets_min": 1374 |
| }, |
| { |
| "epoch": 2.0334928229665072, |
| "grad_norm": 0.5729538709639772, |
| "learning_rate": 3.57493275830906e-05, |
| "loss": 0.1909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17011548578739166, |
| "step": 1275, |
| "valid_targets_mean": 2719.9, |
| "valid_targets_min": 1164 |
| }, |
| { |
| "epoch": 2.041467304625199, |
| "grad_norm": 0.5358768215183619, |
| "learning_rate": 3.570018180079037e-05, |
| "loss": 0.185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21794959902763367, |
| "step": 1280, |
| "valid_targets_mean": 3458.1, |
| "valid_targets_min": 1452 |
| }, |
| { |
| "epoch": 2.0494417862838916, |
| "grad_norm": 1.025831647271483, |
| "learning_rate": 3.5650787733953715e-05, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16724932193756104, |
| "step": 1285, |
| "valid_targets_mean": 2740.6, |
| "valid_targets_min": 1379 |
| }, |
| { |
| "epoch": 2.0574162679425836, |
| "grad_norm": 0.5249612579847214, |
| "learning_rate": 3.560114616370425e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21160989999771118, |
| "step": 1290, |
| "valid_targets_mean": 3251.8, |
| "valid_targets_min": 1721 |
| }, |
| { |
| "epoch": 2.065390749601276, |
| "grad_norm": 0.5644105309104152, |
| "learning_rate": 3.555125787507964e-05, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19360047578811646, |
| "step": 1295, |
| "valid_targets_mean": 2911.9, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 2.073365231259968, |
| "grad_norm": 0.5815407495575634, |
| "learning_rate": 3.550112365701921e-05, |
| "loss": 0.2272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2966446280479431, |
| "step": 1300, |
| "valid_targets_mean": 3293.7, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 2.0813397129186604, |
| "grad_norm": 0.5385897882404551, |
| "learning_rate": 3.545074430235142e-05, |
| "loss": 0.21, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22409307956695557, |
| "step": 1305, |
| "valid_targets_mean": 3228.1, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 2.0893141945773523, |
| "grad_norm": 0.5692012223049029, |
| "learning_rate": 3.540012060778137e-05, |
| "loss": 0.18, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15392714738845825, |
| "step": 1310, |
| "valid_targets_mean": 2260.0, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 2.0972886762360448, |
| "grad_norm": 0.5300644084507816, |
| "learning_rate": 3.534925337387816e-05, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24721625447273254, |
| "step": 1315, |
| "valid_targets_mean": 3622.4, |
| "valid_targets_min": 1160 |
| }, |
| { |
| "epoch": 2.1052631578947367, |
| "grad_norm": 0.5647284692712146, |
| "learning_rate": 3.529814340506226e-05, |
| "loss": 0.2017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20379406213760376, |
| "step": 1320, |
| "valid_targets_mean": 3280.3, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 2.113237639553429, |
| "grad_norm": 0.558965345583107, |
| "learning_rate": 3.524679150959277e-05, |
| "loss": 0.2158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17460405826568604, |
| "step": 1325, |
| "valid_targets_mean": 2684.2, |
| "valid_targets_min": 1067 |
| }, |
| { |
| "epoch": 2.121212121212121, |
| "grad_norm": 0.5955047163911827, |
| "learning_rate": 3.519519849955466e-05, |
| "loss": 0.2073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1885492503643036, |
| "step": 1330, |
| "valid_targets_mean": 3299.5, |
| "valid_targets_min": 1561 |
| }, |
| { |
| "epoch": 2.1291866028708135, |
| "grad_norm": 0.4966909790003643, |
| "learning_rate": 3.514336519084591e-05, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18052926659584045, |
| "step": 1335, |
| "valid_targets_mean": 3317.4, |
| "valid_targets_min": 1262 |
| }, |
| { |
| "epoch": 2.1371610845295055, |
| "grad_norm": 0.5299411406686442, |
| "learning_rate": 3.509129240316461e-05, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2125854790210724, |
| "step": 1340, |
| "valid_targets_mean": 3120.4, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 2.145135566188198, |
| "grad_norm": 0.5800308757617607, |
| "learning_rate": 3.5038980959995985e-05, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.263176828622818, |
| "step": 1345, |
| "valid_targets_mean": 3585.3, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 2.15311004784689, |
| "grad_norm": 0.5999009997718916, |
| "learning_rate": 3.498643168859941e-05, |
| "loss": 0.2003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20120833814144135, |
| "step": 1350, |
| "valid_targets_mean": 2516.6, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 2.1610845295055823, |
| "grad_norm": 0.48961821808382117, |
| "learning_rate": 3.493364541999529e-05, |
| "loss": 0.2146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18192213773727417, |
| "step": 1355, |
| "valid_targets_mean": 3155.0, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 2.1690590111642742, |
| "grad_norm": 0.6849100630435138, |
| "learning_rate": 3.488062298895194e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18514913320541382, |
| "step": 1360, |
| "valid_targets_mean": 2309.5, |
| "valid_targets_min": 894 |
| }, |
| { |
| "epoch": 2.1770334928229667, |
| "grad_norm": 0.5344472039018315, |
| "learning_rate": 3.482736523397237e-05, |
| "loss": 0.1968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1777096837759018, |
| "step": 1365, |
| "valid_targets_mean": 2620.4, |
| "valid_targets_min": 1172 |
| }, |
| { |
| "epoch": 2.1850079744816586, |
| "grad_norm": 0.5312536211636795, |
| "learning_rate": 3.4773872997281026e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2192026972770691, |
| "step": 1370, |
| "valid_targets_mean": 3280.9, |
| "valid_targets_min": 1436 |
| }, |
| { |
| "epoch": 2.192982456140351, |
| "grad_norm": 0.5286821474310076, |
| "learning_rate": 3.472014712481048e-05, |
| "loss": 0.2016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19956275820732117, |
| "step": 1375, |
| "valid_targets_mean": 3385.3, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 2.200956937799043, |
| "grad_norm": 0.5500060285804033, |
| "learning_rate": 3.466618846618806e-05, |
| "loss": 0.2139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18642191588878632, |
| "step": 1380, |
| "valid_targets_mean": 2684.4, |
| "valid_targets_min": 1302 |
| }, |
| { |
| "epoch": 2.2089314194577354, |
| "grad_norm": 0.5352427652804307, |
| "learning_rate": 3.461199787472238e-05, |
| "loss": 0.1931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18637782335281372, |
| "step": 1385, |
| "valid_targets_mean": 3044.4, |
| "valid_targets_min": 986 |
| }, |
| { |
| "epoch": 2.2169059011164274, |
| "grad_norm": 0.5447384914029251, |
| "learning_rate": 3.455757620738989e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18728208541870117, |
| "step": 1390, |
| "valid_targets_mean": 3003.2, |
| "valid_targets_min": 1236 |
| }, |
| { |
| "epoch": 2.22488038277512, |
| "grad_norm": 0.5717238697325798, |
| "learning_rate": 3.450292432482127e-05, |
| "loss": 0.2048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2106652557849884, |
| "step": 1395, |
| "valid_targets_mean": 2633.9, |
| "valid_targets_min": 1250 |
| }, |
| { |
| "epoch": 2.2328548644338118, |
| "grad_norm": 0.6406144106784887, |
| "learning_rate": 3.444804309128789e-05, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2285759598016739, |
| "step": 1400, |
| "valid_targets_mean": 3575.9, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 2.240829346092504, |
| "grad_norm": 0.47144056813631574, |
| "learning_rate": 3.439293337468808e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1521637737751007, |
| "step": 1405, |
| "valid_targets_mean": 2935.6, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 2.248803827751196, |
| "grad_norm": 0.5527496205056719, |
| "learning_rate": 3.4337596046533426e-05, |
| "loss": 0.2284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2488706111907959, |
| "step": 1410, |
| "valid_targets_mean": 3477.2, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 2.2567783094098885, |
| "grad_norm": 0.508828813177984, |
| "learning_rate": 3.4282031981935e-05, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2234359085559845, |
| "step": 1415, |
| "valid_targets_mean": 3965.8, |
| "valid_targets_min": 1125 |
| }, |
| { |
| "epoch": 2.2647527910685805, |
| "grad_norm": 0.5695739787713568, |
| "learning_rate": 3.42262420595895e-05, |
| "loss": 0.1895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24366150796413422, |
| "step": 1420, |
| "valid_targets_mean": 3077.3, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 2.2727272727272725, |
| "grad_norm": 0.5998788145463537, |
| "learning_rate": 3.417022716176539e-05, |
| "loss": 0.2166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2406616061925888, |
| "step": 1425, |
| "valid_targets_mean": 2459.1, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 2.280701754385965, |
| "grad_norm": 0.5743859087966089, |
| "learning_rate": 3.411398817428889e-05, |
| "loss": 0.1926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17860084772109985, |
| "step": 1430, |
| "valid_targets_mean": 2430.9, |
| "valid_targets_min": 1288 |
| }, |
| { |
| "epoch": 2.2886762360446573, |
| "grad_norm": 0.5291060692515646, |
| "learning_rate": 3.4057525986530016e-05, |
| "loss": 0.1989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2760910391807556, |
| "step": 1435, |
| "valid_targets_mean": 4081.8, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 2.2966507177033493, |
| "grad_norm": 0.4928425236453258, |
| "learning_rate": 3.400084149138851e-05, |
| "loss": 0.2057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20123213529586792, |
| "step": 1440, |
| "valid_targets_mean": 3745.3, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 2.3046251993620412, |
| "grad_norm": 0.5186264077191272, |
| "learning_rate": 3.394393558527969e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1761550009250641, |
| "step": 1445, |
| "valid_targets_mean": 3007.8, |
| "valid_targets_min": 1280 |
| }, |
| { |
| "epoch": 2.3125996810207337, |
| "grad_norm": 0.587444586310813, |
| "learning_rate": 3.388680916812031e-05, |
| "loss": 0.1857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16212230920791626, |
| "step": 1450, |
| "valid_targets_mean": 2444.2, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 2.320574162679426, |
| "grad_norm": 0.5679214383824454, |
| "learning_rate": 3.382946314331429e-05, |
| "loss": 0.2167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2232741117477417, |
| "step": 1455, |
| "valid_targets_mean": 2940.7, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 2.328548644338118, |
| "grad_norm": 0.7826501249243136, |
| "learning_rate": 3.377189841773848e-05, |
| "loss": 0.1887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25218990445137024, |
| "step": 1460, |
| "valid_targets_mean": 2453.1, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 2.33652312599681, |
| "grad_norm": 0.5876238136730855, |
| "learning_rate": 3.371411590172827e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17968472838401794, |
| "step": 1465, |
| "valid_targets_mean": 2336.6, |
| "valid_targets_min": 1328 |
| }, |
| { |
| "epoch": 2.3444976076555024, |
| "grad_norm": 0.8075832611828215, |
| "learning_rate": 3.365611650906321e-05, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1817243993282318, |
| "step": 1470, |
| "valid_targets_mean": 2379.7, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 2.352472089314195, |
| "grad_norm": 0.5509881788274565, |
| "learning_rate": 3.359790115695259e-05, |
| "loss": 0.2206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22982379794120789, |
| "step": 1475, |
| "valid_targets_mean": 3067.1, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 2.360446570972887, |
| "grad_norm": 0.5056847617580823, |
| "learning_rate": 3.353947076602088e-05, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1958909034729004, |
| "step": 1480, |
| "valid_targets_mean": 3523.2, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 2.3684210526315788, |
| "grad_norm": 0.5159845635621267, |
| "learning_rate": 3.34808262602932e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16456438601016998, |
| "step": 1485, |
| "valid_targets_mean": 3085.1, |
| "valid_targets_min": 1702 |
| }, |
| { |
| "epoch": 2.376395534290271, |
| "grad_norm": 0.5858693851449541, |
| "learning_rate": 3.342196856718074e-05, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19342803955078125, |
| "step": 1490, |
| "valid_targets_mean": 2573.2, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 2.384370015948963, |
| "grad_norm": 0.664991036812387, |
| "learning_rate": 3.336289861746602e-05, |
| "loss": 0.1909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19867199659347534, |
| "step": 1495, |
| "valid_targets_mean": 2357.4, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 2.3923444976076556, |
| "grad_norm": 1.048356992635596, |
| "learning_rate": 3.330361734528823e-05, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20687635242938995, |
| "step": 1500, |
| "valid_targets_mean": 3404.9, |
| "valid_targets_min": 1473 |
| }, |
| { |
| "epoch": 2.4003189792663475, |
| "grad_norm": 0.6470737570437413, |
| "learning_rate": 3.324412568812844e-05, |
| "loss": 0.1723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14438386261463165, |
| "step": 1505, |
| "valid_targets_mean": 1706.2, |
| "valid_targets_min": 1222 |
| }, |
| { |
| "epoch": 2.40829346092504, |
| "grad_norm": 0.5670728091943865, |
| "learning_rate": 3.318442458679477e-05, |
| "loss": 0.214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18530724942684174, |
| "step": 1510, |
| "valid_targets_mean": 2804.8, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 2.416267942583732, |
| "grad_norm": 0.5832801162625506, |
| "learning_rate": 3.312451498540751e-05, |
| "loss": 0.1739, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17289073765277863, |
| "step": 1515, |
| "valid_targets_mean": 2337.8, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 2.4242424242424243, |
| "grad_norm": 0.5933227626430476, |
| "learning_rate": 3.306439783138421e-05, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16400037705898285, |
| "step": 1520, |
| "valid_targets_mean": 2690.1, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 2.4322169059011163, |
| "grad_norm": 0.5243891317529017, |
| "learning_rate": 3.3004074075424666e-05, |
| "loss": 0.1905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17849090695381165, |
| "step": 1525, |
| "valid_targets_mean": 3053.1, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 2.4401913875598087, |
| "grad_norm": 0.6178786903379436, |
| "learning_rate": 3.29435446714959e-05, |
| "loss": 0.2132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21913208067417145, |
| "step": 1530, |
| "valid_targets_mean": 3507.8, |
| "valid_targets_min": 1474 |
| }, |
| { |
| "epoch": 2.4481658692185007, |
| "grad_norm": 0.5841079747434857, |
| "learning_rate": 3.288281057681709e-05, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17646032571792603, |
| "step": 1535, |
| "valid_targets_mean": 2283.2, |
| "valid_targets_min": 1278 |
| }, |
| { |
| "epoch": 2.456140350877193, |
| "grad_norm": 0.5168606282768784, |
| "learning_rate": 3.28218727518444e-05, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15758445858955383, |
| "step": 1540, |
| "valid_targets_mean": 3063.2, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 2.464114832535885, |
| "grad_norm": 0.6165157331403959, |
| "learning_rate": 3.2760732160255835e-05, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21482142806053162, |
| "step": 1545, |
| "valid_targets_mean": 2569.4, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 2.4720893141945774, |
| "grad_norm": 0.5845544905089886, |
| "learning_rate": 3.269938976893595e-05, |
| "loss": 0.1865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21223688125610352, |
| "step": 1550, |
| "valid_targets_mean": 2661.5, |
| "valid_targets_min": 1040 |
| }, |
| { |
| "epoch": 2.4800637958532694, |
| "grad_norm": 0.6284605565912317, |
| "learning_rate": 3.2637846547960596e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17033833265304565, |
| "step": 1555, |
| "valid_targets_mean": 2224.4, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 2.488038277511962, |
| "grad_norm": 0.7490821757292555, |
| "learning_rate": 3.2576103470581564e-05, |
| "loss": 0.202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31501030921936035, |
| "step": 1560, |
| "valid_targets_mean": 3381.4, |
| "valid_targets_min": 1226 |
| }, |
| { |
| "epoch": 2.496012759170654, |
| "grad_norm": 0.5814501383804671, |
| "learning_rate": 3.25141615132112e-05, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19716112315654755, |
| "step": 1565, |
| "valid_targets_mean": 2829.0, |
| "valid_targets_min": 1113 |
| }, |
| { |
| "epoch": 2.503987240829346, |
| "grad_norm": 0.5136642074516043, |
| "learning_rate": 3.245202165540697e-05, |
| "loss": 0.1924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19882862269878387, |
| "step": 1570, |
| "valid_targets_mean": 3679.9, |
| "valid_targets_min": 1278 |
| }, |
| { |
| "epoch": 2.511961722488038, |
| "grad_norm": 0.5440586455353177, |
| "learning_rate": 3.238968487985594e-05, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19790814816951752, |
| "step": 1575, |
| "valid_targets_mean": 2993.3, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 2.5199362041467306, |
| "grad_norm": 0.5929188884939683, |
| "learning_rate": 3.232715217235927e-05, |
| "loss": 0.1938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2090296745300293, |
| "step": 1580, |
| "valid_targets_mean": 2928.6, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 2.5279106858054226, |
| "grad_norm": 0.5697340637761833, |
| "learning_rate": 3.226442452181662e-05, |
| "loss": 0.198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17136168479919434, |
| "step": 1585, |
| "valid_targets_mean": 2591.6, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 2.535885167464115, |
| "grad_norm": 0.540923625766811, |
| "learning_rate": 3.220150292021049e-05, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19687724113464355, |
| "step": 1590, |
| "valid_targets_mean": 3221.6, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 2.543859649122807, |
| "grad_norm": 0.5767857398726057, |
| "learning_rate": 3.213838836259055e-05, |
| "loss": 0.1762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19307035207748413, |
| "step": 1595, |
| "valid_targets_mean": 2589.1, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 2.5518341307814993, |
| "grad_norm": 0.5166304301744661, |
| "learning_rate": 3.2075081847057886e-05, |
| "loss": 0.212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20582881569862366, |
| "step": 1600, |
| "valid_targets_mean": 3190.3, |
| "valid_targets_min": 1186 |
| }, |
| { |
| "epoch": 2.5598086124401913, |
| "grad_norm": 0.5911901543387457, |
| "learning_rate": 3.201158437474925e-05, |
| "loss": 0.2124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24600306153297424, |
| "step": 1605, |
| "valid_targets_mean": 2878.9, |
| "valid_targets_min": 961 |
| }, |
| { |
| "epoch": 2.5677830940988837, |
| "grad_norm": 0.5694511504999716, |
| "learning_rate": 3.194789694982119e-05, |
| "loss": 0.1671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15048804879188538, |
| "step": 1610, |
| "valid_targets_mean": 2276.8, |
| "valid_targets_min": 1519 |
| }, |
| { |
| "epoch": 2.5757575757575757, |
| "grad_norm": 0.5872429136127384, |
| "learning_rate": 3.1884020579434216e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1900998055934906, |
| "step": 1615, |
| "valid_targets_mean": 2539.7, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 2.583732057416268, |
| "grad_norm": 0.6141904777771472, |
| "learning_rate": 3.181995627373679e-05, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16003698110580444, |
| "step": 1620, |
| "valid_targets_mean": 1980.6, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 2.59170653907496, |
| "grad_norm": 0.5646234400091081, |
| "learning_rate": 3.1755705045849465e-05, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15863600373268127, |
| "step": 1625, |
| "valid_targets_mean": 2413.1, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 2.5996810207336525, |
| "grad_norm": 0.5748907862112433, |
| "learning_rate": 3.1691267911848765e-05, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23583777248859406, |
| "step": 1630, |
| "valid_targets_mean": 3131.8, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 2.6076555023923444, |
| "grad_norm": 0.5379326811898751, |
| "learning_rate": 3.1626645890751167e-05, |
| "loss": 0.1938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16717740893363953, |
| "step": 1635, |
| "valid_targets_mean": 2830.4, |
| "valid_targets_min": 1309 |
| }, |
| { |
| "epoch": 2.6156299840510364, |
| "grad_norm": 0.5334708951980555, |
| "learning_rate": 3.156184000449697e-05, |
| "loss": 0.1954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16978397965431213, |
| "step": 1640, |
| "valid_targets_mean": 2473.9, |
| "valid_targets_min": 1083 |
| }, |
| { |
| "epoch": 2.623604465709729, |
| "grad_norm": 0.6318420574052661, |
| "learning_rate": 3.149685127793415e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17268671095371246, |
| "step": 1645, |
| "valid_targets_mean": 2450.8, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 2.6315789473684212, |
| "grad_norm": 0.5308821935515915, |
| "learning_rate": 3.143168073880214e-05, |
| "loss": 0.2063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21769240498542786, |
| "step": 1650, |
| "valid_targets_mean": 3183.6, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 2.639553429027113, |
| "grad_norm": 0.6278883319373487, |
| "learning_rate": 3.1366329417715556e-05, |
| "loss": 0.1821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14011511206626892, |
| "step": 1655, |
| "valid_targets_mean": 1544.2, |
| "valid_targets_min": 986 |
| }, |
| { |
| "epoch": 2.647527910685805, |
| "grad_norm": 0.5913767520819432, |
| "learning_rate": 3.1300798348147954e-05, |
| "loss": 0.1871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17621494829654694, |
| "step": 1660, |
| "valid_targets_mean": 2409.2, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 2.6555023923444976, |
| "grad_norm": 0.5708954991838666, |
| "learning_rate": 3.123508856641542e-05, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20209786295890808, |
| "step": 1665, |
| "valid_targets_mean": 3007.8, |
| "valid_targets_min": 1544 |
| }, |
| { |
| "epoch": 2.66347687400319, |
| "grad_norm": 0.6239083317789432, |
| "learning_rate": 3.116920111166025e-05, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14001812040805817, |
| "step": 1670, |
| "valid_targets_mean": 2042.8, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 2.671451355661882, |
| "grad_norm": 0.5555429521600216, |
| "learning_rate": 3.1103137025834456e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1607971489429474, |
| "step": 1675, |
| "valid_targets_mean": 2579.4, |
| "valid_targets_min": 1481 |
| }, |
| { |
| "epoch": 2.679425837320574, |
| "grad_norm": 0.5911984658901864, |
| "learning_rate": 3.103689735368333e-05, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1880512535572052, |
| "step": 1680, |
| "valid_targets_mean": 2316.4, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 2.6874003189792663, |
| "grad_norm": 0.5568950096417259, |
| "learning_rate": 3.097048314272889e-05, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14909867942333221, |
| "step": 1685, |
| "valid_targets_mean": 2620.3, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 2.6953748006379588, |
| "grad_norm": 0.5605104059179533, |
| "learning_rate": 3.090389544325335e-05, |
| "loss": 0.1887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19391119480133057, |
| "step": 1690, |
| "valid_targets_mean": 3403.4, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 2.7033492822966507, |
| "grad_norm": 0.5940720122887997, |
| "learning_rate": 3.08371353082825e-05, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21021555364131927, |
| "step": 1695, |
| "valid_targets_mean": 2653.8, |
| "valid_targets_min": 1347 |
| }, |
| { |
| "epoch": 2.7113237639553427, |
| "grad_norm": 0.5279976704245198, |
| "learning_rate": 3.0770203793568994e-05, |
| "loss": 0.2179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20088006556034088, |
| "step": 1700, |
| "valid_targets_mean": 3224.9, |
| "valid_targets_min": 1552 |
| }, |
| { |
| "epoch": 2.719298245614035, |
| "grad_norm": 0.5728810440642814, |
| "learning_rate": 3.0703101957575765e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16884160041809082, |
| "step": 1705, |
| "valid_targets_mean": 2506.7, |
| "valid_targets_min": 1038 |
| }, |
| { |
| "epoch": 2.7272727272727275, |
| "grad_norm": 0.5630970898895722, |
| "learning_rate": 3.0635830861459204e-05, |
| "loss": 0.2041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.201943039894104, |
| "step": 1710, |
| "valid_targets_mean": 3317.2, |
| "valid_targets_min": 1394 |
| }, |
| { |
| "epoch": 2.7352472089314195, |
| "grad_norm": 0.5401867778634583, |
| "learning_rate": 3.056839156905239e-05, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17215926945209503, |
| "step": 1715, |
| "valid_targets_mean": 2514.6, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 2.7432216905901115, |
| "grad_norm": 0.7680039863293809, |
| "learning_rate": 3.0500785146848303e-05, |
| "loss": 0.1897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1482524424791336, |
| "step": 1720, |
| "valid_targets_mean": 2329.0, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 2.751196172248804, |
| "grad_norm": 0.5728974492985291, |
| "learning_rate": 3.04330126639829e-05, |
| "loss": 0.2008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15376368165016174, |
| "step": 1725, |
| "valid_targets_mean": 2507.7, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 2.7591706539074963, |
| "grad_norm": 0.5664221776878716, |
| "learning_rate": 3.0365075192218278e-05, |
| "loss": 0.1836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1676475703716278, |
| "step": 1730, |
| "valid_targets_mean": 2541.6, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 2.7671451355661882, |
| "grad_norm": 0.5049114348515064, |
| "learning_rate": 3.0296973805925663e-05, |
| "loss": 0.1852, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18172882497310638, |
| "step": 1735, |
| "valid_targets_mean": 3568.7, |
| "valid_targets_min": 1451 |
| }, |
| { |
| "epoch": 2.77511961722488, |
| "grad_norm": 0.5614918409668362, |
| "learning_rate": 3.022870958206845e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18978315591812134, |
| "step": 1740, |
| "valid_targets_mean": 2648.4, |
| "valid_targets_min": 1236 |
| }, |
| { |
| "epoch": 2.7830940988835726, |
| "grad_norm": 0.5542031035808245, |
| "learning_rate": 3.0160283600185168e-05, |
| "loss": 0.1731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1841156929731369, |
| "step": 1745, |
| "valid_targets_mean": 3271.1, |
| "valid_targets_min": 1346 |
| }, |
| { |
| "epoch": 2.7910685805422646, |
| "grad_norm": 0.568674574848384, |
| "learning_rate": 3.0091696942372412e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22050027549266815, |
| "step": 1750, |
| "valid_targets_mean": 2670.2, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 2.799043062200957, |
| "grad_norm": 0.5643138963885681, |
| "learning_rate": 3.002295069326772e-05, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18906863033771515, |
| "step": 1755, |
| "valid_targets_mean": 2565.9, |
| "valid_targets_min": 1377 |
| }, |
| { |
| "epoch": 2.807017543859649, |
| "grad_norm": 0.6646069591582359, |
| "learning_rate": 2.9954045940032423e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23465055227279663, |
| "step": 1760, |
| "valid_targets_mean": 3034.7, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 2.8149920255183414, |
| "grad_norm": 0.5196774748614063, |
| "learning_rate": 2.988498377233446e-05, |
| "loss": 0.1892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2014995664358139, |
| "step": 1765, |
| "valid_targets_mean": 3231.3, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 2.8229665071770333, |
| "grad_norm": 0.5502942878993454, |
| "learning_rate": 2.981576528233114e-05, |
| "loss": 0.1926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2188304364681244, |
| "step": 1770, |
| "valid_targets_mean": 3371.0, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 2.8309409888357258, |
| "grad_norm": 0.5425762676905854, |
| "learning_rate": 2.9746391564651867e-05, |
| "loss": 0.1713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14157424867153168, |
| "step": 1775, |
| "valid_targets_mean": 2150.8, |
| "valid_targets_min": 1266 |
| }, |
| { |
| "epoch": 2.8389154704944177, |
| "grad_norm": 0.6014818751525163, |
| "learning_rate": 2.9676863716380845e-05, |
| "loss": 0.201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1941225528717041, |
| "step": 1780, |
| "valid_targets_mean": 4106.5, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 2.84688995215311, |
| "grad_norm": 0.5538284681110416, |
| "learning_rate": 2.9607182837039697e-05, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16050055623054504, |
| "step": 1785, |
| "valid_targets_mean": 2549.5, |
| "valid_targets_min": 1034 |
| }, |
| { |
| "epoch": 2.854864433811802, |
| "grad_norm": 0.6724791781520713, |
| "learning_rate": 2.9537350028570126e-05, |
| "loss": 0.2148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23556634783744812, |
| "step": 1790, |
| "valid_targets_mean": 2610.4, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 2.8628389154704945, |
| "grad_norm": 0.5282103567404306, |
| "learning_rate": 2.946736639531643e-05, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19032198190689087, |
| "step": 1795, |
| "valid_targets_mean": 3423.3, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 2.8708133971291865, |
| "grad_norm": 0.5343948181525061, |
| "learning_rate": 2.9397233044008092e-05, |
| "loss": 0.1815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16319958865642548, |
| "step": 1800, |
| "valid_targets_mean": 2711.1, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 2.878787878787879, |
| "grad_norm": 0.6069494403984073, |
| "learning_rate": 2.9326951083742243e-05, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15907859802246094, |
| "step": 1805, |
| "valid_targets_mean": 2519.6, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 2.886762360446571, |
| "grad_norm": 0.5831177287355487, |
| "learning_rate": 2.925652162596613e-05, |
| "loss": 0.1946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22586268186569214, |
| "step": 1810, |
| "valid_targets_mean": 3239.4, |
| "valid_targets_min": 1232 |
| }, |
| { |
| "epoch": 2.8947368421052633, |
| "grad_norm": 0.5605548506235492, |
| "learning_rate": 2.9185945784459558e-05, |
| "loss": 0.1812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17734205722808838, |
| "step": 1815, |
| "valid_targets_mean": 2670.1, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 2.9027113237639552, |
| "grad_norm": 0.6194121532589498, |
| "learning_rate": 2.9115224675317252e-05, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17597773671150208, |
| "step": 1820, |
| "valid_targets_mean": 1934.1, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 2.9106858054226477, |
| "grad_norm": 0.5784067931656794, |
| "learning_rate": 2.9044359416931206e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2120431363582611, |
| "step": 1825, |
| "valid_targets_mean": 3082.4, |
| "valid_targets_min": 894 |
| }, |
| { |
| "epoch": 2.9186602870813396, |
| "grad_norm": 0.5518771187801405, |
| "learning_rate": 2.897335112997302e-05, |
| "loss": 0.2055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2005378007888794, |
| "step": 1830, |
| "valid_targets_mean": 2880.1, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 2.926634768740032, |
| "grad_norm": 0.48456097909556345, |
| "learning_rate": 2.8902200937376173e-05, |
| "loss": 0.1823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15114593505859375, |
| "step": 1835, |
| "valid_targets_mean": 3304.1, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 2.934609250398724, |
| "grad_norm": 0.568638742445266, |
| "learning_rate": 2.8830909964318242e-05, |
| "loss": 0.2012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.197839617729187, |
| "step": 1840, |
| "valid_targets_mean": 3082.9, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 2.9425837320574164, |
| "grad_norm": 0.6009143002900112, |
| "learning_rate": 2.875947933820312e-05, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21282166242599487, |
| "step": 1845, |
| "valid_targets_mean": 2744.5, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 2.9505582137161084, |
| "grad_norm": 0.5835820573311307, |
| "learning_rate": 2.868791018864321e-05, |
| "loss": 0.1913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23180079460144043, |
| "step": 1850, |
| "valid_targets_mean": 3296.6, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 2.958532695374801, |
| "grad_norm": 0.5403850798020928, |
| "learning_rate": 2.861620364744151e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2239145040512085, |
| "step": 1855, |
| "valid_targets_mean": 3232.8, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 2.9665071770334928, |
| "grad_norm": 0.5471992005694861, |
| "learning_rate": 2.854436084857379e-05, |
| "loss": 0.2042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20272240042686462, |
| "step": 1860, |
| "valid_targets_mean": 2604.9, |
| "valid_targets_min": 1635 |
| }, |
| { |
| "epoch": 2.974481658692185, |
| "grad_norm": 0.5866640715776678, |
| "learning_rate": 2.847238292817057e-05, |
| "loss": 0.1913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20167194306850433, |
| "step": 1865, |
| "valid_targets_mean": 2490.1, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 2.982456140350877, |
| "grad_norm": 0.5904315155737803, |
| "learning_rate": 2.8400271024499212e-05, |
| "loss": 0.1692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18105053901672363, |
| "step": 1870, |
| "valid_targets_mean": 2653.9, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 2.990430622009569, |
| "grad_norm": 0.5667528402230967, |
| "learning_rate": 2.832802627794593e-05, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22661757469177246, |
| "step": 1875, |
| "valid_targets_mean": 3706.2, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 2.9984051036682615, |
| "grad_norm": 0.6009440796314518, |
| "learning_rate": 2.8255649830997704e-05, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20299099385738373, |
| "step": 1880, |
| "valid_targets_mean": 3680.2, |
| "valid_targets_min": 961 |
| }, |
| { |
| "epoch": 3.006379585326954, |
| "grad_norm": 0.6099874287063509, |
| "learning_rate": 2.8183142828224238e-05, |
| "loss": 0.1726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1845843642950058, |
| "step": 1885, |
| "valid_targets_mean": 2441.4, |
| "valid_targets_min": 1443 |
| }, |
| { |
| "epoch": 3.014354066985646, |
| "grad_norm": 0.6051159039153519, |
| "learning_rate": 2.811050641625988e-05, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18158197402954102, |
| "step": 1890, |
| "valid_targets_mean": 2382.5, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 3.0223285486443383, |
| "grad_norm": 0.5721617590448416, |
| "learning_rate": 2.8037741743785458e-05, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16156092286109924, |
| "step": 1895, |
| "valid_targets_mean": 2683.9, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 3.0303030303030303, |
| "grad_norm": 0.5865329434183887, |
| "learning_rate": 2.796484996151013e-05, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11619686335325241, |
| "step": 1900, |
| "valid_targets_mean": 2044.0, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 3.0382775119617227, |
| "grad_norm": 0.5737857689212434, |
| "learning_rate": 2.7891832222153188e-05, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1338677853345871, |
| "step": 1905, |
| "valid_targets_mean": 2470.9, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 3.0462519936204147, |
| "grad_norm": 0.5108539805469473, |
| "learning_rate": 2.7818689680425807e-05, |
| "loss": 0.1816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17531079053878784, |
| "step": 1910, |
| "valid_targets_mean": 3671.6, |
| "valid_targets_min": 1240 |
| }, |
| { |
| "epoch": 3.054226475279107, |
| "grad_norm": 0.5556796605107793, |
| "learning_rate": 2.7745423493012827e-05, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18171335756778717, |
| "step": 1915, |
| "valid_targets_mean": 2726.2, |
| "valid_targets_min": 961 |
| }, |
| { |
| "epoch": 3.062200956937799, |
| "grad_norm": 0.6178579891937267, |
| "learning_rate": 2.767203481855441e-05, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18336257338523865, |
| "step": 1920, |
| "valid_targets_mean": 2685.5, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 3.0701754385964914, |
| "grad_norm": 0.5854283357456007, |
| "learning_rate": 2.7598524817627764e-05, |
| "loss": 0.1931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19227474927902222, |
| "step": 1925, |
| "valid_targets_mean": 2520.4, |
| "valid_targets_min": 1045 |
| }, |
| { |
| "epoch": 3.0781499202551834, |
| "grad_norm": 0.49625404123998523, |
| "learning_rate": 2.7524894652728754e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19637757539749146, |
| "step": 1930, |
| "valid_targets_mean": 4134.2, |
| "valid_targets_min": 1222 |
| }, |
| { |
| "epoch": 3.0861244019138754, |
| "grad_norm": 0.5676068839717044, |
| "learning_rate": 2.7451145488253544e-05, |
| "loss": 0.1962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22619007527828217, |
| "step": 1935, |
| "valid_targets_mean": 3551.0, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 3.094098883572568, |
| "grad_norm": 0.7692746963023798, |
| "learning_rate": 2.7377278490480157e-05, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17253446578979492, |
| "step": 1940, |
| "valid_targets_mean": 3062.4, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 3.1020733652312598, |
| "grad_norm": 0.5526740615386009, |
| "learning_rate": 2.730329482755006e-05, |
| "loss": 0.1623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20209446549415588, |
| "step": 1945, |
| "valid_targets_mean": 2935.2, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 3.110047846889952, |
| "grad_norm": 0.5510587896491016, |
| "learning_rate": 2.7229195669449667e-05, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1594051718711853, |
| "step": 1950, |
| "valid_targets_mean": 3520.5, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 3.118022328548644, |
| "grad_norm": 0.6250742491422023, |
| "learning_rate": 2.7154982187991855e-05, |
| "loss": 0.2154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2715832591056824, |
| "step": 1955, |
| "valid_targets_mean": 3909.7, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 3.1259968102073366, |
| "grad_norm": 0.5920653083228358, |
| "learning_rate": 2.7080655556797406e-05, |
| "loss": 0.1904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26988518238067627, |
| "step": 1960, |
| "valid_targets_mean": 3452.6, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 3.1339712918660285, |
| "grad_norm": 0.5388774310856131, |
| "learning_rate": 2.700621695127649e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15851232409477234, |
| "step": 1965, |
| "valid_targets_mean": 2872.0, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 3.141945773524721, |
| "grad_norm": 0.6691557242877121, |
| "learning_rate": 2.693166754861003e-05, |
| "loss": 0.1857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2240079641342163, |
| "step": 1970, |
| "valid_targets_mean": 2786.1, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 3.149920255183413, |
| "grad_norm": 0.6366719433898753, |
| "learning_rate": 2.685700852773113e-05, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19620132446289062, |
| "step": 1975, |
| "valid_targets_mean": 2583.2, |
| "valid_targets_min": 1304 |
| }, |
| { |
| "epoch": 3.1578947368421053, |
| "grad_norm": 0.5928192806363577, |
| "learning_rate": 2.6782241069306395e-05, |
| "loss": 0.1782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.186061292886734, |
| "step": 1980, |
| "valid_targets_mean": 2680.7, |
| "valid_targets_min": 1416 |
| }, |
| { |
| "epoch": 3.1658692185007973, |
| "grad_norm": 0.5855724054324057, |
| "learning_rate": 2.6707366355717268e-05, |
| "loss": 0.1733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21362203359603882, |
| "step": 1985, |
| "valid_targets_mean": 2905.8, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 3.1738437001594897, |
| "grad_norm": 0.6347489114308262, |
| "learning_rate": 2.663238557104136e-05, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1517581045627594, |
| "step": 1990, |
| "valid_targets_mean": 2070.0, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 3.1818181818181817, |
| "grad_norm": 0.5635841038270237, |
| "learning_rate": 2.655729990103368e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1979377269744873, |
| "step": 1995, |
| "valid_targets_mean": 2958.0, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 3.189792663476874, |
| "grad_norm": 0.5945458950462633, |
| "learning_rate": 2.648211053310792e-05, |
| "loss": 0.1708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15361088514328003, |
| "step": 2000, |
| "valid_targets_mean": 2395.7, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 3.197767145135566, |
| "grad_norm": 0.6299192799682408, |
| "learning_rate": 2.6406818656317654e-05, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15608029067516327, |
| "step": 2005, |
| "valid_targets_mean": 2129.3, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 3.2057416267942584, |
| "grad_norm": 0.6201929767056361, |
| "learning_rate": 2.6331425461337557e-05, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19049637019634247, |
| "step": 2010, |
| "valid_targets_mean": 2675.4, |
| "valid_targets_min": 1237 |
| }, |
| { |
| "epoch": 3.2137161084529504, |
| "grad_norm": 0.5993976587951823, |
| "learning_rate": 2.6255932140444546e-05, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20035934448242188, |
| "step": 2015, |
| "valid_targets_mean": 2800.6, |
| "valid_targets_min": 1342 |
| }, |
| { |
| "epoch": 3.221690590111643, |
| "grad_norm": 0.5460305244294847, |
| "learning_rate": 2.618033988749895e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17547008395195007, |
| "step": 2020, |
| "valid_targets_mean": 3045.4, |
| "valid_targets_min": 1199 |
| }, |
| { |
| "epoch": 3.229665071770335, |
| "grad_norm": 0.5515986645818807, |
| "learning_rate": 2.6104649897925622e-05, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17502939701080322, |
| "step": 2025, |
| "valid_targets_mean": 2976.9, |
| "valid_targets_min": 1040 |
| }, |
| { |
| "epoch": 3.237639553429027, |
| "grad_norm": 0.5334926575974487, |
| "learning_rate": 2.602886336869503e-05, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13687369227409363, |
| "step": 2030, |
| "valid_targets_mean": 2390.6, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 3.245614035087719, |
| "grad_norm": 0.5518442305418664, |
| "learning_rate": 2.595298149830433e-05, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16078054904937744, |
| "step": 2035, |
| "valid_targets_mean": 2902.9, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 3.2535885167464116, |
| "grad_norm": 0.5690058283856204, |
| "learning_rate": 2.5877005486758424e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18337497115135193, |
| "step": 2040, |
| "valid_targets_mean": 2966.4, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 3.2615629984051036, |
| "grad_norm": 0.497799727420445, |
| "learning_rate": 2.5800936535550954e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1807919144630432, |
| "step": 2045, |
| "valid_targets_mean": 3695.0, |
| "valid_targets_min": 1274 |
| }, |
| { |
| "epoch": 3.269537480063796, |
| "grad_norm": 0.544150458920545, |
| "learning_rate": 2.5724775847645345e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.283038467168808, |
| "step": 2050, |
| "valid_targets_mean": 3945.1, |
| "valid_targets_min": 1421 |
| }, |
| { |
| "epoch": 3.277511961722488, |
| "grad_norm": 0.4913399971466565, |
| "learning_rate": 2.5648524627455738e-05, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19701933860778809, |
| "step": 2055, |
| "valid_targets_mean": 4155.9, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 3.2854864433811803, |
| "grad_norm": 0.5691728034505411, |
| "learning_rate": 2.557218408082798e-05, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18620505928993225, |
| "step": 2060, |
| "valid_targets_mean": 2885.2, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 3.2934609250398723, |
| "grad_norm": 0.5111010875857084, |
| "learning_rate": 2.5495755415020504e-05, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1496405005455017, |
| "step": 2065, |
| "valid_targets_mean": 2963.8, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 3.3014354066985647, |
| "grad_norm": 0.5407424289252192, |
| "learning_rate": 2.5419239838685325e-05, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15042206645011902, |
| "step": 2070, |
| "valid_targets_mean": 3061.2, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 3.3094098883572567, |
| "grad_norm": 0.5973954022258182, |
| "learning_rate": 2.5342638561848817e-05, |
| "loss": 0.1869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1537877321243286, |
| "step": 2075, |
| "valid_targets_mean": 2506.9, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 3.317384370015949, |
| "grad_norm": 0.5830150859025254, |
| "learning_rate": 2.526595279589265e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1255737543106079, |
| "step": 2080, |
| "valid_targets_mean": 2168.4, |
| "valid_targets_min": 1331 |
| }, |
| { |
| "epoch": 3.325358851674641, |
| "grad_norm": 0.5136748644322553, |
| "learning_rate": 2.5189183753534634e-05, |
| "loss": 0.1728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17841193079948425, |
| "step": 2085, |
| "valid_targets_mean": 3524.8, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 3.3333333333333335, |
| "grad_norm": 0.5444148283630629, |
| "learning_rate": 2.5112332648809495e-05, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19738224148750305, |
| "step": 2090, |
| "valid_targets_mean": 3265.0, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 3.3413078149920254, |
| "grad_norm": 0.5736105889034541, |
| "learning_rate": 2.503540069704973e-05, |
| "loss": 0.1875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18508929014205933, |
| "step": 2095, |
| "valid_targets_mean": 3098.3, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 3.349282296650718, |
| "grad_norm": 0.5444972670187521, |
| "learning_rate": 2.4958389114866326e-05, |
| "loss": 0.2084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23350661993026733, |
| "step": 2100, |
| "valid_targets_mean": 3487.3, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 3.35725677830941, |
| "grad_norm": 0.607507746990593, |
| "learning_rate": 2.488129912012958e-05, |
| "loss": 0.1902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1646861582994461, |
| "step": 2105, |
| "valid_targets_mean": 2289.1, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 3.3652312599681022, |
| "grad_norm": 0.5590542729013029, |
| "learning_rate": 2.4804131931949823e-05, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1932382434606552, |
| "step": 2110, |
| "valid_targets_mean": 3424.1, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 3.373205741626794, |
| "grad_norm": 0.5792226727709087, |
| "learning_rate": 2.4726888770658103e-05, |
| "loss": 0.1645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1489265263080597, |
| "step": 2115, |
| "valid_targets_mean": 2261.2, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 3.3811802232854866, |
| "grad_norm": 0.6496431060482095, |
| "learning_rate": 2.4649570857786928e-05, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15027418732643127, |
| "step": 2120, |
| "valid_targets_mean": 2156.9, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 3.3891547049441786, |
| "grad_norm": 0.5528609427449673, |
| "learning_rate": 2.4572179416050953e-05, |
| "loss": 0.1887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16369466483592987, |
| "step": 2125, |
| "valid_targets_mean": 2808.6, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 3.397129186602871, |
| "grad_norm": 0.5312391691731903, |
| "learning_rate": 2.449471566932761e-05, |
| "loss": 0.1894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17131400108337402, |
| "step": 2130, |
| "valid_targets_mean": 3416.1, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 3.405103668261563, |
| "grad_norm": 0.6228851428878182, |
| "learning_rate": 2.4417180842637764e-05, |
| "loss": 0.176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23682790994644165, |
| "step": 2135, |
| "valid_targets_mean": 3038.9, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 3.4130781499202554, |
| "grad_norm": 0.5882304013111794, |
| "learning_rate": 2.4339576162126362e-05, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15148214995861053, |
| "step": 2140, |
| "valid_targets_mean": 2432.0, |
| "valid_targets_min": 248 |
| }, |
| { |
| "epoch": 3.4210526315789473, |
| "grad_norm": 0.5783651613849465, |
| "learning_rate": 2.4261902855043027e-05, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17573174834251404, |
| "step": 2145, |
| "valid_targets_mean": 2605.1, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 3.4290271132376393, |
| "grad_norm": 0.6002324738524472, |
| "learning_rate": 2.418416214972265e-05, |
| "loss": 0.1628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1507042646408081, |
| "step": 2150, |
| "valid_targets_mean": 1904.8, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 3.4370015948963317, |
| "grad_norm": 0.49264136447640344, |
| "learning_rate": 2.4106355275565937e-05, |
| "loss": 0.2018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1505666971206665, |
| "step": 2155, |
| "valid_targets_mean": 2797.3, |
| "valid_targets_min": 1417 |
| }, |
| { |
| "epoch": 3.444976076555024, |
| "grad_norm": 0.5621913458885389, |
| "learning_rate": 2.4028483463020053e-05, |
| "loss": 0.1813, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16950352489948273, |
| "step": 2160, |
| "valid_targets_mean": 2679.9, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 3.452950558213716, |
| "grad_norm": 0.5401249898056637, |
| "learning_rate": 2.3950547943559056e-05, |
| "loss": 0.1908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22693544626235962, |
| "step": 2165, |
| "valid_targets_mean": 3421.9, |
| "valid_targets_min": 1372 |
| }, |
| { |
| "epoch": 3.460925039872408, |
| "grad_norm": 0.6699395433332309, |
| "learning_rate": 2.3872549949664493e-05, |
| "loss": 0.185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16658160090446472, |
| "step": 2170, |
| "valid_targets_mean": 2192.9, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 3.4688995215311005, |
| "grad_norm": 0.6254529715179462, |
| "learning_rate": 2.3794490714805897e-05, |
| "loss": 0.192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.186039999127388, |
| "step": 2175, |
| "valid_targets_mean": 2131.5, |
| "valid_targets_min": 894 |
| }, |
| { |
| "epoch": 3.476874003189793, |
| "grad_norm": 0.5627992056782284, |
| "learning_rate": 2.3716371473421242e-05, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15978986024856567, |
| "step": 2180, |
| "valid_targets_mean": 2397.3, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 3.484848484848485, |
| "grad_norm": 0.5869604883871188, |
| "learning_rate": 2.36381934608975e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18033649027347565, |
| "step": 2185, |
| "valid_targets_mean": 2868.6, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 3.492822966507177, |
| "grad_norm": 0.5069371015301846, |
| "learning_rate": 2.3559957913551014e-05, |
| "loss": 0.1632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19203317165374756, |
| "step": 2190, |
| "valid_targets_mean": 4175.7, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 3.5007974481658692, |
| "grad_norm": 0.6745474518471709, |
| "learning_rate": 2.3481666068607994e-05, |
| "loss": 0.1905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18692749738693237, |
| "step": 2195, |
| "valid_targets_mean": 2161.5, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 3.5087719298245617, |
| "grad_norm": 0.5614763734838379, |
| "learning_rate": 2.3403319164184986e-05, |
| "loss": 0.1931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1870293766260147, |
| "step": 2200, |
| "valid_targets_mean": 2776.0, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 3.5167464114832536, |
| "grad_norm": 0.5970202439939211, |
| "learning_rate": 2.3324918439269206e-05, |
| "loss": 0.1943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16551634669303894, |
| "step": 2205, |
| "valid_targets_mean": 2269.2, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 3.5247208931419456, |
| "grad_norm": 0.621103572086824, |
| "learning_rate": 2.3246465133699024e-05, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16670405864715576, |
| "step": 2210, |
| "valid_targets_mean": 2442.2, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 3.532695374800638, |
| "grad_norm": 0.49934228070645226, |
| "learning_rate": 2.31679604881443e-05, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18905407190322876, |
| "step": 2215, |
| "valid_targets_mean": 3872.6, |
| "valid_targets_min": 1423 |
| }, |
| { |
| "epoch": 3.5406698564593304, |
| "grad_norm": 0.6269225467887087, |
| "learning_rate": 2.3089405744086823e-05, |
| "loss": 0.1595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16947981715202332, |
| "step": 2220, |
| "valid_targets_mean": 2441.1, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 3.5486443381180224, |
| "grad_norm": 0.5286942755540239, |
| "learning_rate": 2.3010802143800626e-05, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1366422474384308, |
| "step": 2225, |
| "valid_targets_mean": 2366.1, |
| "valid_targets_min": 1002 |
| }, |
| { |
| "epoch": 3.5566188197767143, |
| "grad_norm": 0.5109251022213953, |
| "learning_rate": 2.2932150930332363e-05, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14900361001491547, |
| "step": 2230, |
| "valid_targets_mean": 3294.4, |
| "valid_targets_min": 1424 |
| }, |
| { |
| "epoch": 3.5645933014354068, |
| "grad_norm": 0.6397212335830404, |
| "learning_rate": 2.2853453347481635e-05, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1566600203514099, |
| "step": 2235, |
| "valid_targets_mean": 2303.5, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 3.5725677830940987, |
| "grad_norm": 0.5801376421441098, |
| "learning_rate": 2.277471063978137e-05, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1630595624446869, |
| "step": 2240, |
| "valid_targets_mean": 2375.6, |
| "valid_targets_min": 1396 |
| }, |
| { |
| "epoch": 3.580542264752791, |
| "grad_norm": 0.5790198614924473, |
| "learning_rate": 2.2695924052478065e-05, |
| "loss": 0.1879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17185233533382416, |
| "step": 2245, |
| "valid_targets_mean": 2518.6, |
| "valid_targets_min": 1198 |
| }, |
| { |
| "epoch": 3.588516746411483, |
| "grad_norm": 0.5243705768816054, |
| "learning_rate": 2.2617094831512167e-05, |
| "loss": 0.196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20980407297611237, |
| "step": 2250, |
| "valid_targets_mean": 3963.8, |
| "valid_targets_min": 1345 |
| }, |
| { |
| "epoch": 3.5964912280701755, |
| "grad_norm": 0.5504953256074006, |
| "learning_rate": 2.253822422349831e-05, |
| "loss": 0.2063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18440350890159607, |
| "step": 2255, |
| "valid_targets_mean": 2997.2, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 3.6044657097288675, |
| "grad_norm": 0.5728779102295528, |
| "learning_rate": 2.2459313475705645e-05, |
| "loss": 0.1805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16484129428863525, |
| "step": 2260, |
| "valid_targets_mean": 2457.5, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 3.61244019138756, |
| "grad_norm": 0.6105030719650987, |
| "learning_rate": 2.23803638360381e-05, |
| "loss": 0.1913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16316813230514526, |
| "step": 2265, |
| "valid_targets_mean": 2532.6, |
| "valid_targets_min": 862 |
| }, |
| { |
| "epoch": 3.620414673046252, |
| "grad_norm": 0.5665339579502443, |
| "learning_rate": 2.2301376553014625e-05, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16501827538013458, |
| "step": 2270, |
| "valid_targets_mean": 2997.6, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 3.6283891547049443, |
| "grad_norm": 0.6138831066285112, |
| "learning_rate": 2.2222352875749493e-05, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19114506244659424, |
| "step": 2275, |
| "valid_targets_mean": 3209.3, |
| "valid_targets_min": 1469 |
| }, |
| { |
| "epoch": 3.6363636363636362, |
| "grad_norm": 0.4615867272467092, |
| "learning_rate": 2.214329405393249e-05, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1981082260608673, |
| "step": 2280, |
| "valid_targets_mean": 4500.8, |
| "valid_targets_min": 1297 |
| }, |
| { |
| "epoch": 3.6443381180223287, |
| "grad_norm": 0.5442457635323399, |
| "learning_rate": 2.2064201337809212e-05, |
| "loss": 0.1545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1776713728904724, |
| "step": 2285, |
| "valid_targets_mean": 3355.9, |
| "valid_targets_min": 1223 |
| }, |
| { |
| "epoch": 3.6523125996810206, |
| "grad_norm": 0.5407377473015359, |
| "learning_rate": 2.1985075978161236e-05, |
| "loss": 0.1828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15134361386299133, |
| "step": 2290, |
| "valid_targets_mean": 2769.6, |
| "valid_targets_min": 1416 |
| }, |
| { |
| "epoch": 3.660287081339713, |
| "grad_norm": 0.5905714881664845, |
| "learning_rate": 2.1905919226286385e-05, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13224008679389954, |
| "step": 2295, |
| "valid_targets_mean": 2251.6, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 3.668261562998405, |
| "grad_norm": 0.6215279831334835, |
| "learning_rate": 2.1826732333978924e-05, |
| "loss": 0.1731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22618988156318665, |
| "step": 2300, |
| "valid_targets_mean": 2626.7, |
| "valid_targets_min": 1169 |
| }, |
| { |
| "epoch": 3.6762360446570974, |
| "grad_norm": 0.5696379458737713, |
| "learning_rate": 2.1747516553509755e-05, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13785511255264282, |
| "step": 2305, |
| "valid_targets_mean": 2088.3, |
| "valid_targets_min": 1069 |
| }, |
| { |
| "epoch": 3.6842105263157894, |
| "grad_norm": 0.5709846807235273, |
| "learning_rate": 2.166827313760662e-05, |
| "loss": 0.19, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1877063363790512, |
| "step": 2310, |
| "valid_targets_mean": 2509.9, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 3.692185007974482, |
| "grad_norm": 0.546669144933103, |
| "learning_rate": 2.1589003339434292e-05, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21933197975158691, |
| "step": 2315, |
| "valid_targets_mean": 3100.3, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 3.7001594896331738, |
| "grad_norm": 0.5776670004886075, |
| "learning_rate": 2.150970841257476e-05, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21792183816432953, |
| "step": 2320, |
| "valid_targets_mean": 3190.8, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 3.708133971291866, |
| "grad_norm": 0.5740982492996695, |
| "learning_rate": 2.1430389611007393e-05, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16459020972251892, |
| "step": 2325, |
| "valid_targets_mean": 2925.2, |
| "valid_targets_min": 1140 |
| }, |
| { |
| "epoch": 3.716108452950558, |
| "grad_norm": 0.5443262921569451, |
| "learning_rate": 2.135104818908913e-05, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16006751358509064, |
| "step": 2330, |
| "valid_targets_mean": 2719.9, |
| "valid_targets_min": 894 |
| }, |
| { |
| "epoch": 3.7240829346092506, |
| "grad_norm": 0.5979662168113598, |
| "learning_rate": 2.1271685401534617e-05, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18777906894683838, |
| "step": 2335, |
| "valid_targets_mean": 2444.4, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 3.7320574162679425, |
| "grad_norm": 0.5280536723772452, |
| "learning_rate": 2.11923025033964e-05, |
| "loss": 0.1554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12486009299755096, |
| "step": 2340, |
| "valid_targets_mean": 2508.4, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 3.740031897926635, |
| "grad_norm": 0.5014224094405413, |
| "learning_rate": 2.111290075004503e-05, |
| "loss": 0.1758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2104087471961975, |
| "step": 2345, |
| "valid_targets_mean": 4018.2, |
| "valid_targets_min": 1134 |
| }, |
| { |
| "epoch": 3.748006379585327, |
| "grad_norm": 0.5329277393739597, |
| "learning_rate": 2.103348139714925e-05, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15234363079071045, |
| "step": 2350, |
| "valid_targets_mean": 2975.2, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 3.7559808612440193, |
| "grad_norm": 0.602906573401119, |
| "learning_rate": 2.0954045700656126e-05, |
| "loss": 0.1873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23616360127925873, |
| "step": 2355, |
| "valid_targets_mean": 2888.1, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 3.7639553429027113, |
| "grad_norm": 0.593349469128777, |
| "learning_rate": 2.0874594916771174e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17083615064620972, |
| "step": 2360, |
| "valid_targets_mean": 2501.6, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 3.7719298245614032, |
| "grad_norm": 0.6659895307842664, |
| "learning_rate": 2.079513030193852e-05, |
| "loss": 0.1944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18279269337654114, |
| "step": 2365, |
| "valid_targets_mean": 3181.6, |
| "valid_targets_min": 1554 |
| }, |
| { |
| "epoch": 3.7799043062200957, |
| "grad_norm": 0.5481485498020948, |
| "learning_rate": 2.071565311282099e-05, |
| "loss": 0.193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15074336528778076, |
| "step": 2370, |
| "valid_targets_mean": 2559.0, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 3.787878787878788, |
| "grad_norm": 0.5064359267566692, |
| "learning_rate": 2.063616460628029e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13388487696647644, |
| "step": 2375, |
| "valid_targets_mean": 2798.5, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 3.79585326953748, |
| "grad_norm": 0.6015447662377474, |
| "learning_rate": 2.0556666039357084e-05, |
| "loss": 0.1584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1580061912536621, |
| "step": 2380, |
| "valid_targets_mean": 2257.2, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 3.803827751196172, |
| "grad_norm": 0.6425996831220174, |
| "learning_rate": 2.047715866925113e-05, |
| "loss": 0.1682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17762739956378937, |
| "step": 2385, |
| "valid_targets_mean": 2541.7, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 3.8118022328548644, |
| "grad_norm": 0.6128275854039842, |
| "learning_rate": 2.0397643753301403e-05, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1614629626274109, |
| "step": 2390, |
| "valid_targets_mean": 2946.4, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 3.819776714513557, |
| "grad_norm": 0.5505144745464942, |
| "learning_rate": 2.0318122548966225e-05, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21430611610412598, |
| "step": 2395, |
| "valid_targets_mean": 3036.6, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 3.827751196172249, |
| "grad_norm": 0.4407896880987488, |
| "learning_rate": 2.0238596313803337e-05, |
| "loss": 0.18, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17456912994384766, |
| "step": 2400, |
| "valid_targets_mean": 4507.5, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 3.8357256778309408, |
| "grad_norm": 0.533906121005407, |
| "learning_rate": 2.015906630545005e-05, |
| "loss": 0.1949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19968262314796448, |
| "step": 2405, |
| "valid_targets_mean": 3266.3, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 3.843700159489633, |
| "grad_norm": 0.6010100638921084, |
| "learning_rate": 2.0079533781603352e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15822017192840576, |
| "step": 2410, |
| "valid_targets_mean": 2278.6, |
| "valid_targets_min": 1337 |
| }, |
| { |
| "epoch": 3.8516746411483256, |
| "grad_norm": 0.6656969404639518, |
| "learning_rate": 2e-05, |
| "loss": 0.1752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15312731266021729, |
| "step": 2415, |
| "valid_targets_mean": 1937.1, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 3.8596491228070176, |
| "grad_norm": 0.5908822557428244, |
| "learning_rate": 1.9920466218396655e-05, |
| "loss": 0.1915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1849689483642578, |
| "step": 2420, |
| "valid_targets_mean": 2551.8, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 3.8676236044657095, |
| "grad_norm": 0.5868172639371974, |
| "learning_rate": 1.9840933694549956e-05, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16618412733078003, |
| "step": 2425, |
| "valid_targets_mean": 2423.7, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 3.875598086124402, |
| "grad_norm": 0.5929987209389399, |
| "learning_rate": 1.976140368619667e-05, |
| "loss": 0.2043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2104598581790924, |
| "step": 2430, |
| "valid_targets_mean": 2879.4, |
| "valid_targets_min": 1403 |
| }, |
| { |
| "epoch": 3.8835725677830943, |
| "grad_norm": 0.5696736725853189, |
| "learning_rate": 1.9681877451033778e-05, |
| "loss": 0.2107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1889794021844864, |
| "step": 2435, |
| "valid_targets_mean": 2941.5, |
| "valid_targets_min": 1374 |
| }, |
| { |
| "epoch": 3.8915470494417863, |
| "grad_norm": 0.8300816587532014, |
| "learning_rate": 1.9602356246698597e-05, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22295412421226501, |
| "step": 2440, |
| "valid_targets_mean": 2925.1, |
| "valid_targets_min": 1288 |
| }, |
| { |
| "epoch": 3.8995215311004783, |
| "grad_norm": 0.5343275886193569, |
| "learning_rate": 1.9522841330748877e-05, |
| "loss": 0.1828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1584158092737198, |
| "step": 2445, |
| "valid_targets_mean": 2872.1, |
| "valid_targets_min": 1526 |
| }, |
| { |
| "epoch": 3.9074960127591707, |
| "grad_norm": 0.5571151028017529, |
| "learning_rate": 1.944333396064292e-05, |
| "loss": 0.1929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2206161618232727, |
| "step": 2450, |
| "valid_targets_mean": 3363.2, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 3.915470494417863, |
| "grad_norm": 0.557234488585679, |
| "learning_rate": 1.936383539371971e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22577141225337982, |
| "step": 2455, |
| "valid_targets_mean": 3063.4, |
| "valid_targets_min": 1112 |
| }, |
| { |
| "epoch": 3.923444976076555, |
| "grad_norm": 0.6518598913086615, |
| "learning_rate": 1.9284346887179016e-05, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18474088609218597, |
| "step": 2460, |
| "valid_targets_mean": 2250.4, |
| "valid_targets_min": 1063 |
| }, |
| { |
| "epoch": 3.931419457735247, |
| "grad_norm": 0.591784233490105, |
| "learning_rate": 1.9204869698061493e-05, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18672320246696472, |
| "step": 2465, |
| "valid_targets_mean": 2717.3, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 3.9393939393939394, |
| "grad_norm": 0.6029208831187829, |
| "learning_rate": 1.9125405083228833e-05, |
| "loss": 0.2183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21028904616832733, |
| "step": 2470, |
| "valid_targets_mean": 2852.6, |
| "valid_targets_min": 1309 |
| }, |
| { |
| "epoch": 3.9473684210526314, |
| "grad_norm": 0.5681207981391441, |
| "learning_rate": 1.9045954299343884e-05, |
| "loss": 0.1561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1799524873495102, |
| "step": 2475, |
| "valid_targets_mean": 3248.3, |
| "valid_targets_min": 1519 |
| }, |
| { |
| "epoch": 3.955342902711324, |
| "grad_norm": 0.5531686772161876, |
| "learning_rate": 1.896651860285076e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17599454522132874, |
| "step": 2480, |
| "valid_targets_mean": 2960.8, |
| "valid_targets_min": 996 |
| }, |
| { |
| "epoch": 3.963317384370016, |
| "grad_norm": 0.567746336035401, |
| "learning_rate": 1.8887099249954976e-05, |
| "loss": 0.2041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19742515683174133, |
| "step": 2485, |
| "valid_targets_mean": 2644.5, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 3.971291866028708, |
| "grad_norm": 0.5926141200227866, |
| "learning_rate": 1.8807697496603604e-05, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16229791939258575, |
| "step": 2490, |
| "valid_targets_mean": 2446.4, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 3.9792663476874, |
| "grad_norm": 0.5559012262231059, |
| "learning_rate": 1.8728314598465386e-05, |
| "loss": 0.1884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1845509111881256, |
| "step": 2495, |
| "valid_targets_mean": 3171.1, |
| "valid_targets_min": 1375 |
| }, |
| { |
| "epoch": 3.9872408293460926, |
| "grad_norm": 0.6154642770548927, |
| "learning_rate": 1.8648951810910878e-05, |
| "loss": 0.1851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15992483496665955, |
| "step": 2500, |
| "valid_targets_mean": 2345.1, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 3.9952153110047846, |
| "grad_norm": 0.5570345470466502, |
| "learning_rate": 1.856961038899261e-05, |
| "loss": 0.1961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21707212924957275, |
| "step": 2505, |
| "valid_targets_mean": 3223.9, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 4.003189792663477, |
| "grad_norm": 0.4820862025485545, |
| "learning_rate": 1.849029158742525e-05, |
| "loss": 0.1583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13848713040351868, |
| "step": 2510, |
| "valid_targets_mean": 3489.1, |
| "valid_targets_min": 1517 |
| }, |
| { |
| "epoch": 4.011164274322169, |
| "grad_norm": 0.5449115879256036, |
| "learning_rate": 1.8410996660565714e-05, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17959289252758026, |
| "step": 2515, |
| "valid_targets_mean": 3114.4, |
| "valid_targets_min": 1154 |
| }, |
| { |
| "epoch": 4.019138755980861, |
| "grad_norm": 0.5821484435562528, |
| "learning_rate": 1.8331726862393385e-05, |
| "loss": 0.1503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15955208241939545, |
| "step": 2520, |
| "valid_targets_mean": 3422.6, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 4.027113237639553, |
| "grad_norm": 0.5333494672871051, |
| "learning_rate": 1.8252483446490245e-05, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16043981909751892, |
| "step": 2525, |
| "valid_targets_mean": 3289.8, |
| "valid_targets_min": 1258 |
| }, |
| { |
| "epoch": 4.035087719298246, |
| "grad_norm": 0.681384185389914, |
| "learning_rate": 1.8173267666021075e-05, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15066920220851898, |
| "step": 2530, |
| "valid_targets_mean": 1848.1, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 4.043062200956938, |
| "grad_norm": 0.5926951676146437, |
| "learning_rate": 1.8094080773713615e-05, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1673404574394226, |
| "step": 2535, |
| "valid_targets_mean": 2794.1, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 4.05103668261563, |
| "grad_norm": 0.6585195947195234, |
| "learning_rate": 1.8014924021838774e-05, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15531276166439056, |
| "step": 2540, |
| "valid_targets_mean": 2173.6, |
| "valid_targets_min": 1112 |
| }, |
| { |
| "epoch": 4.059011164274322, |
| "grad_norm": 0.6431155766625963, |
| "learning_rate": 1.7935798662190798e-05, |
| "loss": 0.177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20385132730007172, |
| "step": 2545, |
| "valid_targets_mean": 3026.9, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 4.0669856459330145, |
| "grad_norm": 0.6055270197304871, |
| "learning_rate": 1.785670594606752e-05, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16407035291194916, |
| "step": 2550, |
| "valid_targets_mean": 2962.2, |
| "valid_targets_min": 1299 |
| }, |
| { |
| "epoch": 4.074960127591707, |
| "grad_norm": 0.527292972057754, |
| "learning_rate": 1.777764712425052e-05, |
| "loss": 0.1645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1590946912765503, |
| "step": 2555, |
| "valid_targets_mean": 3571.1, |
| "valid_targets_min": 424 |
| }, |
| { |
| "epoch": 4.082934609250398, |
| "grad_norm": 0.5778748659086131, |
| "learning_rate": 1.7698623446985378e-05, |
| "loss": 0.1482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1918186992406845, |
| "step": 2560, |
| "valid_targets_mean": 3398.8, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 4.090909090909091, |
| "grad_norm": 0.5230022966524009, |
| "learning_rate": 1.7619636163961907e-05, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16492609679698944, |
| "step": 2565, |
| "valid_targets_mean": 3574.9, |
| "valid_targets_min": 1142 |
| }, |
| { |
| "epoch": 4.098883572567783, |
| "grad_norm": 0.600059132410499, |
| "learning_rate": 1.754068652429436e-05, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22227483987808228, |
| "step": 2570, |
| "valid_targets_mean": 3160.7, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 4.106858054226476, |
| "grad_norm": 0.5506153806974453, |
| "learning_rate": 1.74617757765017e-05, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15465757250785828, |
| "step": 2575, |
| "valid_targets_mean": 3507.8, |
| "valid_targets_min": 1169 |
| }, |
| { |
| "epoch": 4.114832535885167, |
| "grad_norm": 0.5872195929772528, |
| "learning_rate": 1.738290516848784e-05, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1792100965976715, |
| "step": 2580, |
| "valid_targets_mean": 3182.6, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 4.12280701754386, |
| "grad_norm": 0.5568326980647963, |
| "learning_rate": 1.730407594752194e-05, |
| "loss": 0.1571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13268157839775085, |
| "step": 2585, |
| "valid_targets_mean": 2716.8, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 4.130781499202552, |
| "grad_norm": 0.5337621603486079, |
| "learning_rate": 1.722528936021864e-05, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13221563398838043, |
| "step": 2590, |
| "valid_targets_mean": 2776.6, |
| "valid_targets_min": 1069 |
| }, |
| { |
| "epoch": 4.138755980861244, |
| "grad_norm": 0.594154146656907, |
| "learning_rate": 1.714654665251837e-05, |
| "loss": 0.1696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2037222981452942, |
| "step": 2595, |
| "valid_targets_mean": 3069.6, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 4.146730462519936, |
| "grad_norm": 0.5991382655130797, |
| "learning_rate": 1.7067849069667644e-05, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1336292177438736, |
| "step": 2600, |
| "valid_targets_mean": 2691.4, |
| "valid_targets_min": 1362 |
| }, |
| { |
| "epoch": 4.154704944178628, |
| "grad_norm": 0.6333054733885867, |
| "learning_rate": 1.6989197856199377e-05, |
| "loss": 0.1518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12979856133460999, |
| "step": 2605, |
| "valid_targets_mean": 2420.9, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 4.162679425837321, |
| "grad_norm": 0.5693331370434527, |
| "learning_rate": 1.6910594255913177e-05, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1348324865102768, |
| "step": 2610, |
| "valid_targets_mean": 2557.1, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 4.170653907496013, |
| "grad_norm": 0.6158456534730181, |
| "learning_rate": 1.6832039511855702e-05, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17839965224266052, |
| "step": 2615, |
| "valid_targets_mean": 2557.9, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 4.178628389154705, |
| "grad_norm": 0.6569117165395834, |
| "learning_rate": 1.6753534866300983e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12349331378936768, |
| "step": 2620, |
| "valid_targets_mean": 2012.1, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 4.186602870813397, |
| "grad_norm": 0.5649615489956892, |
| "learning_rate": 1.6675081560730804e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15348169207572937, |
| "step": 2625, |
| "valid_targets_mean": 3120.9, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 4.1945773524720895, |
| "grad_norm": 0.6662040972505084, |
| "learning_rate": 1.6596680835815024e-05, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1765637993812561, |
| "step": 2630, |
| "valid_targets_mean": 2654.2, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 4.202551834130782, |
| "grad_norm": 0.6225824529089881, |
| "learning_rate": 1.651833393139201e-05, |
| "loss": 0.161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14078602194786072, |
| "step": 2635, |
| "valid_targets_mean": 3025.2, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 4.2105263157894735, |
| "grad_norm": 0.6675069947682166, |
| "learning_rate": 1.6440042086449e-05, |
| "loss": 0.1606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14914357662200928, |
| "step": 2640, |
| "valid_targets_mean": 2228.6, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 4.218500797448166, |
| "grad_norm": 0.5649692767485978, |
| "learning_rate": 1.6361806539102508e-05, |
| "loss": 0.1762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22645841538906097, |
| "step": 2645, |
| "valid_targets_mean": 3634.6, |
| "valid_targets_min": 1352 |
| }, |
| { |
| "epoch": 4.226475279106858, |
| "grad_norm": 0.5594120744991358, |
| "learning_rate": 1.628362852657876e-05, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.133091002702713, |
| "step": 2650, |
| "valid_targets_mean": 2490.9, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 4.23444976076555, |
| "grad_norm": 0.6130688435516675, |
| "learning_rate": 1.620550928519411e-05, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17605170607566833, |
| "step": 2655, |
| "valid_targets_mean": 3088.2, |
| "valid_targets_min": 1289 |
| }, |
| { |
| "epoch": 4.242424242424242, |
| "grad_norm": 0.5599311671798608, |
| "learning_rate": 1.612745005033551e-05, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20437359809875488, |
| "step": 2660, |
| "valid_targets_mean": 3273.9, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 4.250398724082935, |
| "grad_norm": 0.524405728232288, |
| "learning_rate": 1.6049452056440948e-05, |
| "loss": 0.1468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1535736620426178, |
| "step": 2665, |
| "valid_targets_mean": 3528.8, |
| "valid_targets_min": 1250 |
| }, |
| { |
| "epoch": 4.258373205741627, |
| "grad_norm": 0.9543428316028962, |
| "learning_rate": 1.597151653697995e-05, |
| "loss": 0.1987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12014397233724594, |
| "step": 2670, |
| "valid_targets_mean": 1957.2, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 4.266347687400319, |
| "grad_norm": 0.6675333452530134, |
| "learning_rate": 1.5893644724434066e-05, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17045184969902039, |
| "step": 2675, |
| "valid_targets_mean": 2527.7, |
| "valid_targets_min": 1129 |
| }, |
| { |
| "epoch": 4.274322169059011, |
| "grad_norm": 0.5530104226801451, |
| "learning_rate": 1.581583785027736e-05, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15394771099090576, |
| "step": 2680, |
| "valid_targets_mean": 3375.9, |
| "valid_targets_min": 1485 |
| }, |
| { |
| "epoch": 4.282296650717703, |
| "grad_norm": 0.6198052315537499, |
| "learning_rate": 1.5738097144956976e-05, |
| "loss": 0.174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18288853764533997, |
| "step": 2685, |
| "valid_targets_mean": 2741.9, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 4.290271132376396, |
| "grad_norm": 0.5705456528708921, |
| "learning_rate": 1.566042383787364e-05, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17937612533569336, |
| "step": 2690, |
| "valid_targets_mean": 3222.2, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 4.298245614035087, |
| "grad_norm": 0.6678666574110236, |
| "learning_rate": 1.558281915736224e-05, |
| "loss": 0.1595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17287465929985046, |
| "step": 2695, |
| "valid_targets_mean": 2454.9, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 4.30622009569378, |
| "grad_norm": 0.58460956144151, |
| "learning_rate": 1.550528433067239e-05, |
| "loss": 0.1507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15777446329593658, |
| "step": 2700, |
| "valid_targets_mean": 2841.6, |
| "valid_targets_min": 1330 |
| }, |
| { |
| "epoch": 4.314194577352472, |
| "grad_norm": 0.6720009602673392, |
| "learning_rate": 1.5427820583949054e-05, |
| "loss": 0.1498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17180287837982178, |
| "step": 2705, |
| "valid_targets_mean": 2462.7, |
| "valid_targets_min": 1155 |
| }, |
| { |
| "epoch": 4.3221690590111645, |
| "grad_norm": 0.6831596441857424, |
| "learning_rate": 1.5350429142213075e-05, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1586819291114807, |
| "step": 2710, |
| "valid_targets_mean": 1872.5, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 4.330143540669856, |
| "grad_norm": 0.5344175912658572, |
| "learning_rate": 1.5273111229341907e-05, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18215686082839966, |
| "step": 2715, |
| "valid_targets_mean": 3179.9, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 4.3381180223285485, |
| "grad_norm": 0.6216985426268544, |
| "learning_rate": 1.5195868068050185e-05, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1297648698091507, |
| "step": 2720, |
| "valid_targets_mean": 2275.3, |
| "valid_targets_min": 1262 |
| }, |
| { |
| "epoch": 4.346092503987241, |
| "grad_norm": 0.6239029857349583, |
| "learning_rate": 1.5118700879870426e-05, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13424813747406006, |
| "step": 2725, |
| "valid_targets_mean": 2379.4, |
| "valid_targets_min": 1273 |
| }, |
| { |
| "epoch": 4.354066985645933, |
| "grad_norm": 0.5723646011985536, |
| "learning_rate": 1.5041610885133681e-05, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16782692074775696, |
| "step": 2730, |
| "valid_targets_mean": 3187.6, |
| "valid_targets_min": 1287 |
| }, |
| { |
| "epoch": 4.362041467304625, |
| "grad_norm": 0.5813610738573333, |
| "learning_rate": 1.496459930295028e-05, |
| "loss": 0.1532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15391327440738678, |
| "step": 2735, |
| "valid_targets_mean": 2778.6, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 4.370015948963317, |
| "grad_norm": 0.658300475272945, |
| "learning_rate": 1.4887667351190508e-05, |
| "loss": 0.165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15785977244377136, |
| "step": 2740, |
| "valid_targets_mean": 2196.1, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 4.37799043062201, |
| "grad_norm": 0.6029868584965588, |
| "learning_rate": 1.4810816246465374e-05, |
| "loss": 0.1416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15540479123592377, |
| "step": 2745, |
| "valid_targets_mean": 2765.9, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 4.385964912280702, |
| "grad_norm": 0.5597027272525674, |
| "learning_rate": 1.4734047204107358e-05, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13575266301631927, |
| "step": 2750, |
| "valid_targets_mean": 2654.2, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 4.393939393939394, |
| "grad_norm": 0.5407528721459675, |
| "learning_rate": 1.4657361438151192e-05, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16623978316783905, |
| "step": 2755, |
| "valid_targets_mean": 3222.1, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 4.401913875598086, |
| "grad_norm": 0.6874305661080543, |
| "learning_rate": 1.458076016131468e-05, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1757175326347351, |
| "step": 2760, |
| "valid_targets_mean": 2338.8, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 4.409888357256778, |
| "grad_norm": 0.5591760680100331, |
| "learning_rate": 1.4504244584979494e-05, |
| "loss": 0.1568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17732250690460205, |
| "step": 2765, |
| "valid_targets_mean": 3493.1, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 4.417862838915471, |
| "grad_norm": 0.6006214490581323, |
| "learning_rate": 1.442781591917203e-05, |
| "loss": 0.1556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10994596034288406, |
| "step": 2770, |
| "valid_targets_mean": 1990.3, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 4.425837320574162, |
| "grad_norm": 0.6136597184600974, |
| "learning_rate": 1.4351475372544262e-05, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1602148413658142, |
| "step": 2775, |
| "valid_targets_mean": 2516.6, |
| "valid_targets_min": 1300 |
| }, |
| { |
| "epoch": 4.433811802232855, |
| "grad_norm": 0.6063956457279249, |
| "learning_rate": 1.4275224152354658e-05, |
| "loss": 0.1623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20220395922660828, |
| "step": 2780, |
| "valid_targets_mean": 3064.8, |
| "valid_targets_min": 1065 |
| }, |
| { |
| "epoch": 4.441786283891547, |
| "grad_norm": 0.6960689470943858, |
| "learning_rate": 1.4199063464449047e-05, |
| "loss": 0.1725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23058322072029114, |
| "step": 2785, |
| "valid_targets_mean": 2944.1, |
| "valid_targets_min": 1199 |
| }, |
| { |
| "epoch": 4.44976076555024, |
| "grad_norm": 0.581843784735055, |
| "learning_rate": 1.4122994513241587e-05, |
| "loss": 0.1682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16655464470386505, |
| "step": 2790, |
| "valid_targets_mean": 2789.2, |
| "valid_targets_min": 1179 |
| }, |
| { |
| "epoch": 4.457735247208931, |
| "grad_norm": 0.5850624942481338, |
| "learning_rate": 1.4047018501695677e-05, |
| "loss": 0.1647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18775057792663574, |
| "step": 2795, |
| "valid_targets_mean": 3112.1, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 4.4657097288676235, |
| "grad_norm": 0.7725419945300261, |
| "learning_rate": 1.3971136631304978e-05, |
| "loss": 0.1638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13948987424373627, |
| "step": 2800, |
| "valid_targets_mean": 3131.8, |
| "valid_targets_min": 1342 |
| }, |
| { |
| "epoch": 4.473684210526316, |
| "grad_norm": 0.6442207373438252, |
| "learning_rate": 1.3895350102074386e-05, |
| "loss": 0.1533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13303601741790771, |
| "step": 2805, |
| "valid_targets_mean": 2095.6, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 4.481658692185008, |
| "grad_norm": 0.6268169440228296, |
| "learning_rate": 1.3819660112501054e-05, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19091369211673737, |
| "step": 2810, |
| "valid_targets_mean": 2760.9, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 4.4896331738437, |
| "grad_norm": 0.7797827360900279, |
| "learning_rate": 1.3744067859555461e-05, |
| "loss": 0.1596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14364150166511536, |
| "step": 2815, |
| "valid_targets_mean": 2647.5, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 4.497607655502392, |
| "grad_norm": 0.5958486269846882, |
| "learning_rate": 1.3668574538662451e-05, |
| "loss": 0.1908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3153199553489685, |
| "step": 2820, |
| "valid_targets_mean": 4524.3, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 4.505582137161085, |
| "grad_norm": 0.6464530618817084, |
| "learning_rate": 1.3593181343682353e-05, |
| "loss": 0.1509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12288454174995422, |
| "step": 2825, |
| "valid_targets_mean": 1907.5, |
| "valid_targets_min": 862 |
| }, |
| { |
| "epoch": 4.513556618819777, |
| "grad_norm": 0.5766089488256633, |
| "learning_rate": 1.3517889466892085e-05, |
| "loss": 0.1511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18093323707580566, |
| "step": 2830, |
| "valid_targets_mean": 3210.1, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 4.521531100478469, |
| "grad_norm": 0.6277488852884846, |
| "learning_rate": 1.3442700098966326e-05, |
| "loss": 0.1548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14466340839862823, |
| "step": 2835, |
| "valid_targets_mean": 2295.5, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 4.529505582137161, |
| "grad_norm": 0.5780933276759791, |
| "learning_rate": 1.3367614428958646e-05, |
| "loss": 0.1721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13822069764137268, |
| "step": 2840, |
| "valid_targets_mean": 2436.6, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 4.5374800637958534, |
| "grad_norm": 0.5182007147664368, |
| "learning_rate": 1.3292633644282735e-05, |
| "loss": 0.185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1259920299053192, |
| "step": 2845, |
| "valid_targets_mean": 3187.9, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 4.545454545454545, |
| "grad_norm": 0.5371658448891603, |
| "learning_rate": 1.3217758930693608e-05, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12785111367702484, |
| "step": 2850, |
| "valid_targets_mean": 2966.3, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 4.553429027113237, |
| "grad_norm": 0.6492823713058845, |
| "learning_rate": 1.314299147226887e-05, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17848286032676697, |
| "step": 2855, |
| "valid_targets_mean": 3112.8, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 4.56140350877193, |
| "grad_norm": 0.5833526819664339, |
| "learning_rate": 1.3068332451389969e-05, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14901649951934814, |
| "step": 2860, |
| "valid_targets_mean": 2962.1, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 4.569377990430622, |
| "grad_norm": 0.6044763831376962, |
| "learning_rate": 1.2993783048723515e-05, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18289071321487427, |
| "step": 2865, |
| "valid_targets_mean": 2793.9, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 4.577352472089315, |
| "grad_norm": 0.5907034874662462, |
| "learning_rate": 1.2919344443202602e-05, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1798447072505951, |
| "step": 2870, |
| "valid_targets_mean": 3851.8, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 4.585326953748006, |
| "grad_norm": 0.5614296037672958, |
| "learning_rate": 1.2845017812008158e-05, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1698157787322998, |
| "step": 2875, |
| "valid_targets_mean": 3441.5, |
| "valid_targets_min": 1223 |
| }, |
| { |
| "epoch": 4.5933014354066986, |
| "grad_norm": 0.5713076100304711, |
| "learning_rate": 1.277080433055034e-05, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14279823005199432, |
| "step": 2880, |
| "valid_targets_mean": 2656.8, |
| "valid_targets_min": 1218 |
| }, |
| { |
| "epoch": 4.601275917065391, |
| "grad_norm": 0.6010777119114208, |
| "learning_rate": 1.2696705172449944e-05, |
| "loss": 0.1716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16096925735473633, |
| "step": 2885, |
| "valid_targets_mean": 2882.9, |
| "valid_targets_min": 1236 |
| }, |
| { |
| "epoch": 4.6092503987240825, |
| "grad_norm": 0.6510728768592932, |
| "learning_rate": 1.2622721509519846e-05, |
| "loss": 0.2013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18414732813835144, |
| "step": 2890, |
| "valid_targets_mean": 2611.4, |
| "valid_targets_min": 1102 |
| }, |
| { |
| "epoch": 4.617224880382775, |
| "grad_norm": 0.5891857819758494, |
| "learning_rate": 1.2548854511746461e-05, |
| "loss": 0.2005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1432403326034546, |
| "step": 2895, |
| "valid_targets_mean": 2906.4, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 4.625199362041467, |
| "grad_norm": 0.5997581297495093, |
| "learning_rate": 1.247510534727125e-05, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17660380899906158, |
| "step": 2900, |
| "valid_targets_mean": 4153.6, |
| "valid_targets_min": 1566 |
| }, |
| { |
| "epoch": 4.63317384370016, |
| "grad_norm": 0.5704940600430232, |
| "learning_rate": 1.240147518237224e-05, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17439067363739014, |
| "step": 2905, |
| "valid_targets_mean": 2826.9, |
| "valid_targets_min": 1557 |
| }, |
| { |
| "epoch": 4.641148325358852, |
| "grad_norm": 0.6041235814136545, |
| "learning_rate": 1.2327965181445593e-05, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1622115969657898, |
| "step": 2910, |
| "valid_targets_mean": 2654.2, |
| "valid_targets_min": 1260 |
| }, |
| { |
| "epoch": 4.649122807017544, |
| "grad_norm": 0.5904064735068515, |
| "learning_rate": 1.2254576506987182e-05, |
| "loss": 0.1571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14826351404190063, |
| "step": 2915, |
| "valid_targets_mean": 2521.2, |
| "valid_targets_min": 1203 |
| }, |
| { |
| "epoch": 4.657097288676236, |
| "grad_norm": 0.6708883356957397, |
| "learning_rate": 1.21813103195742e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15236374735832214, |
| "step": 2920, |
| "valid_targets_mean": 2082.2, |
| "valid_targets_min": 1310 |
| }, |
| { |
| "epoch": 4.6650717703349285, |
| "grad_norm": 0.5410250981706312, |
| "learning_rate": 1.2108167777846815e-05, |
| "loss": 0.1647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1691250205039978, |
| "step": 2925, |
| "valid_targets_mean": 3658.4, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 4.67304625199362, |
| "grad_norm": 0.5600363452922104, |
| "learning_rate": 1.203515003848987e-05, |
| "loss": 0.1532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17247727513313293, |
| "step": 2930, |
| "valid_targets_mean": 3237.1, |
| "valid_targets_min": 1034 |
| }, |
| { |
| "epoch": 4.681020733652312, |
| "grad_norm": 0.6269773523410778, |
| "learning_rate": 1.1962258256214545e-05, |
| "loss": 0.1553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16801588237285614, |
| "step": 2935, |
| "valid_targets_mean": 2773.1, |
| "valid_targets_min": 1145 |
| }, |
| { |
| "epoch": 4.688995215311005, |
| "grad_norm": 0.6416942531641958, |
| "learning_rate": 1.1889493583740124e-05, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15715159475803375, |
| "step": 2940, |
| "valid_targets_mean": 2487.7, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 4.696969696969697, |
| "grad_norm": 0.6032413565847697, |
| "learning_rate": 1.1816857171775767e-05, |
| "loss": 0.1401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15060892701148987, |
| "step": 2945, |
| "valid_targets_mean": 2569.9, |
| "valid_targets_min": 1571 |
| }, |
| { |
| "epoch": 4.70494417862839, |
| "grad_norm": 0.6229235355749451, |
| "learning_rate": 1.1744350169002308e-05, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16957922279834747, |
| "step": 2950, |
| "valid_targets_mean": 2637.2, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 4.712918660287081, |
| "grad_norm": 0.5305233008927874, |
| "learning_rate": 1.1671973722054077e-05, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20151448249816895, |
| "step": 2955, |
| "valid_targets_mean": 3813.4, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 4.720893141945774, |
| "grad_norm": 0.5928610616782457, |
| "learning_rate": 1.159972897550079e-05, |
| "loss": 0.1765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17702104151248932, |
| "step": 2960, |
| "valid_targets_mean": 3135.0, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 4.728867623604466, |
| "grad_norm": 0.6549965052438604, |
| "learning_rate": 1.1527617071829447e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21487164497375488, |
| "step": 2965, |
| "valid_targets_mean": 2599.4, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 4.7368421052631575, |
| "grad_norm": 0.5878382112347069, |
| "learning_rate": 1.145563915142622e-05, |
| "loss": 0.1647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16524244844913483, |
| "step": 2970, |
| "valid_targets_mean": 3205.4, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 4.74481658692185, |
| "grad_norm": 0.5829785508403137, |
| "learning_rate": 1.1383796352558489e-05, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13480517268180847, |
| "step": 2975, |
| "valid_targets_mean": 2421.6, |
| "valid_targets_min": 1389 |
| }, |
| { |
| "epoch": 4.752791068580542, |
| "grad_norm": 0.9528420577486767, |
| "learning_rate": 1.1312089811356803e-05, |
| "loss": 0.1511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.142283096909523, |
| "step": 2980, |
| "valid_targets_mean": 2265.3, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 4.760765550239235, |
| "grad_norm": 0.6379187971048914, |
| "learning_rate": 1.1240520661796882e-05, |
| "loss": 0.1434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12618593871593475, |
| "step": 2985, |
| "valid_targets_mean": 2114.1, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 4.768740031897926, |
| "grad_norm": 0.581096748192637, |
| "learning_rate": 1.1169090035681772e-05, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17308899760246277, |
| "step": 2990, |
| "valid_targets_mean": 3163.0, |
| "valid_targets_min": 1331 |
| }, |
| { |
| "epoch": 4.776714513556619, |
| "grad_norm": 0.6490837955490153, |
| "learning_rate": 1.109779906262383e-05, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2551341652870178, |
| "step": 2995, |
| "valid_targets_mean": 3147.7, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 4.784688995215311, |
| "grad_norm": 0.5933551257310504, |
| "learning_rate": 1.102664887002698e-05, |
| "loss": 0.1725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15214470028877258, |
| "step": 3000, |
| "valid_targets_mean": 3350.6, |
| "valid_targets_min": 1496 |
| }, |
| { |
| "epoch": 4.7926634768740035, |
| "grad_norm": 0.5823345389450942, |
| "learning_rate": 1.0955640583068802e-05, |
| "loss": 0.1512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16861368715763092, |
| "step": 3005, |
| "valid_targets_mean": 2921.8, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 4.800637958532695, |
| "grad_norm": 0.5903270104669966, |
| "learning_rate": 1.0884775324682755e-05, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14034119248390198, |
| "step": 3010, |
| "valid_targets_mean": 2480.7, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 4.8086124401913874, |
| "grad_norm": 0.5924958725908289, |
| "learning_rate": 1.081405421554044e-05, |
| "loss": 0.1676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13198724389076233, |
| "step": 3015, |
| "valid_targets_mean": 2427.5, |
| "valid_targets_min": 1250 |
| }, |
| { |
| "epoch": 4.81658692185008, |
| "grad_norm": 0.5951560445307537, |
| "learning_rate": 1.074347837403387e-05, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1821703463792801, |
| "step": 3020, |
| "valid_targets_mean": 3043.9, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 4.824561403508772, |
| "grad_norm": 0.5894961447208159, |
| "learning_rate": 1.067304891625776e-05, |
| "loss": 0.1517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1578672230243683, |
| "step": 3025, |
| "valid_targets_mean": 3003.2, |
| "valid_targets_min": 1063 |
| }, |
| { |
| "epoch": 4.832535885167464, |
| "grad_norm": 0.6377603875579224, |
| "learning_rate": 1.0602766955991913e-05, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16185033321380615, |
| "step": 3030, |
| "valid_targets_mean": 2483.1, |
| "valid_targets_min": 1017 |
| }, |
| { |
| "epoch": 4.840510366826156, |
| "grad_norm": 0.48915397672553124, |
| "learning_rate": 1.053263360468358e-05, |
| "loss": 0.1749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1294403374195099, |
| "step": 3035, |
| "valid_targets_mean": 3507.8, |
| "valid_targets_min": 1335 |
| }, |
| { |
| "epoch": 4.848484848484849, |
| "grad_norm": 0.6547180933536588, |
| "learning_rate": 1.0462649971429884e-05, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1606912463903427, |
| "step": 3040, |
| "valid_targets_mean": 2161.8, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 4.856459330143541, |
| "grad_norm": 0.5527293462604799, |
| "learning_rate": 1.0392817162960304e-05, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17694956064224243, |
| "step": 3045, |
| "valid_targets_mean": 3561.0, |
| "valid_targets_min": 1423 |
| }, |
| { |
| "epoch": 4.8644338118022326, |
| "grad_norm": 0.7548532786478716, |
| "learning_rate": 1.0323136283619167e-05, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15897555649280548, |
| "step": 3050, |
| "valid_targets_mean": 2484.4, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 4.872408293460925, |
| "grad_norm": 0.5513293334710877, |
| "learning_rate": 1.0253608435348136e-05, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18371330201625824, |
| "step": 3055, |
| "valid_targets_mean": 3966.9, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 4.880382775119617, |
| "grad_norm": 0.6031939961843086, |
| "learning_rate": 1.0184234717668867e-05, |
| "loss": 0.1702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18013069033622742, |
| "step": 3060, |
| "valid_targets_mean": 2705.5, |
| "valid_targets_min": 1237 |
| }, |
| { |
| "epoch": 4.88835725677831, |
| "grad_norm": 0.6892842856879766, |
| "learning_rate": 1.0115016227665544e-05, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13218329846858978, |
| "step": 3065, |
| "valid_targets_mean": 1881.2, |
| "valid_targets_min": 1069 |
| }, |
| { |
| "epoch": 4.896331738437001, |
| "grad_norm": 0.543825197475642, |
| "learning_rate": 1.0045954059967577e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13563859462738037, |
| "step": 3070, |
| "valid_targets_mean": 3105.5, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 4.904306220095694, |
| "grad_norm": 0.6591944511943134, |
| "learning_rate": 9.977049306732287e-06, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15450099110603333, |
| "step": 3075, |
| "valid_targets_mean": 2669.7, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 4.912280701754386, |
| "grad_norm": 0.5795314772456565, |
| "learning_rate": 9.908303057627591e-06, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16409224271774292, |
| "step": 3080, |
| "valid_targets_mean": 3158.5, |
| "valid_targets_min": 1344 |
| }, |
| { |
| "epoch": 4.920255183413078, |
| "grad_norm": 0.6592054493281521, |
| "learning_rate": 9.83971639981484e-06, |
| "loss": 0.1901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22291454672813416, |
| "step": 3085, |
| "valid_targets_mean": 3663.3, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 4.92822966507177, |
| "grad_norm": 0.5726489277415606, |
| "learning_rate": 9.771290417931559e-06, |
| "loss": 0.1557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16419470310211182, |
| "step": 3090, |
| "valid_targets_mean": 2881.9, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 4.9362041467304625, |
| "grad_norm": 0.6137702893297173, |
| "learning_rate": 9.703026194074342e-06, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16602787375450134, |
| "step": 3095, |
| "valid_targets_mean": 2241.7, |
| "valid_targets_min": 1492 |
| }, |
| { |
| "epoch": 4.944178628389155, |
| "grad_norm": 0.625860695726005, |
| "learning_rate": 9.634924807781729e-06, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13178279995918274, |
| "step": 3100, |
| "valid_targets_mean": 2148.7, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 4.952153110047847, |
| "grad_norm": 0.6614163326110132, |
| "learning_rate": 9.566987336017102e-06, |
| "loss": 0.1518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15211498737335205, |
| "step": 3105, |
| "valid_targets_mean": 2294.9, |
| "valid_targets_min": 1449 |
| }, |
| { |
| "epoch": 4.960127591706539, |
| "grad_norm": 0.6339096958861727, |
| "learning_rate": 9.499214853151699e-06, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13669738173484802, |
| "step": 3110, |
| "valid_targets_mean": 2579.0, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 4.968102073365231, |
| "grad_norm": 0.6201778623086089, |
| "learning_rate": 9.431608430947619e-06, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13577091693878174, |
| "step": 3115, |
| "valid_targets_mean": 2413.5, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 4.976076555023924, |
| "grad_norm": 0.5945194233107883, |
| "learning_rate": 9.364169138540805e-06, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16690418124198914, |
| "step": 3120, |
| "valid_targets_mean": 2853.1, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 4.984051036682615, |
| "grad_norm": 0.583377612270226, |
| "learning_rate": 9.296898042424237e-06, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13808023929595947, |
| "step": 3125, |
| "valid_targets_mean": 2496.2, |
| "valid_targets_min": 986 |
| }, |
| { |
| "epoch": 4.992025518341308, |
| "grad_norm": 0.5532057544654067, |
| "learning_rate": 9.229796206431015e-06, |
| "loss": 0.1628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2222648710012436, |
| "step": 3130, |
| "valid_targets_mean": 4848.7, |
| "valid_targets_min": 1038 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.531789644788238, |
| "learning_rate": 9.162864691717513e-06, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18254606425762177, |
| "step": 3135, |
| "valid_targets_mean": 3269.1, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 5.007974481658692, |
| "grad_norm": 0.5616721527680314, |
| "learning_rate": 9.096104556746654e-06, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1832147091627121, |
| "step": 3140, |
| "valid_targets_mean": 3542.6, |
| "valid_targets_min": 1594 |
| }, |
| { |
| "epoch": 5.015948963317384, |
| "grad_norm": 0.6088692960009601, |
| "learning_rate": 9.029516857271115e-06, |
| "loss": 0.146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1366785764694214, |
| "step": 3145, |
| "valid_targets_mean": 2708.7, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 5.023923444976076, |
| "grad_norm": 0.5285306796042663, |
| "learning_rate": 8.963102646316677e-06, |
| "loss": 0.1594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16185930371284485, |
| "step": 3150, |
| "valid_targets_mean": 3778.3, |
| "valid_targets_min": 1154 |
| }, |
| { |
| "epoch": 5.031897926634769, |
| "grad_norm": 0.6115365337267124, |
| "learning_rate": 8.896862974165553e-06, |
| "loss": 0.1478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14206919074058533, |
| "step": 3155, |
| "valid_targets_mean": 3075.5, |
| "valid_targets_min": 1096 |
| }, |
| { |
| "epoch": 5.039872408293461, |
| "grad_norm": 0.6388639498863427, |
| "learning_rate": 8.830798888339756e-06, |
| "loss": 0.1512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13919368386268616, |
| "step": 3160, |
| "valid_targets_mean": 2328.9, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 5.047846889952153, |
| "grad_norm": 0.5869360038685693, |
| "learning_rate": 8.764911433584581e-06, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17949020862579346, |
| "step": 3165, |
| "valid_targets_mean": 3294.6, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 5.055821371610845, |
| "grad_norm": 0.5747885813337419, |
| "learning_rate": 8.699201651852056e-06, |
| "loss": 0.1382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15749900043010712, |
| "step": 3170, |
| "valid_targets_mean": 3640.9, |
| "valid_targets_min": 1226 |
| }, |
| { |
| "epoch": 5.0637958532695375, |
| "grad_norm": 0.5817079808666326, |
| "learning_rate": 8.633670582284446e-06, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11290596425533295, |
| "step": 3175, |
| "valid_targets_mean": 2822.5, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 5.07177033492823, |
| "grad_norm": 0.6680362984019289, |
| "learning_rate": 8.56831926119787e-06, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11178924143314362, |
| "step": 3180, |
| "valid_targets_mean": 1960.3, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 5.0797448165869215, |
| "grad_norm": 0.584769533808893, |
| "learning_rate": 8.503148722065851e-06, |
| "loss": 0.1894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2956717610359192, |
| "step": 3185, |
| "valid_targets_mean": 4416.9, |
| "valid_targets_min": 1142 |
| }, |
| { |
| "epoch": 5.087719298245614, |
| "grad_norm": 0.572702746875333, |
| "learning_rate": 8.43815999550303e-06, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1503574550151825, |
| "step": 3190, |
| "valid_targets_mean": 3477.9, |
| "valid_targets_min": 1398 |
| }, |
| { |
| "epoch": 5.095693779904306, |
| "grad_norm": 0.6379898231385502, |
| "learning_rate": 8.373354109248842e-06, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15601392090320587, |
| "step": 3195, |
| "valid_targets_mean": 2786.6, |
| "valid_targets_min": 1274 |
| }, |
| { |
| "epoch": 5.103668261562999, |
| "grad_norm": 0.6570400100898655, |
| "learning_rate": 8.308732088151245e-06, |
| "loss": 0.1837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13875964283943176, |
| "step": 3200, |
| "valid_targets_mean": 2495.5, |
| "valid_targets_min": 1253 |
| }, |
| { |
| "epoch": 5.11164274322169, |
| "grad_norm": 0.598589916212468, |
| "learning_rate": 8.24429495415054e-06, |
| "loss": 0.1542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17209793627262115, |
| "step": 3205, |
| "valid_targets_mean": 3544.8, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 5.119617224880383, |
| "grad_norm": 0.5905187204371102, |
| "learning_rate": 8.180043726263216e-06, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15271854400634766, |
| "step": 3210, |
| "valid_targets_mean": 3155.5, |
| "valid_targets_min": 1290 |
| }, |
| { |
| "epoch": 5.127591706539075, |
| "grad_norm": 0.638961162391656, |
| "learning_rate": 8.115979420565794e-06, |
| "loss": 0.1467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15162287652492523, |
| "step": 3215, |
| "valid_targets_mean": 3120.7, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 5.1355661881977674, |
| "grad_norm": 0.6929090202401988, |
| "learning_rate": 8.052103050178806e-06, |
| "loss": 0.1451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15893588960170746, |
| "step": 3220, |
| "valid_targets_mean": 2715.9, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 5.143540669856459, |
| "grad_norm": 0.6531239078174592, |
| "learning_rate": 7.988415625250755e-06, |
| "loss": 0.1755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17716528475284576, |
| "step": 3225, |
| "valid_targets_mean": 3181.6, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 5.151515151515151, |
| "grad_norm": 0.6723920338293383, |
| "learning_rate": 7.924918152942117e-06, |
| "loss": 0.146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16147425770759583, |
| "step": 3230, |
| "valid_targets_mean": 2302.5, |
| "valid_targets_min": 1238 |
| }, |
| { |
| "epoch": 5.159489633173844, |
| "grad_norm": 0.6602533766749181, |
| "learning_rate": 7.861611637409462e-06, |
| "loss": 0.1376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1290948987007141, |
| "step": 3235, |
| "valid_targets_mean": 1941.5, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 5.167464114832536, |
| "grad_norm": 0.6264465102021803, |
| "learning_rate": 7.798497079789513e-06, |
| "loss": 0.1616, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16076138615608215, |
| "step": 3240, |
| "valid_targets_mean": 3415.3, |
| "valid_targets_min": 1347 |
| }, |
| { |
| "epoch": 5.175438596491228, |
| "grad_norm": 0.6240803701984488, |
| "learning_rate": 7.735575478183381e-06, |
| "loss": 0.1501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11426462233066559, |
| "step": 3245, |
| "valid_targets_mean": 2283.6, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 5.18341307814992, |
| "grad_norm": 0.5078898685113183, |
| "learning_rate": 7.672847827640735e-06, |
| "loss": 0.1382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10710498690605164, |
| "step": 3250, |
| "valid_targets_mean": 3287.6, |
| "valid_targets_min": 1326 |
| }, |
| { |
| "epoch": 5.1913875598086126, |
| "grad_norm": 0.6613642718503813, |
| "learning_rate": 7.610315120144067e-06, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2189890742301941, |
| "step": 3255, |
| "valid_targets_mean": 3137.3, |
| "valid_targets_min": 1337 |
| }, |
| { |
| "epoch": 5.199362041467305, |
| "grad_norm": 0.6542926532200951, |
| "learning_rate": 7.5479783445930414e-06, |
| "loss": 0.1436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13109362125396729, |
| "step": 3260, |
| "valid_targets_mean": 2605.9, |
| "valid_targets_min": 1169 |
| }, |
| { |
| "epoch": 5.2073365231259965, |
| "grad_norm": 0.6132656516318115, |
| "learning_rate": 7.485838486788803e-06, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1521100401878357, |
| "step": 3265, |
| "valid_targets_mean": 2872.9, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 5.215311004784689, |
| "grad_norm": 0.5793143995524747, |
| "learning_rate": 7.4238965294184374e-06, |
| "loss": 0.1398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1307733952999115, |
| "step": 3270, |
| "valid_targets_mean": 2821.3, |
| "valid_targets_min": 1036 |
| }, |
| { |
| "epoch": 5.223285486443381, |
| "grad_norm": 0.616310991142214, |
| "learning_rate": 7.362153452039409e-06, |
| "loss": 0.1468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14505207538604736, |
| "step": 3275, |
| "valid_targets_mean": 3195.2, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 5.231259968102074, |
| "grad_norm": 0.6618556740317185, |
| "learning_rate": 7.300610231064056e-06, |
| "loss": 0.1609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1720818281173706, |
| "step": 3280, |
| "valid_targets_mean": 2992.6, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 5.239234449760765, |
| "grad_norm": 0.5790679579947826, |
| "learning_rate": 7.239267839744166e-06, |
| "loss": 0.1538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14833727478981018, |
| "step": 3285, |
| "valid_targets_mean": 3526.7, |
| "valid_targets_min": 1427 |
| }, |
| { |
| "epoch": 5.247208931419458, |
| "grad_norm": 0.6637878617650812, |
| "learning_rate": 7.178127248155604e-06, |
| "loss": 0.1422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14050063490867615, |
| "step": 3290, |
| "valid_targets_mean": 2340.9, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 5.25518341307815, |
| "grad_norm": 0.660304590549916, |
| "learning_rate": 7.117189423182917e-06, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12989658117294312, |
| "step": 3295, |
| "valid_targets_mean": 2483.1, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 5.2631578947368425, |
| "grad_norm": 0.5943952448901542, |
| "learning_rate": 7.056455328504104e-06, |
| "loss": 0.1338, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11984672397375107, |
| "step": 3300, |
| "valid_targets_mean": 2756.2, |
| "valid_targets_min": 1486 |
| }, |
| { |
| "epoch": 5.271132376395534, |
| "grad_norm": 0.7138160232972223, |
| "learning_rate": 6.995925924575342e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19342780113220215, |
| "step": 3305, |
| "valid_targets_mean": 2799.3, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 5.279106858054226, |
| "grad_norm": 0.6073033076078348, |
| "learning_rate": 6.935602168615792e-06, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17981265485286713, |
| "step": 3310, |
| "valid_targets_mean": 3221.4, |
| "valid_targets_min": 1094 |
| }, |
| { |
| "epoch": 5.287081339712919, |
| "grad_norm": 0.6198408636633029, |
| "learning_rate": 6.875485014592493e-06, |
| "loss": 0.1542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15747490525245667, |
| "step": 3315, |
| "valid_targets_mean": 2937.5, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 5.295055821371611, |
| "grad_norm": 0.6767478976464635, |
| "learning_rate": 6.815575413205235e-06, |
| "loss": 0.1414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1285533607006073, |
| "step": 3320, |
| "valid_targets_mean": 1891.3, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 5.303030303030303, |
| "grad_norm": 0.7336904785294537, |
| "learning_rate": 6.755874311871562e-06, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17466244101524353, |
| "step": 3325, |
| "valid_targets_mean": 3122.5, |
| "valid_targets_min": 1476 |
| }, |
| { |
| "epoch": 5.311004784688995, |
| "grad_norm": 0.6194185101743505, |
| "learning_rate": 6.696382654711777e-06, |
| "loss": 0.1411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17486578226089478, |
| "step": 3330, |
| "valid_targets_mean": 3025.5, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 5.318979266347688, |
| "grad_norm": 0.560663116939223, |
| "learning_rate": 6.637101382533986e-06, |
| "loss": 0.1459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14362575113773346, |
| "step": 3335, |
| "valid_targets_mean": 4083.6, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 5.32695374800638, |
| "grad_norm": 0.558896380159237, |
| "learning_rate": 6.578031432819263e-06, |
| "loss": 0.1324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13198032975196838, |
| "step": 3340, |
| "valid_targets_mean": 3352.3, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 5.3349282296650715, |
| "grad_norm": 0.5773043179265, |
| "learning_rate": 6.5191737397068015e-06, |
| "loss": 0.145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14222127199172974, |
| "step": 3345, |
| "valid_targets_mean": 3164.2, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 5.342902711323764, |
| "grad_norm": 0.6580880391527406, |
| "learning_rate": 6.460529233979127e-06, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14480651915073395, |
| "step": 3350, |
| "valid_targets_mean": 2353.7, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 5.350877192982456, |
| "grad_norm": 0.6843060196894174, |
| "learning_rate": 6.402098843047417e-06, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14741107821464539, |
| "step": 3355, |
| "valid_targets_mean": 2423.2, |
| "valid_targets_min": 1307 |
| }, |
| { |
| "epoch": 5.358851674641148, |
| "grad_norm": 0.6168049212851636, |
| "learning_rate": 6.343883490936791e-06, |
| "loss": 0.152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19296379387378693, |
| "step": 3360, |
| "valid_targets_mean": 2869.9, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 5.36682615629984, |
| "grad_norm": 0.6000631965540703, |
| "learning_rate": 6.285884098271739e-06, |
| "loss": 0.1371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13257285952568054, |
| "step": 3365, |
| "valid_targets_mean": 2764.1, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 5.374800637958533, |
| "grad_norm": 0.6563286214420883, |
| "learning_rate": 6.228101582261532e-06, |
| "loss": 0.156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17767846584320068, |
| "step": 3370, |
| "valid_targets_mean": 2802.8, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 5.382775119617225, |
| "grad_norm": 0.6960377409393284, |
| "learning_rate": 6.170536856685716e-06, |
| "loss": 0.1399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14913170039653778, |
| "step": 3375, |
| "valid_targets_mean": 2647.2, |
| "valid_targets_min": 983 |
| }, |
| { |
| "epoch": 5.3907496012759175, |
| "grad_norm": 0.6035783453810492, |
| "learning_rate": 6.113190831879698e-06, |
| "loss": 0.1538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1609422266483307, |
| "step": 3380, |
| "valid_targets_mean": 2827.8, |
| "valid_targets_min": 464 |
| }, |
| { |
| "epoch": 5.398724082934609, |
| "grad_norm": 0.6576832684505226, |
| "learning_rate": 6.056064414720317e-06, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1647460162639618, |
| "step": 3385, |
| "valid_targets_mean": 2748.5, |
| "valid_targets_min": 1202 |
| }, |
| { |
| "epoch": 5.4066985645933014, |
| "grad_norm": 0.6402347861728089, |
| "learning_rate": 5.999158508611496e-06, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13792529702186584, |
| "step": 3390, |
| "valid_targets_mean": 2541.5, |
| "valid_targets_min": 1040 |
| }, |
| { |
| "epoch": 5.414673046251994, |
| "grad_norm": 0.6754352948702881, |
| "learning_rate": 5.942474013469983e-06, |
| "loss": 0.1415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12908028066158295, |
| "step": 3395, |
| "valid_targets_mean": 2440.5, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 5.422647527910685, |
| "grad_norm": 0.6188190631444767, |
| "learning_rate": 5.886011825711117e-06, |
| "loss": 0.1507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15597115457057953, |
| "step": 3400, |
| "valid_targets_mean": 3018.2, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 5.430622009569378, |
| "grad_norm": 0.6027543335163618, |
| "learning_rate": 5.829772838234615e-06, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14923419058322906, |
| "step": 3405, |
| "valid_targets_mean": 3284.5, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 5.43859649122807, |
| "grad_norm": 0.6397744296419502, |
| "learning_rate": 5.773757940410503e-06, |
| "loss": 0.1446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1353510320186615, |
| "step": 3410, |
| "valid_targets_mean": 2694.5, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 5.446570972886763, |
| "grad_norm": 0.6602471322717809, |
| "learning_rate": 5.7179680180650055e-06, |
| "loss": 0.1592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12969273328781128, |
| "step": 3415, |
| "valid_targets_mean": 2616.6, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 5.454545454545454, |
| "grad_norm": 0.5963165890470659, |
| "learning_rate": 5.6624039534665775e-06, |
| "loss": 0.1587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13266560435295105, |
| "step": 3420, |
| "valid_targets_mean": 3448.6, |
| "valid_targets_min": 1318 |
| }, |
| { |
| "epoch": 5.4625199362041466, |
| "grad_norm": 0.5800990660141001, |
| "learning_rate": 5.607066625311925e-06, |
| "loss": 0.1416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12376489490270615, |
| "step": 3425, |
| "valid_targets_mean": 3497.6, |
| "valid_targets_min": 1274 |
| }, |
| { |
| "epoch": 5.470494417862839, |
| "grad_norm": 0.6832162024266292, |
| "learning_rate": 5.55195690871211e-06, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19239741563796997, |
| "step": 3430, |
| "valid_targets_mean": 2752.0, |
| "valid_targets_min": 1137 |
| }, |
| { |
| "epoch": 5.478468899521531, |
| "grad_norm": 0.6673288640941466, |
| "learning_rate": 5.497075675178727e-06, |
| "loss": 0.1628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12479984760284424, |
| "step": 3435, |
| "valid_targets_mean": 2185.1, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 5.486443381180223, |
| "grad_norm": 0.6827660786954963, |
| "learning_rate": 5.442423792610118e-06, |
| "loss": 0.1624, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15979987382888794, |
| "step": 3440, |
| "valid_targets_mean": 2559.2, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 5.494417862838915, |
| "grad_norm": 0.6648142440724466, |
| "learning_rate": 5.388002125277627e-06, |
| "loss": 0.1548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17778322100639343, |
| "step": 3445, |
| "valid_targets_mean": 2779.8, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 5.502392344497608, |
| "grad_norm": 0.6355104542187777, |
| "learning_rate": 5.333811533811945e-06, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2083851397037506, |
| "step": 3450, |
| "valid_targets_mean": 3374.8, |
| "valid_targets_min": 1312 |
| }, |
| { |
| "epoch": 5.5103668261563, |
| "grad_norm": 0.6324432750904236, |
| "learning_rate": 5.2798528751895265e-06, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14686718583106995, |
| "step": 3455, |
| "valid_targets_mean": 3143.6, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 5.518341307814992, |
| "grad_norm": 0.64304470738957, |
| "learning_rate": 5.226127002718984e-06, |
| "loss": 0.1391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13552545011043549, |
| "step": 3460, |
| "valid_targets_mean": 2855.8, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 5.526315789473684, |
| "grad_norm": 0.6068488328932702, |
| "learning_rate": 5.1726347660276424e-06, |
| "loss": 0.1479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1278594583272934, |
| "step": 3465, |
| "valid_targets_mean": 2640.1, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 5.5342902711323765, |
| "grad_norm": 0.6186581531893287, |
| "learning_rate": 5.119377011048066e-06, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18196257948875427, |
| "step": 3470, |
| "valid_targets_mean": 3513.9, |
| "valid_targets_min": 1403 |
| }, |
| { |
| "epoch": 5.542264752791069, |
| "grad_norm": 0.6669804977769721, |
| "learning_rate": 5.066354580004713e-06, |
| "loss": 0.1584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15941552817821503, |
| "step": 3475, |
| "valid_targets_mean": 2656.9, |
| "valid_targets_min": 1576 |
| }, |
| { |
| "epoch": 5.55023923444976, |
| "grad_norm": 0.5584247466984443, |
| "learning_rate": 5.013568311400599e-06, |
| "loss": 0.1418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1496984362602234, |
| "step": 3480, |
| "valid_targets_mean": 3440.2, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 5.558213716108453, |
| "grad_norm": 0.5968686738437612, |
| "learning_rate": 4.96101904000402e-06, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17291352152824402, |
| "step": 3485, |
| "valid_targets_mean": 3329.5, |
| "valid_targets_min": 1615 |
| }, |
| { |
| "epoch": 5.566188197767145, |
| "grad_norm": 0.6237372043857617, |
| "learning_rate": 4.908707596835396e-06, |
| "loss": 0.1515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12298108637332916, |
| "step": 3490, |
| "valid_targets_mean": 2981.9, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 5.574162679425838, |
| "grad_norm": 0.6346515143599728, |
| "learning_rate": 4.856634809154093e-06, |
| "loss": 0.1654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1985761821269989, |
| "step": 3495, |
| "valid_targets_mean": 3093.9, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 5.582137161084529, |
| "grad_norm": 0.6081952670860399, |
| "learning_rate": 4.804801500445338e-06, |
| "loss": 0.1788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17497466504573822, |
| "step": 3500, |
| "valid_targets_mean": 3463.1, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 5.590111642743222, |
| "grad_norm": 0.5677532822167262, |
| "learning_rate": 4.753208490407233e-06, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1865505427122116, |
| "step": 3505, |
| "valid_targets_mean": 3796.1, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 5.598086124401914, |
| "grad_norm": 0.6876441442315494, |
| "learning_rate": 4.701856594937744e-06, |
| "loss": 0.1466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17622287571430206, |
| "step": 3510, |
| "valid_targets_mean": 2459.9, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 5.606060606060606, |
| "grad_norm": 0.6121241994834047, |
| "learning_rate": 4.650746626121838e-06, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16413599252700806, |
| "step": 3515, |
| "valid_targets_mean": 2919.9, |
| "valid_targets_min": 1113 |
| }, |
| { |
| "epoch": 5.614035087719298, |
| "grad_norm": 0.6187331081816392, |
| "learning_rate": 4.5998793922186315e-06, |
| "loss": 0.1413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1643972545862198, |
| "step": 3520, |
| "valid_targets_mean": 3124.5, |
| "valid_targets_min": 1606 |
| }, |
| { |
| "epoch": 5.62200956937799, |
| "grad_norm": 0.578937807626536, |
| "learning_rate": 4.549255697648576e-06, |
| "loss": 0.1387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14879783987998962, |
| "step": 3525, |
| "valid_targets_mean": 2991.8, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 5.629984051036683, |
| "grad_norm": 0.558863133501645, |
| "learning_rate": 4.498876342980796e-06, |
| "loss": 0.1311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16602568328380585, |
| "step": 3530, |
| "valid_targets_mean": 3746.1, |
| "valid_targets_min": 1425 |
| }, |
| { |
| "epoch": 5.637958532695375, |
| "grad_norm": 0.5968740877187344, |
| "learning_rate": 4.448742124920368e-06, |
| "loss": 0.1513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16445884108543396, |
| "step": 3535, |
| "valid_targets_mean": 3706.6, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 5.645933014354067, |
| "grad_norm": 0.59401001935693, |
| "learning_rate": 4.39885383629576e-06, |
| "loss": 0.1424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12195871025323868, |
| "step": 3540, |
| "valid_targets_mean": 2801.0, |
| "valid_targets_min": 1402 |
| }, |
| { |
| "epoch": 5.653907496012759, |
| "grad_norm": 0.6810295811672586, |
| "learning_rate": 4.349212266046285e-06, |
| "loss": 0.1475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14159944653511047, |
| "step": 3545, |
| "valid_targets_mean": 2317.9, |
| "valid_targets_min": 1367 |
| }, |
| { |
| "epoch": 5.6618819776714515, |
| "grad_norm": 0.5657955138742755, |
| "learning_rate": 4.299818199209629e-06, |
| "loss": 0.1456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13119353353977203, |
| "step": 3550, |
| "valid_targets_mean": 3540.1, |
| "valid_targets_min": 1045 |
| }, |
| { |
| "epoch": 5.669856459330144, |
| "grad_norm": 0.8104409273690198, |
| "learning_rate": 4.250672416909407e-06, |
| "loss": 0.1576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1876513808965683, |
| "step": 3555, |
| "valid_targets_mean": 3162.6, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 5.6778309409888355, |
| "grad_norm": 0.6124381093965978, |
| "learning_rate": 4.201775696342862e-06, |
| "loss": 0.1579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13993270695209503, |
| "step": 3560, |
| "valid_targets_mean": 2776.8, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 5.685805422647528, |
| "grad_norm": 0.6570663102638316, |
| "learning_rate": 4.153128810768517e-06, |
| "loss": 0.1452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19519951939582825, |
| "step": 3565, |
| "valid_targets_mean": 3120.6, |
| "valid_targets_min": 1299 |
| }, |
| { |
| "epoch": 5.69377990430622, |
| "grad_norm": 0.6605723879914376, |
| "learning_rate": 4.104732529493991e-06, |
| "loss": 0.1448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13901135325431824, |
| "step": 3570, |
| "valid_targets_mean": 2307.8, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 5.701754385964913, |
| "grad_norm": 0.6408169381973454, |
| "learning_rate": 4.056587617863825e-06, |
| "loss": 0.1483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14372986555099487, |
| "step": 3575, |
| "valid_targets_mean": 2505.6, |
| "valid_targets_min": 1173 |
| }, |
| { |
| "epoch": 5.709728867623604, |
| "grad_norm": 0.6526244361410768, |
| "learning_rate": 4.008694837247345e-06, |
| "loss": 0.1506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15499386191368103, |
| "step": 3580, |
| "valid_targets_mean": 2597.3, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 5.717703349282297, |
| "grad_norm": 0.7711661892385364, |
| "learning_rate": 3.961054945026674e-06, |
| "loss": 0.1375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13299037516117096, |
| "step": 3585, |
| "valid_targets_mean": 2595.4, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 5.725677830940989, |
| "grad_norm": 0.5653622529411262, |
| "learning_rate": 3.913668694584705e-06, |
| "loss": 0.144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1906440258026123, |
| "step": 3590, |
| "valid_targets_mean": 4048.9, |
| "valid_targets_min": 1326 |
| }, |
| { |
| "epoch": 5.733652312599681, |
| "grad_norm": 0.6059994868500017, |
| "learning_rate": 3.866536835293227e-06, |
| "loss": 0.1645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1835460066795349, |
| "step": 3595, |
| "valid_targets_mean": 3213.8, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 5.741626794258373, |
| "grad_norm": 0.5632286313650832, |
| "learning_rate": 3.819660112501053e-06, |
| "loss": 0.1405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11964814364910126, |
| "step": 3600, |
| "valid_targets_mean": 3211.3, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 5.749601275917065, |
| "grad_norm": 0.5656484979331154, |
| "learning_rate": 3.773039267522227e-06, |
| "loss": 0.1411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13798847794532776, |
| "step": 3605, |
| "valid_targets_mean": 3497.9, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 5.757575757575758, |
| "grad_norm": 0.6669280692908005, |
| "learning_rate": 3.72667503762433e-06, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12836626172065735, |
| "step": 3610, |
| "valid_targets_mean": 2467.6, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 5.76555023923445, |
| "grad_norm": 0.6105128759695477, |
| "learning_rate": 3.680568156016786e-06, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21265044808387756, |
| "step": 3615, |
| "valid_targets_mean": 3298.8, |
| "valid_targets_min": 1230 |
| }, |
| { |
| "epoch": 5.773524720893142, |
| "grad_norm": 0.7614562771653794, |
| "learning_rate": 3.6347193518392776e-06, |
| "loss": 0.1462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14158612489700317, |
| "step": 3620, |
| "valid_targets_mean": 2508.9, |
| "valid_targets_min": 862 |
| }, |
| { |
| "epoch": 5.781499202551834, |
| "grad_norm": 0.5871957486109551, |
| "learning_rate": 3.58912935015024e-06, |
| "loss": 0.1487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1426844745874405, |
| "step": 3625, |
| "valid_targets_mean": 3297.4, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 5.7894736842105265, |
| "grad_norm": 0.7064727598286994, |
| "learning_rate": 3.543798871915367e-06, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.154343381524086, |
| "step": 3630, |
| "valid_targets_mean": 2664.8, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 5.797448165869218, |
| "grad_norm": 0.6633685511467207, |
| "learning_rate": 3.498728633996209e-06, |
| "loss": 0.1357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12906265258789062, |
| "step": 3635, |
| "valid_targets_mean": 2260.7, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 5.8054226475279105, |
| "grad_norm": 0.6214965202746205, |
| "learning_rate": 3.453919349138859e-06, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11440666764974594, |
| "step": 3640, |
| "valid_targets_mean": 2508.8, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 5.813397129186603, |
| "grad_norm": 0.5769112478791388, |
| "learning_rate": 3.4093717259626514e-06, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11280746757984161, |
| "step": 3645, |
| "valid_targets_mean": 2709.9, |
| "valid_targets_min": 1568 |
| }, |
| { |
| "epoch": 5.821371610845295, |
| "grad_norm": 0.6463824538730006, |
| "learning_rate": 3.365086468948988e-06, |
| "loss": 0.173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1195705458521843, |
| "step": 3650, |
| "valid_targets_mean": 2292.4, |
| "valid_targets_min": 1154 |
| }, |
| { |
| "epoch": 5.829346092503988, |
| "grad_norm": 0.6391150749806931, |
| "learning_rate": 3.321064278430175e-06, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1568872481584549, |
| "step": 3655, |
| "valid_targets_mean": 3043.6, |
| "valid_targets_min": 1213 |
| }, |
| { |
| "epoch": 5.837320574162679, |
| "grad_norm": 0.519107762034051, |
| "learning_rate": 3.277305850578345e-06, |
| "loss": 0.1359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11462641507387161, |
| "step": 3660, |
| "valid_targets_mean": 3768.6, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 5.845295055821372, |
| "grad_norm": 0.5558282842216485, |
| "learning_rate": 3.2338118773944684e-06, |
| "loss": 0.1562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13219889998435974, |
| "step": 3665, |
| "valid_targets_mean": 3827.9, |
| "valid_targets_min": 1308 |
| }, |
| { |
| "epoch": 5.853269537480064, |
| "grad_norm": 0.712652647722326, |
| "learning_rate": 3.1905830466973975e-06, |
| "loss": 0.1713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2413114309310913, |
| "step": 3670, |
| "valid_targets_mean": 3104.1, |
| "valid_targets_min": 1377 |
| }, |
| { |
| "epoch": 5.861244019138756, |
| "grad_norm": 0.8087033611981687, |
| "learning_rate": 3.14762004211298e-06, |
| "loss": 0.1499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13118065893650055, |
| "step": 3675, |
| "valid_targets_mean": 2179.2, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 5.869218500797448, |
| "grad_norm": 0.6965194625677074, |
| "learning_rate": 3.1049235430632696e-06, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17841684818267822, |
| "step": 3680, |
| "valid_targets_mean": 2457.4, |
| "valid_targets_min": 1164 |
| }, |
| { |
| "epoch": 5.87719298245614, |
| "grad_norm": 0.6429474542089771, |
| "learning_rate": 3.062494224755759e-06, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20610585808753967, |
| "step": 3685, |
| "valid_targets_mean": 3904.6, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 5.885167464114833, |
| "grad_norm": 0.6122324755768935, |
| "learning_rate": 3.0203327581727195e-06, |
| "loss": 0.1431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11550375819206238, |
| "step": 3690, |
| "valid_targets_mean": 2673.4, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 5.893141945773524, |
| "grad_norm": 0.6890872162742891, |
| "learning_rate": 2.9784398100605937e-06, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17845694720745087, |
| "step": 3695, |
| "valid_targets_mean": 2944.2, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 5.901116427432217, |
| "grad_norm": 0.6524913255544141, |
| "learning_rate": 2.9368160429194127e-06, |
| "loss": 0.1511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1449909806251526, |
| "step": 3700, |
| "valid_targets_mean": 2448.1, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 5.909090909090909, |
| "grad_norm": 0.5680543220274574, |
| "learning_rate": 2.895462114992371e-06, |
| "loss": 0.1521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11523935198783875, |
| "step": 3705, |
| "valid_targets_mean": 2600.8, |
| "valid_targets_min": 1253 |
| }, |
| { |
| "epoch": 5.917065390749602, |
| "grad_norm": 0.6588147712991279, |
| "learning_rate": 2.8543786802553943e-06, |
| "loss": 0.1468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1229035034775734, |
| "step": 3710, |
| "valid_targets_mean": 2522.4, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 5.925039872408293, |
| "grad_norm": 0.7745513255839773, |
| "learning_rate": 2.813566388406781e-06, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12802991271018982, |
| "step": 3715, |
| "valid_targets_mean": 2456.6, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 5.9330143540669855, |
| "grad_norm": 0.7446954349027073, |
| "learning_rate": 2.773025884856957e-06, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17623551189899445, |
| "step": 3720, |
| "valid_targets_mean": 2696.7, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 5.940988835725678, |
| "grad_norm": 0.6780845611384435, |
| "learning_rate": 2.7327578107182585e-06, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13724076747894287, |
| "step": 3725, |
| "valid_targets_mean": 2162.1, |
| "valid_targets_min": 1202 |
| }, |
| { |
| "epoch": 5.94896331738437, |
| "grad_norm": 0.6943638613747845, |
| "learning_rate": 2.692762802794775e-06, |
| "loss": 0.1502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17806532979011536, |
| "step": 3730, |
| "valid_targets_mean": 2529.4, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 5.956937799043062, |
| "grad_norm": 0.6260683420021232, |
| "learning_rate": 2.6530414935723104e-06, |
| "loss": 0.1483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14727982878684998, |
| "step": 3735, |
| "valid_targets_mean": 3022.1, |
| "valid_targets_min": 1694 |
| }, |
| { |
| "epoch": 5.964912280701754, |
| "grad_norm": 0.5711184251561199, |
| "learning_rate": 2.6135945112083506e-06, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2091876119375229, |
| "step": 3740, |
| "valid_targets_mean": 3923.7, |
| "valid_targets_min": 986 |
| }, |
| { |
| "epoch": 5.972886762360447, |
| "grad_norm": 0.660900776552596, |
| "learning_rate": 2.574422479522156e-06, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14469899237155914, |
| "step": 3745, |
| "valid_targets_mean": 2478.1, |
| "valid_targets_min": 1142 |
| }, |
| { |
| "epoch": 5.980861244019139, |
| "grad_norm": 0.6698862853262395, |
| "learning_rate": 2.535526017984884e-06, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1301461160182953, |
| "step": 3750, |
| "valid_targets_mean": 2119.2, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 5.988835725677831, |
| "grad_norm": 0.6050519500902528, |
| "learning_rate": 2.4969057417097807e-06, |
| "loss": 0.1389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1766177862882614, |
| "step": 3755, |
| "valid_targets_mean": 3424.4, |
| "valid_targets_min": 1367 |
| }, |
| { |
| "epoch": 5.996810207336523, |
| "grad_norm": 0.6388975080344989, |
| "learning_rate": 2.458562261442483e-06, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12530069053173065, |
| "step": 3760, |
| "valid_targets_mean": 2602.0, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 6.0047846889952154, |
| "grad_norm": 0.5447128366200804, |
| "learning_rate": 2.4204961835513263e-06, |
| "loss": 0.1464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13561969995498657, |
| "step": 3765, |
| "valid_targets_mean": 3309.5, |
| "valid_targets_min": 1247 |
| }, |
| { |
| "epoch": 6.012759170653908, |
| "grad_norm": 0.6139508350380686, |
| "learning_rate": 2.3827081100177797e-06, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.161412313580513, |
| "step": 3770, |
| "valid_targets_mean": 2966.3, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 6.020733652312599, |
| "grad_norm": 0.6194921775961351, |
| "learning_rate": 2.3451986384269266e-06, |
| "loss": 0.1374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1445777714252472, |
| "step": 3775, |
| "valid_targets_mean": 2521.9, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 6.028708133971292, |
| "grad_norm": 0.637631777049995, |
| "learning_rate": 2.307968361957993e-06, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2161223292350769, |
| "step": 3780, |
| "valid_targets_mean": 3306.6, |
| "valid_targets_min": 1087 |
| }, |
| { |
| "epoch": 6.036682615629984, |
| "grad_norm": 0.738533022432783, |
| "learning_rate": 2.2710178693749805e-06, |
| "loss": 0.1557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17869213223457336, |
| "step": 3785, |
| "valid_targets_mean": 2190.9, |
| "valid_targets_min": 1312 |
| }, |
| { |
| "epoch": 6.044657097288677, |
| "grad_norm": 0.6527674057226728, |
| "learning_rate": 2.2343477450173665e-06, |
| "loss": 0.1469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1218600869178772, |
| "step": 3790, |
| "valid_targets_mean": 2779.9, |
| "valid_targets_min": 1470 |
| }, |
| { |
| "epoch": 6.052631578947368, |
| "grad_norm": 0.6630351920280422, |
| "learning_rate": 2.197958568790839e-06, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17970821261405945, |
| "step": 3795, |
| "valid_targets_mean": 3350.1, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 6.0606060606060606, |
| "grad_norm": 0.5672542193779837, |
| "learning_rate": 2.161850916158148e-06, |
| "loss": 0.1267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12792956829071045, |
| "step": 3800, |
| "valid_targets_mean": 3574.1, |
| "valid_targets_min": 1535 |
| }, |
| { |
| "epoch": 6.068580542264753, |
| "grad_norm": 0.6123013687625073, |
| "learning_rate": 2.1260253581299996e-06, |
| "loss": 0.135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13635091483592987, |
| "step": 3805, |
| "valid_targets_mean": 3412.9, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 6.076555023923445, |
| "grad_norm": 0.6534334160731141, |
| "learning_rate": 2.0904824612560046e-06, |
| "loss": 0.1503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.125827357172966, |
| "step": 3810, |
| "valid_targets_mean": 2346.2, |
| "valid_targets_min": 1172 |
| }, |
| { |
| "epoch": 6.084529505582137, |
| "grad_norm": 0.6294651199199671, |
| "learning_rate": 2.0552227876157536e-06, |
| "loss": 0.1283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12857142090797424, |
| "step": 3815, |
| "valid_targets_mean": 2880.9, |
| "valid_targets_min": 1383 |
| }, |
| { |
| "epoch": 6.092503987240829, |
| "grad_norm": 0.6391181961066408, |
| "learning_rate": 2.020246894809912e-06, |
| "loss": 0.1473, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14293187856674194, |
| "step": 3820, |
| "valid_targets_mean": 2485.8, |
| "valid_targets_min": 996 |
| }, |
| { |
| "epoch": 6.100478468899522, |
| "grad_norm": 0.7234527348754299, |
| "learning_rate": 1.9855553359513836e-06, |
| "loss": 0.1298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1257050782442093, |
| "step": 3825, |
| "valid_targets_mean": 2228.8, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 6.108452950558214, |
| "grad_norm": 0.6192919926151812, |
| "learning_rate": 1.9511486596566054e-06, |
| "loss": 0.1596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10207498073577881, |
| "step": 3830, |
| "valid_targets_mean": 2159.6, |
| "valid_targets_min": 1140 |
| }, |
| { |
| "epoch": 6.116427432216906, |
| "grad_norm": 0.5359741447900245, |
| "learning_rate": 1.917027410036825e-06, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1523303985595703, |
| "step": 3835, |
| "valid_targets_mean": 4409.8, |
| "valid_targets_min": 1701 |
| }, |
| { |
| "epoch": 6.124401913875598, |
| "grad_norm": 0.6692422456172075, |
| "learning_rate": 1.8831921266895348e-06, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1260911226272583, |
| "step": 3840, |
| "valid_targets_mean": 2306.9, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 6.1323763955342905, |
| "grad_norm": 0.6423890090470709, |
| "learning_rate": 1.8496433446899197e-06, |
| "loss": 0.1463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13464131951332092, |
| "step": 3845, |
| "valid_targets_mean": 2437.8, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 6.140350877192983, |
| "grad_norm": 0.6902212059072099, |
| "learning_rate": 1.8163815945823881e-06, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1537630259990692, |
| "step": 3850, |
| "valid_targets_mean": 2586.1, |
| "valid_targets_min": 1231 |
| }, |
| { |
| "epoch": 6.148325358851674, |
| "grad_norm": 0.5846067426158729, |
| "learning_rate": 1.7834074023722082e-06, |
| "loss": 0.1369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1573687642812729, |
| "step": 3855, |
| "valid_targets_mean": 3312.4, |
| "valid_targets_min": 1595 |
| }, |
| { |
| "epoch": 6.156299840510367, |
| "grad_norm": 0.6205363998371608, |
| "learning_rate": 1.7507212895171632e-06, |
| "loss": 0.1628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17224471271038055, |
| "step": 3860, |
| "valid_targets_mean": 3192.4, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 6.164274322169059, |
| "grad_norm": 0.6482621142553876, |
| "learning_rate": 1.7183237729193081e-06, |
| "loss": 0.1554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14119577407836914, |
| "step": 3865, |
| "valid_targets_mean": 3200.1, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 6.172248803827751, |
| "grad_norm": 0.5945417763389266, |
| "learning_rate": 1.6862153649168211e-06, |
| "loss": 0.1667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15197794139385223, |
| "step": 3870, |
| "valid_targets_mean": 4120.8, |
| "valid_targets_min": 1689 |
| }, |
| { |
| "epoch": 6.180223285486443, |
| "grad_norm": 0.6424920862651418, |
| "learning_rate": 1.6543965732758737e-06, |
| "loss": 0.1434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16543099284172058, |
| "step": 3875, |
| "valid_targets_mean": 3316.8, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 6.188197767145136, |
| "grad_norm": 0.7111768445227941, |
| "learning_rate": 1.6228679011826032e-06, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13221696019172668, |
| "step": 3880, |
| "valid_targets_mean": 2675.8, |
| "valid_targets_min": 1192 |
| }, |
| { |
| "epoch": 6.196172248803828, |
| "grad_norm": 0.5797517020648623, |
| "learning_rate": 1.591629847235172e-06, |
| "loss": 0.146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18317551910877228, |
| "step": 3885, |
| "valid_targets_mean": 3720.1, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 6.2041467304625195, |
| "grad_norm": 0.6961211896005433, |
| "learning_rate": 1.5606829054358686e-06, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1390981823205948, |
| "step": 3890, |
| "valid_targets_mean": 2520.2, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 6.212121212121212, |
| "grad_norm": 0.647792425598567, |
| "learning_rate": 1.5300275651832963e-06, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1477465182542801, |
| "step": 3895, |
| "valid_targets_mean": 2948.1, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 6.220095693779904, |
| "grad_norm": 0.6425614569659422, |
| "learning_rate": 1.499664311264648e-06, |
| "loss": 0.1331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11879262328147888, |
| "step": 3900, |
| "valid_targets_mean": 2411.4, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 6.228070175438597, |
| "grad_norm": 0.6560346228896774, |
| "learning_rate": 1.4695936238480135e-06, |
| "loss": 0.1544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11653897911310196, |
| "step": 3905, |
| "valid_targets_mean": 2464.3, |
| "valid_targets_min": 1270 |
| }, |
| { |
| "epoch": 6.236044657097288, |
| "grad_norm": 0.5913785898356396, |
| "learning_rate": 1.4398159784748144e-06, |
| "loss": 0.12, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11476568132638931, |
| "step": 3910, |
| "valid_targets_mean": 2866.1, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 6.244019138755981, |
| "grad_norm": 0.6344887654680683, |
| "learning_rate": 1.4103318460522598e-06, |
| "loss": 0.1455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11846456676721573, |
| "step": 3915, |
| "valid_targets_mean": 2540.3, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 6.251993620414673, |
| "grad_norm": 0.6352575814931524, |
| "learning_rate": 1.3811416928459177e-06, |
| "loss": 0.1463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12151379138231277, |
| "step": 3920, |
| "valid_targets_mean": 3051.1, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 6.2599681020733655, |
| "grad_norm": 0.6533137247391657, |
| "learning_rate": 1.3522459804723353e-06, |
| "loss": 0.1484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15973787009716034, |
| "step": 3925, |
| "valid_targets_mean": 2525.4, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 6.267942583732057, |
| "grad_norm": 0.6295268930003071, |
| "learning_rate": 1.3236451658917293e-06, |
| "loss": 0.1299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1486193835735321, |
| "step": 3930, |
| "valid_targets_mean": 3116.2, |
| "valid_targets_min": 1571 |
| }, |
| { |
| "epoch": 6.2759170653907494, |
| "grad_norm": 0.6830753046565643, |
| "learning_rate": 1.2953397014007728e-06, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14981475472450256, |
| "step": 3935, |
| "valid_targets_mean": 2623.8, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 6.283891547049442, |
| "grad_norm": 0.6028379965845788, |
| "learning_rate": 1.2673300346254447e-06, |
| "loss": 0.1402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14106810092926025, |
| "step": 3940, |
| "valid_targets_mean": 3649.6, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 6.291866028708134, |
| "grad_norm": 0.6231653564515409, |
| "learning_rate": 1.239616608513925e-06, |
| "loss": 0.1443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.132007896900177, |
| "step": 3945, |
| "valid_targets_mean": 2914.5, |
| "valid_targets_min": 1202 |
| }, |
| { |
| "epoch": 6.299840510366826, |
| "grad_norm": 0.7144670706226991, |
| "learning_rate": 1.2121998613296259e-06, |
| "loss": 0.1372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1385582983493805, |
| "step": 3950, |
| "valid_targets_mean": 3412.4, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 6.307814992025518, |
| "grad_norm": 0.6711423788649739, |
| "learning_rate": 1.1850802266442396e-06, |
| "loss": 0.1428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1569822132587433, |
| "step": 3955, |
| "valid_targets_mean": 2483.0, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 6.315789473684211, |
| "grad_norm": 0.6347098632735023, |
| "learning_rate": 1.1582581333308784e-06, |
| "loss": 0.1583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17010065913200378, |
| "step": 3960, |
| "valid_targets_mean": 3410.2, |
| "valid_targets_min": 1383 |
| }, |
| { |
| "epoch": 6.323763955342903, |
| "grad_norm": 0.7134750123487895, |
| "learning_rate": 1.1317340055573122e-06, |
| "loss": 0.1391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14928308129310608, |
| "step": 3965, |
| "valid_targets_mean": 2386.5, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 6.3317384370015946, |
| "grad_norm": 0.7403552637539116, |
| "learning_rate": 1.1055082627792357e-06, |
| "loss": 0.1535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1645737886428833, |
| "step": 3970, |
| "valid_targets_mean": 2855.1, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 6.339712918660287, |
| "grad_norm": 0.7439603296881704, |
| "learning_rate": 1.0795813197336602e-06, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16814234852790833, |
| "step": 3975, |
| "valid_targets_mean": 2641.1, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 6.347687400318979, |
| "grad_norm": 0.8558358007646358, |
| "learning_rate": 1.0539535864323391e-06, |
| "loss": 0.1577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17330396175384521, |
| "step": 3980, |
| "valid_targets_mean": 2434.4, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 6.355661881977672, |
| "grad_norm": 0.596512645985537, |
| "learning_rate": 1.0286254681552777e-06, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15838459134101868, |
| "step": 3985, |
| "valid_targets_mean": 3372.1, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 6.363636363636363, |
| "grad_norm": 0.6467431933291012, |
| "learning_rate": 1.0035973654443466e-06, |
| "loss": 0.1425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12675225734710693, |
| "step": 3990, |
| "valid_targets_mean": 2303.3, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 6.371610845295056, |
| "grad_norm": 0.6266060938418669, |
| "learning_rate": 9.788696740969295e-07, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19282695651054382, |
| "step": 3995, |
| "valid_targets_mean": 3250.9, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 6.379585326953748, |
| "grad_norm": 0.603105276214445, |
| "learning_rate": 9.544427851596661e-07, |
| "loss": 0.1489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1304808259010315, |
| "step": 4000, |
| "valid_targets_mean": 2783.1, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 6.3875598086124405, |
| "grad_norm": 0.6045810868867998, |
| "learning_rate": 9.303170849222764e-07, |
| "loss": 0.1457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13092729449272156, |
| "step": 4005, |
| "valid_targets_mean": 3034.9, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 6.395534290271132, |
| "grad_norm": 0.6725605538366902, |
| "learning_rate": 9.064929549114421e-07, |
| "loss": 0.1489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13961663842201233, |
| "step": 4010, |
| "valid_targets_mean": 3021.6, |
| "valid_targets_min": 1365 |
| }, |
| { |
| "epoch": 6.4035087719298245, |
| "grad_norm": 0.5280456680065018, |
| "learning_rate": 8.829707718847835e-07, |
| "loss": 0.1628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21119526028633118, |
| "step": 4015, |
| "valid_targets_mean": 5034.1, |
| "valid_targets_min": 1383 |
| }, |
| { |
| "epoch": 6.411483253588517, |
| "grad_norm": 0.6870027710411994, |
| "learning_rate": 8.597509078248923e-07, |
| "loss": 0.1373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11793472617864609, |
| "step": 4020, |
| "valid_targets_mean": 3262.4, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 6.419457735247209, |
| "grad_norm": 0.6636142716776369, |
| "learning_rate": 8.368337299334461e-07, |
| "loss": 0.1498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15093785524368286, |
| "step": 4025, |
| "valid_targets_mean": 2730.2, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 6.427432216905901, |
| "grad_norm": 0.6510224950909901, |
| "learning_rate": 8.142196006254144e-07, |
| "loss": 0.1526, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12001948803663254, |
| "step": 4030, |
| "valid_targets_mean": 2182.4, |
| "valid_targets_min": 1179 |
| }, |
| { |
| "epoch": 6.435406698564593, |
| "grad_norm": 0.6245752131587334, |
| "learning_rate": 7.919088775233264e-07, |
| "loss": 0.1422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11676537990570068, |
| "step": 4035, |
| "valid_targets_mean": 2794.9, |
| "valid_targets_min": 1104 |
| }, |
| { |
| "epoch": 6.443381180223286, |
| "grad_norm": 0.7044813681400015, |
| "learning_rate": 7.699019134515917e-07, |
| "loss": 0.1469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16797736287117004, |
| "step": 4040, |
| "valid_targets_mean": 2557.8, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 6.451355661881978, |
| "grad_norm": 0.6616002971033802, |
| "learning_rate": 7.48199056430956e-07, |
| "loss": 0.1454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13709191977977753, |
| "step": 4045, |
| "valid_targets_mean": 2547.1, |
| "valid_targets_min": 1067 |
| }, |
| { |
| "epoch": 6.45933014354067, |
| "grad_norm": 0.5983415327849058, |
| "learning_rate": 7.268006496729762e-07, |
| "loss": 0.1413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1570061445236206, |
| "step": 4050, |
| "valid_targets_mean": 3875.0, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 6.467304625199362, |
| "grad_norm": 0.5883938864827607, |
| "learning_rate": 7.057070315745851e-07, |
| "loss": 0.1454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14021623134613037, |
| "step": 4055, |
| "valid_targets_mean": 3387.9, |
| "valid_targets_min": 1158 |
| }, |
| { |
| "epoch": 6.475279106858054, |
| "grad_norm": 0.6381148460727919, |
| "learning_rate": 6.849185357127686e-07, |
| "loss": 0.1436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1419590264558792, |
| "step": 4060, |
| "valid_targets_mean": 2658.4, |
| "valid_targets_min": 1063 |
| }, |
| { |
| "epoch": 6.483253588516747, |
| "grad_norm": 0.5626153764312638, |
| "learning_rate": 6.64435490839257e-07, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1861887127161026, |
| "step": 4065, |
| "valid_targets_mean": 4139.4, |
| "valid_targets_min": 1263 |
| }, |
| { |
| "epoch": 6.491228070175438, |
| "grad_norm": 0.6357101886196256, |
| "learning_rate": 6.442582208753578e-07, |
| "loss": 0.1437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15499606728553772, |
| "step": 4070, |
| "valid_targets_mean": 2689.3, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 6.499202551834131, |
| "grad_norm": 0.6910304026583559, |
| "learning_rate": 6.243870449068068e-07, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2073277235031128, |
| "step": 4075, |
| "valid_targets_mean": 2765.3, |
| "valid_targets_min": 1104 |
| }, |
| { |
| "epoch": 6.507177033492823, |
| "grad_norm": 0.58851977473546, |
| "learning_rate": 6.048222771787382e-07, |
| "loss": 0.1526, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14743703603744507, |
| "step": 4080, |
| "valid_targets_mean": 3211.2, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 6.515151515151516, |
| "grad_norm": 0.6178750502243548, |
| "learning_rate": 5.85564227090707e-07, |
| "loss": 0.1472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17087917029857635, |
| "step": 4085, |
| "valid_targets_mean": 3659.9, |
| "valid_targets_min": 1231 |
| }, |
| { |
| "epoch": 6.523125996810207, |
| "grad_norm": 0.6938061545052304, |
| "learning_rate": 5.666131991917989e-07, |
| "loss": 0.1333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1300240010023117, |
| "step": 4090, |
| "valid_targets_mean": 2109.9, |
| "valid_targets_min": 1371 |
| }, |
| { |
| "epoch": 6.5311004784688995, |
| "grad_norm": 0.6642575349820269, |
| "learning_rate": 5.479694931758194e-07, |
| "loss": 0.1434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1611027717590332, |
| "step": 4095, |
| "valid_targets_mean": 2830.8, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 6.539074960127592, |
| "grad_norm": 0.6070107059437827, |
| "learning_rate": 5.296334038765483e-07, |
| "loss": 0.1428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13571247458457947, |
| "step": 4100, |
| "valid_targets_mean": 2914.1, |
| "valid_targets_min": 1169 |
| }, |
| { |
| "epoch": 6.5470494417862835, |
| "grad_norm": 0.6293749348387128, |
| "learning_rate": 5.116052212630696e-07, |
| "loss": 0.1219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12869954109191895, |
| "step": 4105, |
| "valid_targets_mean": 2649.8, |
| "valid_targets_min": 1237 |
| }, |
| { |
| "epoch": 6.555023923444976, |
| "grad_norm": 0.6390191087235467, |
| "learning_rate": 4.938852304352026e-07, |
| "loss": 0.1565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2021748423576355, |
| "step": 4110, |
| "valid_targets_mean": 3688.9, |
| "valid_targets_min": 961 |
| }, |
| { |
| "epoch": 6.562998405103668, |
| "grad_norm": 0.6627492608631983, |
| "learning_rate": 4.7647371161898547e-07, |
| "loss": 0.123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11246272921562195, |
| "step": 4115, |
| "valid_targets_mean": 2175.8, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 6.570972886762361, |
| "grad_norm": 0.62234154665454, |
| "learning_rate": 4.593709401622359e-07, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13496442139148712, |
| "step": 4120, |
| "valid_targets_mean": 2949.5, |
| "valid_targets_min": 1421 |
| }, |
| { |
| "epoch": 6.578947368421053, |
| "grad_norm": 0.605016951584934, |
| "learning_rate": 4.425771865302153e-07, |
| "loss": 0.1448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14617837965488434, |
| "step": 4125, |
| "valid_targets_mean": 3346.9, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 6.586921850079745, |
| "grad_norm": 0.7083006189079447, |
| "learning_rate": 4.2609271630133174e-07, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17233526706695557, |
| "step": 4130, |
| "valid_targets_mean": 2765.6, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 6.594896331738437, |
| "grad_norm": 0.6422713513507917, |
| "learning_rate": 4.099177901629525e-07, |
| "loss": 0.1546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14676770567893982, |
| "step": 4135, |
| "valid_targets_mean": 2894.6, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 6.6028708133971294, |
| "grad_norm": 0.5862133305303223, |
| "learning_rate": 3.9405266390727836e-07, |
| "loss": 0.143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1555536389350891, |
| "step": 4140, |
| "valid_targets_mean": 4025.8, |
| "valid_targets_min": 1297 |
| }, |
| { |
| "epoch": 6.610845295055821, |
| "grad_norm": 0.649117157563772, |
| "learning_rate": 3.7849758842729344e-07, |
| "loss": 0.1335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13616587221622467, |
| "step": 4145, |
| "valid_targets_mean": 2954.0, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 6.618819776714513, |
| "grad_norm": 0.7199166365178159, |
| "learning_rate": 3.632528097128085e-07, |
| "loss": 0.1491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14053437113761902, |
| "step": 4150, |
| "valid_targets_mean": 2117.9, |
| "valid_targets_min": 1069 |
| }, |
| { |
| "epoch": 6.626794258373206, |
| "grad_norm": 0.6425703556421833, |
| "learning_rate": 3.48318568846564e-07, |
| "loss": 0.1454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14537614583969116, |
| "step": 4155, |
| "valid_targets_mean": 3269.3, |
| "valid_targets_min": 1160 |
| }, |
| { |
| "epoch": 6.634768740031898, |
| "grad_norm": 0.6587464590369769, |
| "learning_rate": 3.336951020004087e-07, |
| "loss": 0.1276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13485220074653625, |
| "step": 4160, |
| "valid_targets_mean": 2578.7, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 6.64274322169059, |
| "grad_norm": 0.6768113096854557, |
| "learning_rate": 3.1938264043158694e-07, |
| "loss": 0.1319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13307702541351318, |
| "step": 4165, |
| "valid_targets_mean": 2578.9, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 6.650717703349282, |
| "grad_norm": 0.5890393534004379, |
| "learning_rate": 3.05381410479062e-07, |
| "loss": 0.1327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11060281097888947, |
| "step": 4170, |
| "valid_targets_mean": 2939.9, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 6.6586921850079746, |
| "grad_norm": 0.6522407226289458, |
| "learning_rate": 2.916916335599407e-07, |
| "loss": 0.1301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13013817369937897, |
| "step": 4175, |
| "valid_targets_mean": 2759.8, |
| "valid_targets_min": 1309 |
| }, |
| { |
| "epoch": 6.666666666666667, |
| "grad_norm": 0.6332293594628468, |
| "learning_rate": 2.783135261659831e-07, |
| "loss": 0.1254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10817860811948776, |
| "step": 4180, |
| "valid_targets_mean": 2399.8, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 6.6746411483253585, |
| "grad_norm": 0.592325682164998, |
| "learning_rate": 2.6524729986016293e-07, |
| "loss": 0.1613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13545538485050201, |
| "step": 4185, |
| "valid_targets_mean": 3311.6, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 6.682615629984051, |
| "grad_norm": 0.673758679985898, |
| "learning_rate": 2.524931612733328e-07, |
| "loss": 0.1335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13675081729888916, |
| "step": 4190, |
| "valid_targets_mean": 2591.3, |
| "valid_targets_min": 1481 |
| }, |
| { |
| "epoch": 6.690590111642743, |
| "grad_norm": 0.6966576529900051, |
| "learning_rate": 2.400513121009529e-07, |
| "loss": 0.1458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1509852409362793, |
| "step": 4195, |
| "valid_targets_mean": 2215.1, |
| "valid_targets_min": 1370 |
| }, |
| { |
| "epoch": 6.698564593301436, |
| "grad_norm": 0.6478122100991643, |
| "learning_rate": 2.279219490998985e-07, |
| "loss": 0.1378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1596289575099945, |
| "step": 4200, |
| "valid_targets_mean": 2952.1, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 6.706539074960127, |
| "grad_norm": 0.6952489954446537, |
| "learning_rate": 2.161052640853578e-07, |
| "loss": 0.1526, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15504632890224457, |
| "step": 4205, |
| "valid_targets_mean": 3227.2, |
| "valid_targets_min": 1237 |
| }, |
| { |
| "epoch": 6.71451355661882, |
| "grad_norm": 0.6514941213275741, |
| "learning_rate": 2.0460144392778768e-07, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10687048733234406, |
| "step": 4210, |
| "valid_targets_mean": 2079.6, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 6.722488038277512, |
| "grad_norm": 0.6063876513438099, |
| "learning_rate": 1.9341067054996277e-07, |
| "loss": 0.1388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13883773982524872, |
| "step": 4215, |
| "valid_targets_mean": 2910.4, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 6.7304625199362045, |
| "grad_norm": 0.6791687773478821, |
| "learning_rate": 1.8253312092409992e-07, |
| "loss": 0.1434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15515685081481934, |
| "step": 4220, |
| "valid_targets_mean": 3073.0, |
| "valid_targets_min": 1273 |
| }, |
| { |
| "epoch": 6.738437001594896, |
| "grad_norm": 0.6218041337473685, |
| "learning_rate": 1.7196896706906273e-07, |
| "loss": 0.1353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11648586392402649, |
| "step": 4225, |
| "valid_targets_mean": 2936.0, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 6.746411483253588, |
| "grad_norm": 0.6617392762256765, |
| "learning_rate": 1.6171837604762597e-07, |
| "loss": 0.138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16125863790512085, |
| "step": 4230, |
| "valid_targets_mean": 3518.8, |
| "valid_targets_min": 1593 |
| }, |
| { |
| "epoch": 6.754385964912281, |
| "grad_norm": 0.6784609926009033, |
| "learning_rate": 1.5178150996385755e-07, |
| "loss": 0.1372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12986430525779724, |
| "step": 4235, |
| "valid_targets_mean": 2628.8, |
| "valid_targets_min": 1094 |
| }, |
| { |
| "epoch": 6.762360446570973, |
| "grad_norm": 0.696201617201948, |
| "learning_rate": 1.421585259605318e-07, |
| "loss": 0.128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11709525436162949, |
| "step": 4240, |
| "valid_targets_mean": 1826.1, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 6.770334928229665, |
| "grad_norm": 0.6367805811916879, |
| "learning_rate": 1.3284957621666039e-07, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11604160070419312, |
| "step": 4245, |
| "valid_targets_mean": 2452.1, |
| "valid_targets_min": 1352 |
| }, |
| { |
| "epoch": 6.778309409888357, |
| "grad_norm": 0.6346156166777578, |
| "learning_rate": 1.2385480794507853e-07, |
| "loss": 0.1226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1615995466709137, |
| "step": 4250, |
| "valid_targets_mean": 2704.9, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 6.78628389154705, |
| "grad_norm": 0.6614819884519686, |
| "learning_rate": 1.1517436339011589e-07, |
| "loss": 0.1269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1173841580748558, |
| "step": 4255, |
| "valid_targets_mean": 2531.2, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 6.794258373205742, |
| "grad_norm": 0.5967106394852402, |
| "learning_rate": 1.0680837982535607e-07, |
| "loss": 0.1448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10654541105031967, |
| "step": 4260, |
| "valid_targets_mean": 2876.8, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 6.8022328548644335, |
| "grad_norm": 0.6070899574042022, |
| "learning_rate": 9.875698955145174e-08, |
| "loss": 0.1476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14284199476242065, |
| "step": 4265, |
| "valid_targets_mean": 3178.1, |
| "valid_targets_min": 1513 |
| }, |
| { |
| "epoch": 6.810207336523126, |
| "grad_norm": 0.6780997054136256, |
| "learning_rate": 9.102031989404403e-08, |
| "loss": 0.141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16974301636219025, |
| "step": 4270, |
| "valid_targets_mean": 2744.4, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 6.818181818181818, |
| "grad_norm": 0.6754612475098248, |
| "learning_rate": 8.359849320174196e-08, |
| "loss": 0.1384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14120808243751526, |
| "step": 4275, |
| "valid_targets_mean": 2615.7, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 6.826156299840511, |
| "grad_norm": 0.693794580517889, |
| "learning_rate": 7.649162684419731e-08, |
| "loss": 0.1353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12366122752428055, |
| "step": 4280, |
| "valid_targets_mean": 2165.4, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 6.834130781499202, |
| "grad_norm": 0.6818500018106061, |
| "learning_rate": 6.969983321023499e-08, |
| "loss": 0.1479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14141970872879028, |
| "step": 4285, |
| "valid_targets_mean": 2466.6, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 6.842105263157895, |
| "grad_norm": 0.5987656732671883, |
| "learning_rate": 6.322321970608337e-08, |
| "loss": 0.1343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16968190670013428, |
| "step": 4290, |
| "valid_targets_mean": 3152.5, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 6.850079744816587, |
| "grad_norm": 0.6439966316378877, |
| "learning_rate": 5.7061888753677796e-08, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14066863059997559, |
| "step": 4295, |
| "valid_targets_mean": 2770.7, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 6.858054226475279, |
| "grad_norm": 0.6544479541120145, |
| "learning_rate": 5.121593778903755e-08, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17600896954536438, |
| "step": 4300, |
| "valid_targets_mean": 3378.7, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 6.866028708133971, |
| "grad_norm": 0.5672287636141157, |
| "learning_rate": 4.5685459260722544e-08, |
| "loss": 0.1375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21883684396743774, |
| "step": 4305, |
| "valid_targets_mean": 4971.3, |
| "valid_targets_min": 975 |
| }, |
| { |
| "epoch": 6.8740031897926634, |
| "grad_norm": 0.6252371250774587, |
| "learning_rate": 4.047054062837452e-08, |
| "loss": 0.1559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13992947340011597, |
| "step": 4310, |
| "valid_targets_mean": 2978.4, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 6.881977671451356, |
| "grad_norm": 0.6625804873828336, |
| "learning_rate": 3.55712643613404e-08, |
| "loss": 0.1388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14451831579208374, |
| "step": 4315, |
| "valid_targets_mean": 2907.2, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 6.889952153110048, |
| "grad_norm": 0.9522650055323967, |
| "learning_rate": 3.0987707937351066e-08, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21254639327526093, |
| "step": 4320, |
| "valid_targets_mean": 2916.5, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 6.89792663476874, |
| "grad_norm": 0.7728711461821048, |
| "learning_rate": 2.6719943841311268e-08, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15055662393569946, |
| "step": 4325, |
| "valid_targets_mean": 2948.6, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 6.905901116427432, |
| "grad_norm": 0.6584848163843601, |
| "learning_rate": 2.2768039564151635e-08, |
| "loss": 0.1317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13766586780548096, |
| "step": 4330, |
| "valid_targets_mean": 2726.1, |
| "valid_targets_min": 1372 |
| }, |
| { |
| "epoch": 6.913875598086125, |
| "grad_norm": 0.6431909009393747, |
| "learning_rate": 1.913205760175174e-08, |
| "loss": 0.146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15910640358924866, |
| "step": 4335, |
| "valid_targets_mean": 3045.4, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 6.921850079744816, |
| "grad_norm": 0.5604331917524619, |
| "learning_rate": 1.5812055453963136e-08, |
| "loss": 0.123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1279834806919098, |
| "step": 4340, |
| "valid_targets_mean": 3657.7, |
| "valid_targets_min": 1548 |
| }, |
| { |
| "epoch": 6.9298245614035086, |
| "grad_norm": 0.5809407923917316, |
| "learning_rate": 1.280808562369229e-08, |
| "loss": 0.1573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1330064982175827, |
| "step": 4345, |
| "valid_targets_mean": 3600.9, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 6.937799043062201, |
| "grad_norm": 0.621224573617775, |
| "learning_rate": 1.01201956160768e-08, |
| "loss": 0.1487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12491903454065323, |
| "step": 4350, |
| "valid_targets_mean": 2639.5, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 6.945773524720893, |
| "grad_norm": 0.8297368312305293, |
| "learning_rate": 7.74842793772601e-09, |
| "loss": 0.1758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3191789388656616, |
| "step": 4355, |
| "valid_targets_mean": 4091.2, |
| "valid_targets_min": 894 |
| }, |
| { |
| "epoch": 6.953748006379586, |
| "grad_norm": 0.5672862404897413, |
| "learning_rate": 5.692820096054874e-09, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16838830709457397, |
| "step": 4360, |
| "valid_targets_mean": 3874.2, |
| "valid_targets_min": 1136 |
| }, |
| { |
| "epoch": 6.961722488038277, |
| "grad_norm": 0.6673410547733448, |
| "learning_rate": 3.9534045986888706e-09, |
| "loss": 0.1445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1458224207162857, |
| "step": 4365, |
| "valid_targets_mean": 2595.8, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 6.96969696969697, |
| "grad_norm": 0.6454669130283491, |
| "learning_rate": 2.530208952953306e-09, |
| "loss": 0.135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1391116827726364, |
| "step": 4370, |
| "valid_targets_mean": 2461.1, |
| "valid_targets_min": 1391 |
| }, |
| { |
| "epoch": 6.977671451355662, |
| "grad_norm": 0.6808531645909409, |
| "learning_rate": 1.4232556654314445e-09, |
| "loss": 0.1572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16542094945907593, |
| "step": 4375, |
| "valid_targets_mean": 3267.7, |
| "valid_targets_min": 1393 |
| }, |
| { |
| "epoch": 6.985645933014354, |
| "grad_norm": 0.6848879103739742, |
| "learning_rate": 6.325622416136767e-10, |
| "loss": 0.1422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15867075324058533, |
| "step": 4380, |
| "valid_targets_mean": 2476.5, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 6.993620414673046, |
| "grad_norm": 0.6367183670875135, |
| "learning_rate": 1.581411856199644e-10, |
| "loss": 0.1396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10416804254055023, |
| "step": 4385, |
| "valid_targets_mean": 2126.0, |
| "valid_targets_min": 1296 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13487885892391205, |
| "step": 4389, |
| "total_flos": 841177935118336.0, |
| "train_loss": 0.10868970680736577, |
| "train_runtime": 11861.0153, |
| "train_samples_per_second": 5.919, |
| "train_steps_per_second": 0.37, |
| "valid_targets_mean": 2596.9, |
| "valid_targets_min": 1254 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4389, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 841177935118336.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|