| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4186, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.012626262626262626, |
| "grad_norm": 8.8502213152326, |
| "learning_rate": 5.755395683453238e-07, |
| "loss": 0.9749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 1.0252163410186768, |
| "step": 5, |
| "valid_targets_mean": 3810.4, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 0.025252525252525252, |
| "grad_norm": 7.0326382192271595, |
| "learning_rate": 1.2949640287769785e-06, |
| "loss": 0.97, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.8746949434280396, |
| "step": 10, |
| "valid_targets_mean": 4736.2, |
| "valid_targets_min": 1766 |
| }, |
| { |
| "epoch": 0.03787878787878788, |
| "grad_norm": 6.6940046336920975, |
| "learning_rate": 2.0143884892086333e-06, |
| "loss": 0.9064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.8456529378890991, |
| "step": 15, |
| "valid_targets_mean": 3504.3, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 0.050505050505050504, |
| "grad_norm": 7.365976748970077, |
| "learning_rate": 2.733812949640288e-06, |
| "loss": 0.8841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.9217684268951416, |
| "step": 20, |
| "valid_targets_mean": 2712.1, |
| "valid_targets_min": 1633 |
| }, |
| { |
| "epoch": 0.06313131313131314, |
| "grad_norm": 4.630647013342811, |
| "learning_rate": 3.453237410071943e-06, |
| "loss": 0.8408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7999893426895142, |
| "step": 25, |
| "valid_targets_mean": 2972.6, |
| "valid_targets_min": 1862 |
| }, |
| { |
| "epoch": 0.07575757575757576, |
| "grad_norm": 2.9138235176363723, |
| "learning_rate": 4.172661870503597e-06, |
| "loss": 0.7736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7608543634414673, |
| "step": 30, |
| "valid_targets_mean": 3347.9, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 0.08838383838383838, |
| "grad_norm": 1.7558069634979983, |
| "learning_rate": 4.892086330935253e-06, |
| "loss": 0.7821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.826799750328064, |
| "step": 35, |
| "valid_targets_mean": 4368.2, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 0.10101010101010101, |
| "grad_norm": 1.7134790575388017, |
| "learning_rate": 5.611510791366906e-06, |
| "loss": 0.7603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.8243893384933472, |
| "step": 40, |
| "valid_targets_mean": 3075.2, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 0.11363636363636363, |
| "grad_norm": 1.2388060565695977, |
| "learning_rate": 6.330935251798561e-06, |
| "loss": 0.6669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6428935527801514, |
| "step": 45, |
| "valid_targets_mean": 3558.9, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 0.12626262626262627, |
| "grad_norm": 1.0686895415900157, |
| "learning_rate": 7.050359712230216e-06, |
| "loss": 0.6699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6036921143531799, |
| "step": 50, |
| "valid_targets_mean": 2548.7, |
| "valid_targets_min": 1499 |
| }, |
| { |
| "epoch": 0.1388888888888889, |
| "grad_norm": 0.8408313638128855, |
| "learning_rate": 7.769784172661872e-06, |
| "loss": 0.6825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6488921642303467, |
| "step": 55, |
| "valid_targets_mean": 3712.4, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 0.15151515151515152, |
| "grad_norm": 0.8793404803472428, |
| "learning_rate": 8.489208633093526e-06, |
| "loss": 0.6406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5900353193283081, |
| "step": 60, |
| "valid_targets_mean": 2931.1, |
| "valid_targets_min": 1889 |
| }, |
| { |
| "epoch": 0.16414141414141414, |
| "grad_norm": 0.9233082070664455, |
| "learning_rate": 9.20863309352518e-06, |
| "loss": 0.6118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6843211650848389, |
| "step": 65, |
| "valid_targets_mean": 2688.2, |
| "valid_targets_min": 587 |
| }, |
| { |
| "epoch": 0.17676767676767677, |
| "grad_norm": 0.7695618266666612, |
| "learning_rate": 9.928057553956835e-06, |
| "loss": 0.5512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5856298208236694, |
| "step": 70, |
| "valid_targets_mean": 2935.6, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 0.1893939393939394, |
| "grad_norm": 0.7101539830507525, |
| "learning_rate": 1.0647482014388491e-05, |
| "loss": 0.5928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.602681577205658, |
| "step": 75, |
| "valid_targets_mean": 3589.7, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 0.20202020202020202, |
| "grad_norm": 0.6757736826618855, |
| "learning_rate": 1.1366906474820146e-05, |
| "loss": 0.5919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5044267177581787, |
| "step": 80, |
| "valid_targets_mean": 3180.0, |
| "valid_targets_min": 1420 |
| }, |
| { |
| "epoch": 0.21464646464646464, |
| "grad_norm": 0.7052512337384288, |
| "learning_rate": 1.20863309352518e-05, |
| "loss": 0.5713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.546467661857605, |
| "step": 85, |
| "valid_targets_mean": 2828.8, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 0.22727272727272727, |
| "grad_norm": 0.8245207595088883, |
| "learning_rate": 1.2805755395683454e-05, |
| "loss": 0.5641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.605029284954071, |
| "step": 90, |
| "valid_targets_mean": 2803.2, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 0.2398989898989899, |
| "grad_norm": 0.7141934894188182, |
| "learning_rate": 1.3525179856115109e-05, |
| "loss": 0.5706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5871100425720215, |
| "step": 95, |
| "valid_targets_mean": 3075.2, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 0.25252525252525254, |
| "grad_norm": 0.7508217175713096, |
| "learning_rate": 1.4244604316546765e-05, |
| "loss": 0.5615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5834653973579407, |
| "step": 100, |
| "valid_targets_mean": 3024.4, |
| "valid_targets_min": 1610 |
| }, |
| { |
| "epoch": 0.26515151515151514, |
| "grad_norm": 0.6869296589904229, |
| "learning_rate": 1.496402877697842e-05, |
| "loss": 0.5107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5773706436157227, |
| "step": 105, |
| "valid_targets_mean": 3346.2, |
| "valid_targets_min": 465 |
| }, |
| { |
| "epoch": 0.2777777777777778, |
| "grad_norm": 0.6649670199118626, |
| "learning_rate": 1.5683453237410072e-05, |
| "loss": 0.6192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5906274318695068, |
| "step": 110, |
| "valid_targets_mean": 4020.4, |
| "valid_targets_min": 1802 |
| }, |
| { |
| "epoch": 0.2904040404040404, |
| "grad_norm": 0.749817497328354, |
| "learning_rate": 1.640287769784173e-05, |
| "loss": 0.542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6468950510025024, |
| "step": 115, |
| "valid_targets_mean": 3753.2, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 0.30303030303030304, |
| "grad_norm": 0.6555186253660183, |
| "learning_rate": 1.7122302158273384e-05, |
| "loss": 0.5134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5901004076004028, |
| "step": 120, |
| "valid_targets_mean": 4881.6, |
| "valid_targets_min": 1494 |
| }, |
| { |
| "epoch": 0.31565656565656564, |
| "grad_norm": 0.7273014966297405, |
| "learning_rate": 1.784172661870504e-05, |
| "loss": 0.5702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5654794573783875, |
| "step": 125, |
| "valid_targets_mean": 3368.1, |
| "valid_targets_min": 1521 |
| }, |
| { |
| "epoch": 0.3282828282828283, |
| "grad_norm": 0.7586180547020986, |
| "learning_rate": 1.8561151079136693e-05, |
| "loss": 0.5293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41630545258522034, |
| "step": 130, |
| "valid_targets_mean": 3200.5, |
| "valid_targets_min": 1661 |
| }, |
| { |
| "epoch": 0.3409090909090909, |
| "grad_norm": 0.7688770234195088, |
| "learning_rate": 1.9280575539568347e-05, |
| "loss": 0.5299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5642590522766113, |
| "step": 135, |
| "valid_targets_mean": 3158.9, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 0.35353535353535354, |
| "grad_norm": 0.8258141160820167, |
| "learning_rate": 2e-05, |
| "loss": 0.4706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43767279386520386, |
| "step": 140, |
| "valid_targets_mean": 2534.0, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 0.3661616161616162, |
| "grad_norm": 0.6638208230368448, |
| "learning_rate": 2.0719424460431656e-05, |
| "loss": 0.5226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5216605067253113, |
| "step": 145, |
| "valid_targets_mean": 3478.1, |
| "valid_targets_min": 1455 |
| }, |
| { |
| "epoch": 0.3787878787878788, |
| "grad_norm": 0.6659508828600877, |
| "learning_rate": 2.143884892086331e-05, |
| "loss": 0.5054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46430742740631104, |
| "step": 150, |
| "valid_targets_mean": 3356.1, |
| "valid_targets_min": 1804 |
| }, |
| { |
| "epoch": 0.39141414141414144, |
| "grad_norm": 0.6857469917039041, |
| "learning_rate": 2.2158273381294965e-05, |
| "loss": 0.4803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46997326612472534, |
| "step": 155, |
| "valid_targets_mean": 3069.1, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 0.40404040404040403, |
| "grad_norm": 0.7497478551719995, |
| "learning_rate": 2.287769784172662e-05, |
| "loss": 0.5096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5357323884963989, |
| "step": 160, |
| "valid_targets_mean": 2978.5, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 0.4166666666666667, |
| "grad_norm": 0.6266767386519286, |
| "learning_rate": 2.3597122302158274e-05, |
| "loss": 0.4854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49465256929397583, |
| "step": 165, |
| "valid_targets_mean": 4385.0, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 0.4292929292929293, |
| "grad_norm": 0.7198305240954321, |
| "learning_rate": 2.431654676258993e-05, |
| "loss": 0.5133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4758256673812866, |
| "step": 170, |
| "valid_targets_mean": 3358.2, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 0.44191919191919193, |
| "grad_norm": 0.744564295446295, |
| "learning_rate": 2.5035971223021586e-05, |
| "loss": 0.4285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4645718038082123, |
| "step": 175, |
| "valid_targets_mean": 3257.9, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 0.45454545454545453, |
| "grad_norm": 0.741277701622229, |
| "learning_rate": 2.575539568345324e-05, |
| "loss": 0.4867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5038046836853027, |
| "step": 180, |
| "valid_targets_mean": 3023.1, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 0.4671717171717172, |
| "grad_norm": 0.7440421968116456, |
| "learning_rate": 2.6474820143884895e-05, |
| "loss": 0.5095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.570155918598175, |
| "step": 185, |
| "valid_targets_mean": 3422.4, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 0.4797979797979798, |
| "grad_norm": 0.8024642384967607, |
| "learning_rate": 2.719424460431655e-05, |
| "loss": 0.4493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5823109149932861, |
| "step": 190, |
| "valid_targets_mean": 2894.9, |
| "valid_targets_min": 1061 |
| }, |
| { |
| "epoch": 0.49242424242424243, |
| "grad_norm": 0.7498359662712905, |
| "learning_rate": 2.7913669064748203e-05, |
| "loss": 0.5014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5892109870910645, |
| "step": 195, |
| "valid_targets_mean": 3757.8, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 0.5050505050505051, |
| "grad_norm": 0.6969972771455335, |
| "learning_rate": 2.8633093525179858e-05, |
| "loss": 0.4966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4585283696651459, |
| "step": 200, |
| "valid_targets_mean": 3301.2, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 0.5176767676767676, |
| "grad_norm": 0.7428922534210859, |
| "learning_rate": 2.9352517985611512e-05, |
| "loss": 0.4873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35433435440063477, |
| "step": 205, |
| "valid_targets_mean": 2534.4, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 0.5303030303030303, |
| "grad_norm": 0.7952927627365796, |
| "learning_rate": 3.0071942446043167e-05, |
| "loss": 0.4483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3344321846961975, |
| "step": 210, |
| "valid_targets_mean": 2273.5, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 0.5429292929292929, |
| "grad_norm": 0.7452719253142043, |
| "learning_rate": 3.0791366906474824e-05, |
| "loss": 0.4887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4398002624511719, |
| "step": 215, |
| "valid_targets_mean": 2894.6, |
| "valid_targets_min": 1774 |
| }, |
| { |
| "epoch": 0.5555555555555556, |
| "grad_norm": 0.793089120317565, |
| "learning_rate": 3.1510791366906475e-05, |
| "loss": 0.4446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3552176058292389, |
| "step": 220, |
| "valid_targets_mean": 2370.2, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 0.5681818181818182, |
| "grad_norm": 0.6957948039355799, |
| "learning_rate": 3.223021582733813e-05, |
| "loss": 0.4677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4744777977466583, |
| "step": 225, |
| "valid_targets_mean": 3270.9, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 0.5808080808080808, |
| "grad_norm": 0.9598066573051235, |
| "learning_rate": 3.2949640287769784e-05, |
| "loss": 0.4678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.53702712059021, |
| "step": 230, |
| "valid_targets_mean": 3305.6, |
| "valid_targets_min": 1465 |
| }, |
| { |
| "epoch": 0.5934343434343434, |
| "grad_norm": 0.7385990473183633, |
| "learning_rate": 3.366906474820144e-05, |
| "loss": 0.4269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4913618564605713, |
| "step": 235, |
| "valid_targets_mean": 3022.6, |
| "valid_targets_min": 1359 |
| }, |
| { |
| "epoch": 0.6060606060606061, |
| "grad_norm": 0.8954334270151011, |
| "learning_rate": 3.438848920863309e-05, |
| "loss": 0.4773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4261593222618103, |
| "step": 240, |
| "valid_targets_mean": 3027.9, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 0.6186868686868687, |
| "grad_norm": 0.7460534615902407, |
| "learning_rate": 3.510791366906475e-05, |
| "loss": 0.4695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5014075040817261, |
| "step": 245, |
| "valid_targets_mean": 3182.8, |
| "valid_targets_min": 1704 |
| }, |
| { |
| "epoch": 0.6313131313131313, |
| "grad_norm": 0.7476045212031468, |
| "learning_rate": 3.582733812949641e-05, |
| "loss": 0.4897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5569243431091309, |
| "step": 250, |
| "valid_targets_mean": 4160.6, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 0.6439393939393939, |
| "grad_norm": 0.7290825841839375, |
| "learning_rate": 3.654676258992806e-05, |
| "loss": 0.5141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5026414394378662, |
| "step": 255, |
| "valid_targets_mean": 3161.4, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 0.6565656565656566, |
| "grad_norm": 0.7490321855827192, |
| "learning_rate": 3.726618705035972e-05, |
| "loss": 0.5036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46991053223609924, |
| "step": 260, |
| "valid_targets_mean": 2653.6, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 0.6691919191919192, |
| "grad_norm": 0.739603256968017, |
| "learning_rate": 3.798561151079137e-05, |
| "loss": 0.4898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4988292157649994, |
| "step": 265, |
| "valid_targets_mean": 3293.9, |
| "valid_targets_min": 1137 |
| }, |
| { |
| "epoch": 0.6818181818181818, |
| "grad_norm": 0.8025519110811695, |
| "learning_rate": 3.8705035971223026e-05, |
| "loss": 0.5011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5377944707870483, |
| "step": 270, |
| "valid_targets_mean": 3180.2, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 0.6944444444444444, |
| "grad_norm": 0.7900087471325877, |
| "learning_rate": 3.942446043165468e-05, |
| "loss": 0.4673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5039912462234497, |
| "step": 275, |
| "valid_targets_mean": 2830.6, |
| "valid_targets_min": 1799 |
| }, |
| { |
| "epoch": 0.7070707070707071, |
| "grad_norm": 0.7659391333417415, |
| "learning_rate": 3.999998413256274e-05, |
| "loss": 0.5003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4912080764770508, |
| "step": 280, |
| "valid_targets_mean": 3327.0, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 0.7196969696969697, |
| "grad_norm": 0.694845702448467, |
| "learning_rate": 3.9999428774902425e-05, |
| "loss": 0.4588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5030688643455505, |
| "step": 285, |
| "valid_targets_mean": 3079.2, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 0.7323232323232324, |
| "grad_norm": 0.7144245421458943, |
| "learning_rate": 3.999808007055667e-05, |
| "loss": 0.4796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5815045237541199, |
| "step": 290, |
| "valid_targets_mean": 4749.9, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 0.7449494949494949, |
| "grad_norm": 0.8137606805905706, |
| "learning_rate": 3.999593807302654e-05, |
| "loss": 0.4778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3889826536178589, |
| "step": 295, |
| "valid_targets_mean": 2409.6, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 0.7575757575757576, |
| "grad_norm": 0.7671755034689156, |
| "learning_rate": 3.999300286728176e-05, |
| "loss": 0.4424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40401798486709595, |
| "step": 300, |
| "valid_targets_mean": 2374.2, |
| "valid_targets_min": 412 |
| }, |
| { |
| "epoch": 0.7702020202020202, |
| "grad_norm": 0.775435011663138, |
| "learning_rate": 3.9989274569757467e-05, |
| "loss": 0.4529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5113080143928528, |
| "step": 305, |
| "valid_targets_mean": 3065.1, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 0.7828282828282829, |
| "grad_norm": 0.7829159491303057, |
| "learning_rate": 3.99847533283495e-05, |
| "loss": 0.4483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4134717285633087, |
| "step": 310, |
| "valid_targets_mean": 2551.4, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 0.7954545454545454, |
| "grad_norm": 0.70594805762661, |
| "learning_rate": 3.9979439322408575e-05, |
| "loss": 0.4722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5452604293823242, |
| "step": 315, |
| "valid_targets_mean": 4207.9, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 0.8080808080808081, |
| "grad_norm": 0.741059134063674, |
| "learning_rate": 3.9973332762733165e-05, |
| "loss": 0.4703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.523596465587616, |
| "step": 320, |
| "valid_targets_mean": 3050.4, |
| "valid_targets_min": 1682 |
| }, |
| { |
| "epoch": 0.8207070707070707, |
| "grad_norm": 0.646169301673137, |
| "learning_rate": 3.996643389156114e-05, |
| "loss": 0.4531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4629998803138733, |
| "step": 325, |
| "valid_targets_mean": 3761.1, |
| "valid_targets_min": 1341 |
| }, |
| { |
| "epoch": 0.8333333333333334, |
| "grad_norm": 0.7311851901523451, |
| "learning_rate": 3.995874298256014e-05, |
| "loss": 0.4769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49332910776138306, |
| "step": 330, |
| "valid_targets_mean": 3003.4, |
| "valid_targets_min": 1840 |
| }, |
| { |
| "epoch": 0.8459595959595959, |
| "grad_norm": 0.684697792793549, |
| "learning_rate": 3.9950260340816723e-05, |
| "loss": 0.4772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.476440966129303, |
| "step": 335, |
| "valid_targets_mean": 3521.4, |
| "valid_targets_min": 1763 |
| }, |
| { |
| "epoch": 0.8585858585858586, |
| "grad_norm": 0.7235672828868595, |
| "learning_rate": 3.9940986302824305e-05, |
| "loss": 0.4573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4808931350708008, |
| "step": 340, |
| "valid_targets_mean": 3157.8, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 0.8712121212121212, |
| "grad_norm": 0.618583293178677, |
| "learning_rate": 3.993092123646975e-05, |
| "loss": 0.4419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4222564101219177, |
| "step": 345, |
| "valid_targets_mean": 3462.4, |
| "valid_targets_min": 1697 |
| }, |
| { |
| "epoch": 0.8838383838383839, |
| "grad_norm": 0.9731914681849075, |
| "learning_rate": 3.992006554101881e-05, |
| "loss": 0.4431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4798777997493744, |
| "step": 350, |
| "valid_targets_mean": 2746.6, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 0.8964646464646465, |
| "grad_norm": 0.6711603679996875, |
| "learning_rate": 3.99084196471003e-05, |
| "loss": 0.4315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39052852988243103, |
| "step": 355, |
| "valid_targets_mean": 2697.2, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 0.9090909090909091, |
| "grad_norm": 0.6756824530106742, |
| "learning_rate": 3.9895984016688956e-05, |
| "loss": 0.4208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4884558618068695, |
| "step": 360, |
| "valid_targets_mean": 3316.8, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 0.9217171717171717, |
| "grad_norm": 0.6730754745335135, |
| "learning_rate": 3.9882759143087194e-05, |
| "loss": 0.4558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4529365003108978, |
| "step": 365, |
| "valid_targets_mean": 2792.6, |
| "valid_targets_min": 1934 |
| }, |
| { |
| "epoch": 0.9343434343434344, |
| "grad_norm": 0.7396239570533569, |
| "learning_rate": 3.9868745550905475e-05, |
| "loss": 0.4806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.48611992597579956, |
| "step": 370, |
| "valid_targets_mean": 3224.1, |
| "valid_targets_min": 1756 |
| }, |
| { |
| "epoch": 0.946969696969697, |
| "grad_norm": 0.5859949295622379, |
| "learning_rate": 3.985394379604152e-05, |
| "loss": 0.4543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4721411466598511, |
| "step": 375, |
| "valid_targets_mean": 4448.3, |
| "valid_targets_min": 1472 |
| }, |
| { |
| "epoch": 0.9595959595959596, |
| "grad_norm": 0.6661047355223618, |
| "learning_rate": 3.983835446565826e-05, |
| "loss": 0.4424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49498146772384644, |
| "step": 380, |
| "valid_targets_mean": 3239.3, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 0.9722222222222222, |
| "grad_norm": 0.5805898239548394, |
| "learning_rate": 3.982197817816054e-05, |
| "loss": 0.4422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38239431381225586, |
| "step": 385, |
| "valid_targets_mean": 3780.7, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 0.9848484848484849, |
| "grad_norm": 0.7798921127063227, |
| "learning_rate": 3.980481558317057e-05, |
| "loss": 0.4662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5424267053604126, |
| "step": 390, |
| "valid_targets_mean": 3867.1, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 0.9974747474747475, |
| "grad_norm": 0.6339986265381534, |
| "learning_rate": 3.978686736150221e-05, |
| "loss": 0.4535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47920912504196167, |
| "step": 395, |
| "valid_targets_mean": 3606.8, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 1.0101010101010102, |
| "grad_norm": 0.6706130776528586, |
| "learning_rate": 3.976813422513388e-05, |
| "loss": 0.437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4376629590988159, |
| "step": 400, |
| "valid_targets_mean": 3430.6, |
| "valid_targets_min": 1860 |
| }, |
| { |
| "epoch": 1.0227272727272727, |
| "grad_norm": 0.6708127261682855, |
| "learning_rate": 3.9748616917180406e-05, |
| "loss": 0.3809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3455820381641388, |
| "step": 405, |
| "valid_targets_mean": 2637.0, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 1.0353535353535352, |
| "grad_norm": 0.7742495725599213, |
| "learning_rate": 3.972831621186345e-05, |
| "loss": 0.417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3599938154220581, |
| "step": 410, |
| "valid_targets_mean": 2649.8, |
| "valid_targets_min": 1327 |
| }, |
| { |
| "epoch": 1.047979797979798, |
| "grad_norm": 0.6102251044562367, |
| "learning_rate": 3.970723291448092e-05, |
| "loss": 0.4354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.445651650428772, |
| "step": 415, |
| "valid_targets_mean": 4083.1, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 1.0606060606060606, |
| "grad_norm": 0.6976342123087943, |
| "learning_rate": 3.968536786137487e-05, |
| "loss": 0.4382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40597984194755554, |
| "step": 420, |
| "valid_targets_mean": 2881.2, |
| "valid_targets_min": 1527 |
| }, |
| { |
| "epoch": 1.0732323232323233, |
| "grad_norm": 0.8976764193372789, |
| "learning_rate": 3.966272191989847e-05, |
| "loss": 0.4593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5112510323524475, |
| "step": 425, |
| "valid_targets_mean": 3042.1, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 1.0858585858585859, |
| "grad_norm": 0.7365732301930217, |
| "learning_rate": 3.963929598838149e-05, |
| "loss": 0.4145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43491220474243164, |
| "step": 430, |
| "valid_targets_mean": 2794.9, |
| "valid_targets_min": 1679 |
| }, |
| { |
| "epoch": 1.0984848484848484, |
| "grad_norm": 0.6773959614029044, |
| "learning_rate": 3.9615090996094726e-05, |
| "loss": 0.4226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5162553787231445, |
| "step": 435, |
| "valid_targets_mean": 4462.0, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 1.1111111111111112, |
| "grad_norm": 0.5970043671496138, |
| "learning_rate": 3.959010790321313e-05, |
| "loss": 0.4334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33793818950653076, |
| "step": 440, |
| "valid_targets_mean": 3196.2, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 1.1237373737373737, |
| "grad_norm": 0.7763112041835692, |
| "learning_rate": 3.9564347700777705e-05, |
| "loss": 0.4279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4716646075248718, |
| "step": 445, |
| "valid_targets_mean": 2790.6, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 1.1363636363636362, |
| "grad_norm": 0.7191861233677, |
| "learning_rate": 3.953781141065619e-05, |
| "loss": 0.4571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4991220235824585, |
| "step": 450, |
| "valid_targets_mean": 2805.2, |
| "valid_targets_min": 1500 |
| }, |
| { |
| "epoch": 1.148989898989899, |
| "grad_norm": 0.6931761780564214, |
| "learning_rate": 3.9510500085502556e-05, |
| "loss": 0.403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3412482738494873, |
| "step": 455, |
| "valid_targets_mean": 2871.2, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 1.1616161616161615, |
| "grad_norm": 0.5776459149074374, |
| "learning_rate": 3.9482414808715194e-05, |
| "loss": 0.4203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4245602786540985, |
| "step": 460, |
| "valid_targets_mean": 4715.2, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 1.1742424242424243, |
| "grad_norm": 0.6555627012964024, |
| "learning_rate": 3.945355669439399e-05, |
| "loss": 0.4475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44374722242355347, |
| "step": 465, |
| "valid_targets_mean": 3508.2, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 1.1868686868686869, |
| "grad_norm": 1.2615252581904304, |
| "learning_rate": 3.9423926887296114e-05, |
| "loss": 0.4471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4283289909362793, |
| "step": 470, |
| "valid_targets_mean": 3297.8, |
| "valid_targets_min": 1445 |
| }, |
| { |
| "epoch": 1.1994949494949494, |
| "grad_norm": 0.7227367427497255, |
| "learning_rate": 3.939352656279059e-05, |
| "loss": 0.4105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4885120689868927, |
| "step": 475, |
| "valid_targets_mean": 3030.8, |
| "valid_targets_min": 1180 |
| }, |
| { |
| "epoch": 1.2121212121212122, |
| "grad_norm": 0.7171565868676774, |
| "learning_rate": 3.93623569268117e-05, |
| "loss": 0.4334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37661659717559814, |
| "step": 480, |
| "valid_targets_mean": 2516.6, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 1.2247474747474747, |
| "grad_norm": 0.6709298722578017, |
| "learning_rate": 3.933041921581113e-05, |
| "loss": 0.4524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4951278269290924, |
| "step": 485, |
| "valid_targets_mean": 3910.1, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 1.2373737373737375, |
| "grad_norm": 0.6284344251816701, |
| "learning_rate": 3.929771469670892e-05, |
| "loss": 0.4364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4901544451713562, |
| "step": 490, |
| "valid_targets_mean": 5372.7, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 1.25, |
| "grad_norm": 0.695150714261409, |
| "learning_rate": 3.926424466684321e-05, |
| "loss": 0.4036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3937031328678131, |
| "step": 495, |
| "valid_targets_mean": 2620.4, |
| "valid_targets_min": 1061 |
| }, |
| { |
| "epoch": 1.2626262626262625, |
| "grad_norm": 0.5659681496879514, |
| "learning_rate": 3.92300104539188e-05, |
| "loss": 0.4347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43232929706573486, |
| "step": 500, |
| "valid_targets_mean": 4517.9, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 1.2752525252525253, |
| "grad_norm": 0.6499437965902374, |
| "learning_rate": 3.919501341595442e-05, |
| "loss": 0.4463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4581197500228882, |
| "step": 505, |
| "valid_targets_mean": 3634.6, |
| "valid_targets_min": 1176 |
| }, |
| { |
| "epoch": 1.2878787878787878, |
| "grad_norm": 0.5715005441806082, |
| "learning_rate": 3.9159254941228944e-05, |
| "loss": 0.4015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3313661217689514, |
| "step": 510, |
| "valid_targets_mean": 3508.3, |
| "valid_targets_min": 1355 |
| }, |
| { |
| "epoch": 1.3005050505050506, |
| "grad_norm": 0.7308800974579575, |
| "learning_rate": 3.912273644822625e-05, |
| "loss": 0.4295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4216563105583191, |
| "step": 515, |
| "valid_targets_mean": 2695.7, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 1.3131313131313131, |
| "grad_norm": 0.6837093491179472, |
| "learning_rate": 3.9085459385578984e-05, |
| "loss": 0.3947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4423089027404785, |
| "step": 520, |
| "valid_targets_mean": 2883.6, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 1.3257575757575757, |
| "grad_norm": 0.6554872754713126, |
| "learning_rate": 3.9047425232011076e-05, |
| "loss": 0.3826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3657465875148773, |
| "step": 525, |
| "valid_targets_mean": 3170.8, |
| "valid_targets_min": 1136 |
| }, |
| { |
| "epoch": 1.3383838383838385, |
| "grad_norm": 0.6685453762625018, |
| "learning_rate": 3.900863549627911e-05, |
| "loss": 0.428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4607548713684082, |
| "step": 530, |
| "valid_targets_mean": 3880.3, |
| "valid_targets_min": 1232 |
| }, |
| { |
| "epoch": 1.351010101010101, |
| "grad_norm": 0.6443269502166363, |
| "learning_rate": 3.896909171711245e-05, |
| "loss": 0.4348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4501422941684723, |
| "step": 535, |
| "valid_targets_mean": 3417.6, |
| "valid_targets_min": 1573 |
| }, |
| { |
| "epoch": 1.3636363636363638, |
| "grad_norm": 0.6126406593256342, |
| "learning_rate": 3.8928795463152186e-05, |
| "loss": 0.3799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3543352782726288, |
| "step": 540, |
| "valid_targets_mean": 3163.1, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 1.3762626262626263, |
| "grad_norm": 0.6881727131350188, |
| "learning_rate": 3.888774833288898e-05, |
| "loss": 0.4257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4091816842556, |
| "step": 545, |
| "valid_targets_mean": 3140.7, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 1.3888888888888888, |
| "grad_norm": 0.6580723165353671, |
| "learning_rate": 3.8845951954599545e-05, |
| "loss": 0.3958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3906816244125366, |
| "step": 550, |
| "valid_targets_mean": 2895.7, |
| "valid_targets_min": 1240 |
| }, |
| { |
| "epoch": 1.4015151515151514, |
| "grad_norm": 0.6770136577009271, |
| "learning_rate": 3.8803407986282156e-05, |
| "loss": 0.4221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35806700587272644, |
| "step": 555, |
| "valid_targets_mean": 2287.6, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 1.4141414141414141, |
| "grad_norm": 0.6405715120436977, |
| "learning_rate": 3.876011811559084e-05, |
| "loss": 0.4279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4252093434333801, |
| "step": 560, |
| "valid_targets_mean": 3118.0, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 1.4267676767676767, |
| "grad_norm": 0.6944966556141179, |
| "learning_rate": 3.871608405976838e-05, |
| "loss": 0.4115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42029836773872375, |
| "step": 565, |
| "valid_targets_mean": 2919.8, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 1.4393939393939394, |
| "grad_norm": 0.6466971885955511, |
| "learning_rate": 3.867130756557832e-05, |
| "loss": 0.4312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3371127247810364, |
| "step": 570, |
| "valid_targets_mean": 2752.6, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 1.452020202020202, |
| "grad_norm": 0.6100566892783015, |
| "learning_rate": 3.862579040923552e-05, |
| "loss": 0.3838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3892483115196228, |
| "step": 575, |
| "valid_targets_mean": 3388.8, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 1.4646464646464645, |
| "grad_norm": 0.6600534442172271, |
| "learning_rate": 3.8579534396335835e-05, |
| "loss": 0.412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46965640783309937, |
| "step": 580, |
| "valid_targets_mean": 3274.4, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 1.4772727272727273, |
| "grad_norm": 0.6946470349793337, |
| "learning_rate": 3.853254136178437e-05, |
| "loss": 0.4195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4128877818584442, |
| "step": 585, |
| "valid_targets_mean": 2874.7, |
| "valid_targets_min": 1690 |
| }, |
| { |
| "epoch": 1.4898989898989898, |
| "grad_norm": 0.658007836439284, |
| "learning_rate": 3.8484813169722794e-05, |
| "loss": 0.4202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4265574812889099, |
| "step": 590, |
| "valid_targets_mean": 2866.8, |
| "valid_targets_min": 1791 |
| }, |
| { |
| "epoch": 1.5025252525252526, |
| "grad_norm": 0.7613954671864829, |
| "learning_rate": 3.843635171345532e-05, |
| "loss": 0.4369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44407981634140015, |
| "step": 595, |
| "valid_targets_mean": 3021.1, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 1.5151515151515151, |
| "grad_norm": 0.7625903826308273, |
| "learning_rate": 3.838715891537365e-05, |
| "loss": 0.3805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34579938650131226, |
| "step": 600, |
| "valid_targets_mean": 2343.3, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 1.5277777777777777, |
| "grad_norm": 0.6482084611263487, |
| "learning_rate": 3.8337236726880674e-05, |
| "loss": 0.441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41672322154045105, |
| "step": 605, |
| "valid_targets_mean": 2920.0, |
| "valid_targets_min": 1776 |
| }, |
| { |
| "epoch": 1.5404040404040404, |
| "grad_norm": 0.6065329237085881, |
| "learning_rate": 3.828658712831311e-05, |
| "loss": 0.398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3971773386001587, |
| "step": 610, |
| "valid_targets_mean": 3118.1, |
| "valid_targets_min": 1473 |
| }, |
| { |
| "epoch": 1.553030303030303, |
| "grad_norm": 0.6544115401255524, |
| "learning_rate": 3.823521212886287e-05, |
| "loss": 0.441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45314595103263855, |
| "step": 615, |
| "valid_targets_mean": 3466.2, |
| "valid_targets_min": 377 |
| }, |
| { |
| "epoch": 1.5656565656565657, |
| "grad_norm": 0.7218840612228915, |
| "learning_rate": 3.818311376649746e-05, |
| "loss": 0.3962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40665388107299805, |
| "step": 620, |
| "valid_targets_mean": 3132.6, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 1.5782828282828283, |
| "grad_norm": 0.6457705553977882, |
| "learning_rate": 3.813029410787906e-05, |
| "loss": 0.4014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4007648229598999, |
| "step": 625, |
| "valid_targets_mean": 3385.1, |
| "valid_targets_min": 1276 |
| }, |
| { |
| "epoch": 1.5909090909090908, |
| "grad_norm": 0.6340707674027326, |
| "learning_rate": 3.807675524828255e-05, |
| "loss": 0.3921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3663696050643921, |
| "step": 630, |
| "valid_targets_mean": 2994.5, |
| "valid_targets_min": 1839 |
| }, |
| { |
| "epoch": 1.6035353535353534, |
| "grad_norm": 0.6510799288150312, |
| "learning_rate": 3.802249931151245e-05, |
| "loss": 0.4083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4528045356273651, |
| "step": 635, |
| "valid_targets_mean": 3057.3, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 1.6161616161616161, |
| "grad_norm": 0.7096957049322412, |
| "learning_rate": 3.7967528449818604e-05, |
| "loss": 0.4129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3862096667289734, |
| "step": 640, |
| "valid_targets_mean": 2390.7, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 1.628787878787879, |
| "grad_norm": 0.7345826232266963, |
| "learning_rate": 3.791184484381083e-05, |
| "loss": 0.433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3896709382534027, |
| "step": 645, |
| "valid_targets_mean": 2601.5, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 1.6414141414141414, |
| "grad_norm": 0.6381339146897167, |
| "learning_rate": 3.7855450702372446e-05, |
| "loss": 0.3921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42096877098083496, |
| "step": 650, |
| "valid_targets_mean": 2983.1, |
| "valid_targets_min": 1513 |
| }, |
| { |
| "epoch": 1.654040404040404, |
| "grad_norm": 0.7088141347121194, |
| "learning_rate": 3.7798348262572595e-05, |
| "loss": 0.4184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38489383459091187, |
| "step": 655, |
| "valid_targets_mean": 2589.2, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.6158104461556841, |
| "learning_rate": 3.774053978957754e-05, |
| "loss": 0.422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33309605717658997, |
| "step": 660, |
| "valid_targets_mean": 2628.7, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 1.6792929292929293, |
| "grad_norm": 0.6621621785950462, |
| "learning_rate": 3.76820275765608e-05, |
| "loss": 0.4482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3812219202518463, |
| "step": 665, |
| "valid_targets_mean": 2696.2, |
| "valid_targets_min": 1315 |
| }, |
| { |
| "epoch": 1.691919191919192, |
| "grad_norm": 0.5915638746228544, |
| "learning_rate": 3.7622813944612184e-05, |
| "loss": 0.4268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45549070835113525, |
| "step": 670, |
| "valid_targets_mean": 4037.2, |
| "valid_targets_min": 1593 |
| }, |
| { |
| "epoch": 1.7045454545454546, |
| "grad_norm": 0.6214323792581383, |
| "learning_rate": 3.75629012426457e-05, |
| "loss": 0.4049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30740225315093994, |
| "step": 675, |
| "valid_targets_mean": 2484.4, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 1.7171717171717171, |
| "grad_norm": 0.6181383119204046, |
| "learning_rate": 3.750229184730643e-05, |
| "loss": 0.4034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41900163888931274, |
| "step": 680, |
| "valid_targets_mean": 3214.8, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 1.7297979797979797, |
| "grad_norm": 0.7022543694921178, |
| "learning_rate": 3.744098816287616e-05, |
| "loss": 0.3934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3738209009170532, |
| "step": 685, |
| "valid_targets_mean": 2518.6, |
| "valid_targets_min": 1060 |
| }, |
| { |
| "epoch": 1.7424242424242424, |
| "grad_norm": 0.6444777112364757, |
| "learning_rate": 3.73789926211781e-05, |
| "loss": 0.4013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40667980909347534, |
| "step": 690, |
| "valid_targets_mean": 2943.8, |
| "valid_targets_min": 586 |
| }, |
| { |
| "epoch": 1.7550505050505052, |
| "grad_norm": 0.6456649483546918, |
| "learning_rate": 3.7316307681480364e-05, |
| "loss": 0.4464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5095163583755493, |
| "step": 695, |
| "valid_targets_mean": 3686.2, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 1.7676767676767677, |
| "grad_norm": 0.6312723135470779, |
| "learning_rate": 3.725293583039843e-05, |
| "loss": 0.4029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3778528869152069, |
| "step": 700, |
| "valid_targets_mean": 3107.6, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 1.7803030303030303, |
| "grad_norm": 0.6535661127784683, |
| "learning_rate": 3.71888795817965e-05, |
| "loss": 0.4127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47286659479141235, |
| "step": 705, |
| "valid_targets_mean": 4064.8, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 1.7929292929292928, |
| "grad_norm": 0.6896428501647339, |
| "learning_rate": 3.712414147668777e-05, |
| "loss": 0.4215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4112127423286438, |
| "step": 710, |
| "valid_targets_mean": 2654.4, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 1.8055555555555556, |
| "grad_norm": 0.5820441201531631, |
| "learning_rate": 3.7058724083133645e-05, |
| "loss": 0.4077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34681016206741333, |
| "step": 715, |
| "valid_targets_mean": 2884.4, |
| "valid_targets_min": 1351 |
| }, |
| { |
| "epoch": 1.8181818181818183, |
| "grad_norm": 0.6800591266970959, |
| "learning_rate": 3.6992629996141864e-05, |
| "loss": 0.4424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4916991591453552, |
| "step": 720, |
| "valid_targets_mean": 3417.7, |
| "valid_targets_min": 1329 |
| }, |
| { |
| "epoch": 1.8308080808080809, |
| "grad_norm": 0.6563197557373552, |
| "learning_rate": 3.692586183756354e-05, |
| "loss": 0.3807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3805094361305237, |
| "step": 725, |
| "valid_targets_mean": 2503.5, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 1.8434343434343434, |
| "grad_norm": 0.7047851378134344, |
| "learning_rate": 3.685842225598919e-05, |
| "loss": 0.4278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4543723464012146, |
| "step": 730, |
| "valid_targets_mean": 2930.4, |
| "valid_targets_min": 1798 |
| }, |
| { |
| "epoch": 1.856060606060606, |
| "grad_norm": 0.6499844550915188, |
| "learning_rate": 3.6790313926643664e-05, |
| "loss": 0.4119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3960087299346924, |
| "step": 735, |
| "valid_targets_mean": 2956.1, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 1.8686868686868687, |
| "grad_norm": 0.649385668021803, |
| "learning_rate": 3.6721539551279966e-05, |
| "loss": 0.4369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4332810640335083, |
| "step": 740, |
| "valid_targets_mean": 3076.4, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 1.8813131313131313, |
| "grad_norm": 0.7091254200389234, |
| "learning_rate": 3.665210185807217e-05, |
| "loss": 0.4388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44163447618484497, |
| "step": 745, |
| "valid_targets_mean": 3328.9, |
| "valid_targets_min": 1660 |
| }, |
| { |
| "epoch": 1.893939393939394, |
| "grad_norm": 0.5985641510783979, |
| "learning_rate": 3.658200360150713e-05, |
| "loss": 0.4091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37661778926849365, |
| "step": 750, |
| "valid_targets_mean": 3146.1, |
| "valid_targets_min": 1067 |
| }, |
| { |
| "epoch": 1.9065656565656566, |
| "grad_norm": 0.6268419140387759, |
| "learning_rate": 3.651124756227525e-05, |
| "loss": 0.401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4080426096916199, |
| "step": 755, |
| "valid_targets_mean": 3422.2, |
| "valid_targets_min": 1798 |
| }, |
| { |
| "epoch": 1.9191919191919191, |
| "grad_norm": 0.7426620476089505, |
| "learning_rate": 3.6439836547160144e-05, |
| "loss": 0.4044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38891446590423584, |
| "step": 760, |
| "valid_targets_mean": 3295.2, |
| "valid_targets_min": 1546 |
| }, |
| { |
| "epoch": 1.9318181818181817, |
| "grad_norm": 0.6671491506286603, |
| "learning_rate": 3.636777338892732e-05, |
| "loss": 0.4466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44117462635040283, |
| "step": 765, |
| "valid_targets_mean": 2958.4, |
| "valid_targets_min": 1837 |
| }, |
| { |
| "epoch": 1.9444444444444444, |
| "grad_norm": 0.6342292838426378, |
| "learning_rate": 3.629506094621183e-05, |
| "loss": 0.3886, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3897709250450134, |
| "step": 770, |
| "valid_targets_mean": 2692.6, |
| "valid_targets_min": 1547 |
| }, |
| { |
| "epoch": 1.9570707070707072, |
| "grad_norm": 0.621675970891514, |
| "learning_rate": 3.622170210340482e-05, |
| "loss": 0.4183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38866496086120605, |
| "step": 775, |
| "valid_targets_mean": 2999.8, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 1.9696969696969697, |
| "grad_norm": 0.5905010144602377, |
| "learning_rate": 3.614769977053914e-05, |
| "loss": 0.4291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3574790060520172, |
| "step": 780, |
| "valid_targets_mean": 3125.0, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 1.9823232323232323, |
| "grad_norm": 0.5836024549642513, |
| "learning_rate": 3.607305688317391e-05, |
| "loss": 0.4046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4132801294326782, |
| "step": 785, |
| "valid_targets_mean": 3194.9, |
| "valid_targets_min": 1242 |
| }, |
| { |
| "epoch": 1.9949494949494948, |
| "grad_norm": 0.7228511270619273, |
| "learning_rate": 3.5997776402278055e-05, |
| "loss": 0.3925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42261964082717896, |
| "step": 790, |
| "valid_targets_mean": 3067.1, |
| "valid_targets_min": 1603 |
| }, |
| { |
| "epoch": 2.007575757575758, |
| "grad_norm": 0.6700499879024988, |
| "learning_rate": 3.592186131411288e-05, |
| "loss": 0.376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3675363063812256, |
| "step": 795, |
| "valid_targets_mean": 2926.6, |
| "valid_targets_min": 1575 |
| }, |
| { |
| "epoch": 2.0202020202020203, |
| "grad_norm": 0.6733433964569425, |
| "learning_rate": 3.584531463011356e-05, |
| "loss": 0.3648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3609054982662201, |
| "step": 800, |
| "valid_targets_mean": 3172.1, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 2.032828282828283, |
| "grad_norm": 0.6042940030317498, |
| "learning_rate": 3.576813938676973e-05, |
| "loss": 0.3973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3894050121307373, |
| "step": 805, |
| "valid_targets_mean": 3448.1, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 2.0454545454545454, |
| "grad_norm": 0.6749197830689422, |
| "learning_rate": 3.569033864550501e-05, |
| "loss": 0.38, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3814485967159271, |
| "step": 810, |
| "valid_targets_mean": 2783.8, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 2.058080808080808, |
| "grad_norm": 0.6483067354879916, |
| "learning_rate": 3.561191549255555e-05, |
| "loss": 0.3565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3972342312335968, |
| "step": 815, |
| "valid_targets_mean": 3241.1, |
| "valid_targets_min": 1649 |
| }, |
| { |
| "epoch": 2.0707070707070705, |
| "grad_norm": 0.6353320580780115, |
| "learning_rate": 3.553287303884762e-05, |
| "loss": 0.3695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3591780662536621, |
| "step": 820, |
| "valid_targets_mean": 2904.1, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 2.0833333333333335, |
| "grad_norm": 0.6551388984986852, |
| "learning_rate": 3.545321441987422e-05, |
| "loss": 0.3704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29770687222480774, |
| "step": 825, |
| "valid_targets_mean": 2442.8, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 2.095959595959596, |
| "grad_norm": 0.6968910493636307, |
| "learning_rate": 3.5372942795570644e-05, |
| "loss": 0.358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3901800215244293, |
| "step": 830, |
| "valid_targets_mean": 2854.0, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 2.1085858585858586, |
| "grad_norm": 0.568367502641086, |
| "learning_rate": 3.529206135018922e-05, |
| "loss": 0.3625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4262069761753082, |
| "step": 835, |
| "valid_targets_mean": 4330.8, |
| "valid_targets_min": 2021 |
| }, |
| { |
| "epoch": 2.121212121212121, |
| "grad_norm": 0.6824608784442717, |
| "learning_rate": 3.521057329217289e-05, |
| "loss": 0.3845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3504842519760132, |
| "step": 840, |
| "valid_targets_mean": 2486.9, |
| "valid_targets_min": 1574 |
| }, |
| { |
| "epoch": 2.1338383838383836, |
| "grad_norm": 0.6810643162239562, |
| "learning_rate": 3.512848185402804e-05, |
| "loss": 0.3885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42560821771621704, |
| "step": 845, |
| "valid_targets_mean": 3205.6, |
| "valid_targets_min": 1295 |
| }, |
| { |
| "epoch": 2.1464646464646466, |
| "grad_norm": 0.7051006217015395, |
| "learning_rate": 3.504579029219618e-05, |
| "loss": 0.385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47030025720596313, |
| "step": 850, |
| "valid_targets_mean": 4252.9, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 2.159090909090909, |
| "grad_norm": 0.6158184161250323, |
| "learning_rate": 3.4962501886924817e-05, |
| "loss": 0.3643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3438853621482849, |
| "step": 855, |
| "valid_targets_mean": 3000.1, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 2.1717171717171717, |
| "grad_norm": 0.9033510849058328, |
| "learning_rate": 3.4878619942137346e-05, |
| "loss": 0.3566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36623990535736084, |
| "step": 860, |
| "valid_targets_mean": 3486.9, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 2.1843434343434343, |
| "grad_norm": 0.6336084994385605, |
| "learning_rate": 3.479414778530194e-05, |
| "loss": 0.3553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3282182812690735, |
| "step": 865, |
| "valid_targets_mean": 2926.6, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 2.196969696969697, |
| "grad_norm": 0.642030989385258, |
| "learning_rate": 3.470908876729958e-05, |
| "loss": 0.3757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38485634326934814, |
| "step": 870, |
| "valid_targets_mean": 3797.9, |
| "valid_targets_min": 1802 |
| }, |
| { |
| "epoch": 2.20959595959596, |
| "grad_norm": 0.6859750653264282, |
| "learning_rate": 3.462344626229113e-05, |
| "loss": 0.3831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4057656526565552, |
| "step": 875, |
| "valid_targets_mean": 3077.2, |
| "valid_targets_min": 1477 |
| }, |
| { |
| "epoch": 2.2222222222222223, |
| "grad_norm": 0.7051975354184825, |
| "learning_rate": 3.4537223667583517e-05, |
| "loss": 0.3941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3670094311237335, |
| "step": 880, |
| "valid_targets_mean": 2480.9, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 2.234848484848485, |
| "grad_norm": 0.6263495715036997, |
| "learning_rate": 3.44504244034949e-05, |
| "loss": 0.3744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38415664434432983, |
| "step": 885, |
| "valid_targets_mean": 3738.8, |
| "valid_targets_min": 1905 |
| }, |
| { |
| "epoch": 2.2474747474747474, |
| "grad_norm": 0.6736583840874508, |
| "learning_rate": 3.4363051913219054e-05, |
| "loss": 0.3787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32438012957572937, |
| "step": 890, |
| "valid_targets_mean": 2544.9, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 2.26010101010101, |
| "grad_norm": 0.6358475233857454, |
| "learning_rate": 3.427510966268874e-05, |
| "loss": 0.4206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38413217663764954, |
| "step": 895, |
| "valid_targets_mean": 3256.4, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 2.2727272727272725, |
| "grad_norm": 0.5703544012357852, |
| "learning_rate": 3.418660114043824e-05, |
| "loss": 0.3628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34161847829818726, |
| "step": 900, |
| "valid_targets_mean": 3436.0, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 2.2853535353535355, |
| "grad_norm": 0.6756271018463891, |
| "learning_rate": 3.409752985746498e-05, |
| "loss": 0.3907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39379531145095825, |
| "step": 905, |
| "valid_targets_mean": 3228.2, |
| "valid_targets_min": 1693 |
| }, |
| { |
| "epoch": 2.297979797979798, |
| "grad_norm": 0.5750798297997253, |
| "learning_rate": 3.400789934709023e-05, |
| "loss": 0.4308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4697551727294922, |
| "step": 910, |
| "valid_targets_mean": 4887.2, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 2.3106060606060606, |
| "grad_norm": 0.6035695330159876, |
| "learning_rate": 3.391771316481895e-05, |
| "loss": 0.386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37602925300598145, |
| "step": 915, |
| "valid_targets_mean": 3335.6, |
| "valid_targets_min": 1865 |
| }, |
| { |
| "epoch": 2.323232323232323, |
| "grad_norm": 0.6231533529555526, |
| "learning_rate": 3.3826974888198764e-05, |
| "loss": 0.3847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46126362681388855, |
| "step": 920, |
| "valid_targets_mean": 4108.6, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 2.3358585858585856, |
| "grad_norm": 0.682022720271219, |
| "learning_rate": 3.373568811667802e-05, |
| "loss": 0.3822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39595192670822144, |
| "step": 925, |
| "valid_targets_mean": 2894.8, |
| "valid_targets_min": 1426 |
| }, |
| { |
| "epoch": 2.3484848484848486, |
| "grad_norm": 0.6797289333546708, |
| "learning_rate": 3.3643856471463036e-05, |
| "loss": 0.3785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38361161947250366, |
| "step": 930, |
| "valid_targets_mean": 3060.6, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 2.361111111111111, |
| "grad_norm": 0.6031465467740685, |
| "learning_rate": 3.355148359537441e-05, |
| "loss": 0.3961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44060710072517395, |
| "step": 935, |
| "valid_targets_mean": 4271.9, |
| "valid_targets_min": 1417 |
| }, |
| { |
| "epoch": 2.3737373737373737, |
| "grad_norm": 0.8364843828650894, |
| "learning_rate": 3.3458573152702556e-05, |
| "loss": 0.3854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36398792266845703, |
| "step": 940, |
| "valid_targets_mean": 2913.2, |
| "valid_targets_min": 1188 |
| }, |
| { |
| "epoch": 2.3863636363636362, |
| "grad_norm": 0.5980417429474294, |
| "learning_rate": 3.336512882906234e-05, |
| "loss": 0.3636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.307436466217041, |
| "step": 945, |
| "valid_targets_mean": 2891.1, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 2.398989898989899, |
| "grad_norm": 0.6020944292492557, |
| "learning_rate": 3.3271154331246825e-05, |
| "loss": 0.3548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3505295515060425, |
| "step": 950, |
| "valid_targets_mean": 4080.4, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 2.4116161616161618, |
| "grad_norm": 0.6948551306615971, |
| "learning_rate": 3.317665338708033e-05, |
| "loss": 0.3449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38028645515441895, |
| "step": 955, |
| "valid_targets_mean": 3400.9, |
| "valid_targets_min": 452 |
| }, |
| { |
| "epoch": 2.4242424242424243, |
| "grad_norm": 0.7054147906410959, |
| "learning_rate": 3.308162974527045e-05, |
| "loss": 0.3478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3440144658088684, |
| "step": 960, |
| "valid_targets_mean": 2568.9, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 2.436868686868687, |
| "grad_norm": 0.6502674537729093, |
| "learning_rate": 3.298608717525941e-05, |
| "loss": 0.3966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4167352616786957, |
| "step": 965, |
| "valid_targets_mean": 3487.2, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 2.4494949494949494, |
| "grad_norm": 0.6945755822435844, |
| "learning_rate": 3.289002946707452e-05, |
| "loss": 0.3618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38510334491729736, |
| "step": 970, |
| "valid_targets_mean": 3070.3, |
| "valid_targets_min": 1615 |
| }, |
| { |
| "epoch": 2.462121212121212, |
| "grad_norm": 0.7008172093994913, |
| "learning_rate": 3.2793460431177827e-05, |
| "loss": 0.3892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34910762310028076, |
| "step": 975, |
| "valid_targets_mean": 2654.6, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 2.474747474747475, |
| "grad_norm": 0.6315928723707651, |
| "learning_rate": 3.269638389831498e-05, |
| "loss": 0.3683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2948976755142212, |
| "step": 980, |
| "valid_targets_mean": 2513.4, |
| "valid_targets_min": 1048 |
| }, |
| { |
| "epoch": 2.4873737373737375, |
| "grad_norm": 0.659399817304144, |
| "learning_rate": 3.2598803719363234e-05, |
| "loss": 0.3995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3890318274497986, |
| "step": 985, |
| "valid_targets_mean": 2942.6, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 2.5, |
| "grad_norm": 0.6602751081844956, |
| "learning_rate": 3.250072376517873e-05, |
| "loss": 0.39, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31299781799316406, |
| "step": 990, |
| "valid_targets_mean": 2744.5, |
| "valid_targets_min": 1621 |
| }, |
| { |
| "epoch": 2.5126262626262625, |
| "grad_norm": 0.5849536829497557, |
| "learning_rate": 3.240214792644291e-05, |
| "loss": 0.3908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4854844808578491, |
| "step": 995, |
| "valid_targets_mean": 4775.6, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 2.525252525252525, |
| "grad_norm": 0.5606732760702411, |
| "learning_rate": 3.2303080113508206e-05, |
| "loss": 0.3851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3052321672439575, |
| "step": 1000, |
| "valid_targets_mean": 3365.4, |
| "valid_targets_min": 1298 |
| }, |
| { |
| "epoch": 2.537878787878788, |
| "grad_norm": 0.6875908835706088, |
| "learning_rate": 3.220352425624292e-05, |
| "loss": 0.382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3734514117240906, |
| "step": 1005, |
| "valid_targets_mean": 2893.5, |
| "valid_targets_min": 1773 |
| }, |
| { |
| "epoch": 2.5505050505050506, |
| "grad_norm": 0.5931935199736621, |
| "learning_rate": 3.210348430387531e-05, |
| "loss": 0.404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3862113058567047, |
| "step": 1010, |
| "valid_targets_mean": 3470.7, |
| "valid_targets_min": 2311 |
| }, |
| { |
| "epoch": 2.563131313131313, |
| "grad_norm": 0.5854966748703261, |
| "learning_rate": 3.200296422483694e-05, |
| "loss": 0.3898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3955685496330261, |
| "step": 1015, |
| "valid_targets_mean": 3589.4, |
| "valid_targets_min": 1829 |
| }, |
| { |
| "epoch": 2.5757575757575757, |
| "grad_norm": 0.6466992426589206, |
| "learning_rate": 3.19019680066053e-05, |
| "loss": 0.3517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3543087840080261, |
| "step": 1020, |
| "valid_targets_mean": 2809.2, |
| "valid_targets_min": 1982 |
| }, |
| { |
| "epoch": 2.5883838383838382, |
| "grad_norm": 0.6437875698154034, |
| "learning_rate": 3.180049965554554e-05, |
| "loss": 0.4091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5216984748840332, |
| "step": 1025, |
| "valid_targets_mean": 4236.3, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 2.601010101010101, |
| "grad_norm": 0.6686276392769377, |
| "learning_rate": 3.169856319675163e-05, |
| "loss": 0.3711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4543102979660034, |
| "step": 1030, |
| "valid_targets_mean": 3561.1, |
| "valid_targets_min": 520 |
| }, |
| { |
| "epoch": 2.6136363636363638, |
| "grad_norm": 0.5951534964453324, |
| "learning_rate": 3.159616267388665e-05, |
| "loss": 0.3683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3885546326637268, |
| "step": 1035, |
| "valid_targets_mean": 3710.8, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 2.6262626262626263, |
| "grad_norm": 0.5998214906422664, |
| "learning_rate": 3.1493302149022394e-05, |
| "loss": 0.3643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3495018482208252, |
| "step": 1040, |
| "valid_targets_mean": 3388.9, |
| "valid_targets_min": 1017 |
| }, |
| { |
| "epoch": 2.638888888888889, |
| "grad_norm": 0.679459404989866, |
| "learning_rate": 3.1389985702478204e-05, |
| "loss": 0.3733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40621423721313477, |
| "step": 1045, |
| "valid_targets_mean": 2743.4, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 2.6515151515151514, |
| "grad_norm": 0.49821839728054024, |
| "learning_rate": 3.1286217432659176e-05, |
| "loss": 0.3848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42677822709083557, |
| "step": 1050, |
| "valid_targets_mean": 5945.1, |
| "valid_targets_min": 1605 |
| }, |
| { |
| "epoch": 2.6641414141414144, |
| "grad_norm": 0.6245151459734792, |
| "learning_rate": 3.118200145589351e-05, |
| "loss": 0.4174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3920952081680298, |
| "step": 1055, |
| "valid_targets_mean": 3122.9, |
| "valid_targets_min": 1889 |
| }, |
| { |
| "epoch": 2.676767676767677, |
| "grad_norm": 0.6230627615382611, |
| "learning_rate": 3.1077341906269275e-05, |
| "loss": 0.3746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4046259820461273, |
| "step": 1060, |
| "valid_targets_mean": 3375.1, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 2.6893939393939394, |
| "grad_norm": 0.5984044868920384, |
| "learning_rate": 3.097224293547039e-05, |
| "loss": 0.3761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37177756428718567, |
| "step": 1065, |
| "valid_targets_mean": 3157.3, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 2.702020202020202, |
| "grad_norm": 0.6200698875715712, |
| "learning_rate": 3.086670871261193e-05, |
| "loss": 0.3824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4072413146495819, |
| "step": 1070, |
| "valid_targets_mean": 3493.7, |
| "valid_targets_min": 1659 |
| }, |
| { |
| "epoch": 2.7146464646464645, |
| "grad_norm": 0.7099464467086446, |
| "learning_rate": 3.076074342407476e-05, |
| "loss": 0.3903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3890324532985687, |
| "step": 1075, |
| "valid_targets_mean": 2398.0, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 2.7272727272727275, |
| "grad_norm": 0.5964382108688258, |
| "learning_rate": 3.0654351273339465e-05, |
| "loss": 0.3576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41678887605667114, |
| "step": 1080, |
| "valid_targets_mean": 4061.4, |
| "valid_targets_min": 587 |
| }, |
| { |
| "epoch": 2.73989898989899, |
| "grad_norm": 0.6483267090943723, |
| "learning_rate": 3.0547536480819584e-05, |
| "loss": 0.4063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38063323497772217, |
| "step": 1085, |
| "valid_targets_mean": 2821.2, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 2.7525252525252526, |
| "grad_norm": 0.6126539646079129, |
| "learning_rate": 3.044030328369422e-05, |
| "loss": 0.3809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3242890238761902, |
| "step": 1090, |
| "valid_targets_mean": 2823.2, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 2.765151515151515, |
| "grad_norm": 0.666211099047787, |
| "learning_rate": 3.033265593573994e-05, |
| "loss": 0.3988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35766348242759705, |
| "step": 1095, |
| "valid_targets_mean": 2767.8, |
| "valid_targets_min": 1512 |
| }, |
| { |
| "epoch": 2.7777777777777777, |
| "grad_norm": 0.5893274171238146, |
| "learning_rate": 3.0224598707162037e-05, |
| "loss": 0.3812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35240688920021057, |
| "step": 1100, |
| "valid_targets_mean": 3162.4, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 2.7904040404040407, |
| "grad_norm": 0.6436336249871378, |
| "learning_rate": 3.0116135884425156e-05, |
| "loss": 0.377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4571429193019867, |
| "step": 1105, |
| "valid_targets_mean": 3306.6, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 2.8030303030303028, |
| "grad_norm": 0.6192587115834132, |
| "learning_rate": 3.0007271770083216e-05, |
| "loss": 0.3935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2913767397403717, |
| "step": 1110, |
| "valid_targets_mean": 2528.9, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 2.8156565656565657, |
| "grad_norm": 0.606484213579456, |
| "learning_rate": 2.989801068260878e-05, |
| "loss": 0.3754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29592519998550415, |
| "step": 1115, |
| "valid_targets_mean": 2622.3, |
| "valid_targets_min": 1436 |
| }, |
| { |
| "epoch": 2.8282828282828283, |
| "grad_norm": 0.645202232373261, |
| "learning_rate": 2.9788356956221712e-05, |
| "loss": 0.3682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3493780195713043, |
| "step": 1120, |
| "valid_targets_mean": 2796.6, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 2.840909090909091, |
| "grad_norm": 0.6382732894080507, |
| "learning_rate": 2.9678314940717276e-05, |
| "loss": 0.3192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31767457723617554, |
| "step": 1125, |
| "valid_targets_mean": 2719.1, |
| "valid_targets_min": 1784 |
| }, |
| { |
| "epoch": 2.8535353535353534, |
| "grad_norm": 0.6864660560112232, |
| "learning_rate": 2.9567889001293553e-05, |
| "loss": 0.3885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3313673436641693, |
| "step": 1130, |
| "valid_targets_mean": 2460.8, |
| "valid_targets_min": 588 |
| }, |
| { |
| "epoch": 2.866161616161616, |
| "grad_norm": 0.6023940706764531, |
| "learning_rate": 2.94570835183783e-05, |
| "loss": 0.3516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34224456548690796, |
| "step": 1135, |
| "valid_targets_mean": 3116.4, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 2.878787878787879, |
| "grad_norm": 0.6067779962957488, |
| "learning_rate": 2.93459028874552e-05, |
| "loss": 0.3723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3636412024497986, |
| "step": 1140, |
| "valid_targets_mean": 3337.4, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 2.8914141414141414, |
| "grad_norm": 0.6092698495443272, |
| "learning_rate": 2.9234351518889465e-05, |
| "loss": 0.4067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4876616597175598, |
| "step": 1145, |
| "valid_targets_mean": 4359.3, |
| "valid_targets_min": 1940 |
| }, |
| { |
| "epoch": 2.904040404040404, |
| "grad_norm": 0.6240475836405307, |
| "learning_rate": 2.9122433837752906e-05, |
| "loss": 0.3557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31040680408477783, |
| "step": 1150, |
| "valid_targets_mean": 2761.3, |
| "valid_targets_min": 1568 |
| }, |
| { |
| "epoch": 2.9166666666666665, |
| "grad_norm": 0.5730069310790777, |
| "learning_rate": 2.9010154283648382e-05, |
| "loss": 0.403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3821036219596863, |
| "step": 1155, |
| "valid_targets_mean": 3784.9, |
| "valid_targets_min": 1335 |
| }, |
| { |
| "epoch": 2.929292929292929, |
| "grad_norm": 0.6572646648160343, |
| "learning_rate": 2.8897517310533733e-05, |
| "loss": 0.3557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3128521740436554, |
| "step": 1160, |
| "valid_targets_mean": 2357.7, |
| "valid_targets_min": 1131 |
| }, |
| { |
| "epoch": 2.941919191919192, |
| "grad_norm": 0.6115860029185797, |
| "learning_rate": 2.8784527386545006e-05, |
| "loss": 0.4476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49554532766342163, |
| "step": 1165, |
| "valid_targets_mean": 4678.3, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 2.9545454545454546, |
| "grad_norm": 0.6535005566432543, |
| "learning_rate": 2.8671188993819327e-05, |
| "loss": 0.4041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4300668239593506, |
| "step": 1170, |
| "valid_targets_mean": 3714.4, |
| "valid_targets_min": 2330 |
| }, |
| { |
| "epoch": 2.967171717171717, |
| "grad_norm": 0.6344464229430659, |
| "learning_rate": 2.8557506628317e-05, |
| "loss": 0.3867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4097946882247925, |
| "step": 1175, |
| "valid_targets_mean": 3480.2, |
| "valid_targets_min": 1844 |
| }, |
| { |
| "epoch": 2.9797979797979797, |
| "grad_norm": 0.5549040647946087, |
| "learning_rate": 2.844348479964323e-05, |
| "loss": 0.3997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36530980467796326, |
| "step": 1180, |
| "valid_targets_mean": 3680.7, |
| "valid_targets_min": 2068 |
| }, |
| { |
| "epoch": 2.992424242424242, |
| "grad_norm": 0.6350789264846295, |
| "learning_rate": 2.8329128030869183e-05, |
| "loss": 0.3765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36941784620285034, |
| "step": 1185, |
| "valid_targets_mean": 2964.5, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 3.005050505050505, |
| "grad_norm": 0.6101230464628173, |
| "learning_rate": 2.8214440858352602e-05, |
| "loss": 0.3585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3312152624130249, |
| "step": 1190, |
| "valid_targets_mean": 3049.0, |
| "valid_targets_min": 1661 |
| }, |
| { |
| "epoch": 3.0176767676767677, |
| "grad_norm": 0.6717050734051245, |
| "learning_rate": 2.8099427831557836e-05, |
| "loss": 0.344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3820994794368744, |
| "step": 1195, |
| "valid_targets_mean": 3147.5, |
| "valid_targets_min": 1505 |
| }, |
| { |
| "epoch": 3.0303030303030303, |
| "grad_norm": 0.6855402222878124, |
| "learning_rate": 2.798409351287537e-05, |
| "loss": 0.3489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3795431852340698, |
| "step": 1200, |
| "valid_targets_mean": 3020.4, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 3.042929292929293, |
| "grad_norm": 0.6290362160754815, |
| "learning_rate": 2.7868442477440845e-05, |
| "loss": 0.3716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3297278881072998, |
| "step": 1205, |
| "valid_targets_mean": 3352.2, |
| "valid_targets_min": 1870 |
| }, |
| { |
| "epoch": 3.0555555555555554, |
| "grad_norm": 0.6542985881986048, |
| "learning_rate": 2.7752479312953576e-05, |
| "loss": 0.3242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37977492809295654, |
| "step": 1210, |
| "valid_targets_mean": 3504.4, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 3.0681818181818183, |
| "grad_norm": 0.6865766533109904, |
| "learning_rate": 2.763620861949456e-05, |
| "loss": 0.3148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3136219382286072, |
| "step": 1215, |
| "valid_targets_mean": 2935.5, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 3.080808080808081, |
| "grad_norm": 0.650463581157268, |
| "learning_rate": 2.7519635009343982e-05, |
| "loss": 0.3616, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3669140934944153, |
| "step": 1220, |
| "valid_targets_mean": 3443.1, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 3.0934343434343434, |
| "grad_norm": 0.6374974160183221, |
| "learning_rate": 2.7402763106798295e-05, |
| "loss": 0.385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3267042636871338, |
| "step": 1225, |
| "valid_targets_mean": 3336.6, |
| "valid_targets_min": 1490 |
| }, |
| { |
| "epoch": 3.106060606060606, |
| "grad_norm": 0.7164459430574219, |
| "learning_rate": 2.7285597547986715e-05, |
| "loss": 0.3452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3801751732826233, |
| "step": 1230, |
| "valid_targets_mean": 3270.2, |
| "valid_targets_min": 1810 |
| }, |
| { |
| "epoch": 3.1186868686868685, |
| "grad_norm": 0.6786289930271091, |
| "learning_rate": 2.7168142980687394e-05, |
| "loss": 0.3578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.343783438205719, |
| "step": 1235, |
| "valid_targets_mean": 2905.7, |
| "valid_targets_min": 1686 |
| }, |
| { |
| "epoch": 3.1313131313131315, |
| "grad_norm": 0.8228076465104819, |
| "learning_rate": 2.7050404064142985e-05, |
| "loss": 0.3593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3551754355430603, |
| "step": 1240, |
| "valid_targets_mean": 3203.6, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 3.143939393939394, |
| "grad_norm": 0.7057452290840084, |
| "learning_rate": 2.693238546887583e-05, |
| "loss": 0.3613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38851505517959595, |
| "step": 1245, |
| "valid_targets_mean": 2690.1, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 3.1565656565656566, |
| "grad_norm": 0.6516753493509879, |
| "learning_rate": 2.6814091876502738e-05, |
| "loss": 0.3702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30876827239990234, |
| "step": 1250, |
| "valid_targets_mean": 2591.5, |
| "valid_targets_min": 1481 |
| }, |
| { |
| "epoch": 3.169191919191919, |
| "grad_norm": 0.5373908122046772, |
| "learning_rate": 2.669552797954917e-05, |
| "loss": 0.3621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4019007682800293, |
| "step": 1255, |
| "valid_targets_mean": 4778.8, |
| "valid_targets_min": 1761 |
| }, |
| { |
| "epoch": 3.1818181818181817, |
| "grad_norm": 0.656469897426696, |
| "learning_rate": 2.6576698481263216e-05, |
| "loss": 0.3694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3878747522830963, |
| "step": 1260, |
| "valid_targets_mean": 3612.4, |
| "valid_targets_min": 1553 |
| }, |
| { |
| "epoch": 3.1944444444444446, |
| "grad_norm": 0.6890638135835326, |
| "learning_rate": 2.6457608095428925e-05, |
| "loss": 0.3607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37581291794776917, |
| "step": 1265, |
| "valid_targets_mean": 3227.2, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 3.207070707070707, |
| "grad_norm": 0.6686732667303787, |
| "learning_rate": 2.633826154617938e-05, |
| "loss": 0.3687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32370471954345703, |
| "step": 1270, |
| "valid_targets_mean": 3021.6, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 3.2196969696969697, |
| "grad_norm": 0.60906879769235, |
| "learning_rate": 2.621866356780924e-05, |
| "loss": 0.333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2982814908027649, |
| "step": 1275, |
| "valid_targets_mean": 3329.8, |
| "valid_targets_min": 1659 |
| }, |
| { |
| "epoch": 3.2323232323232323, |
| "grad_norm": 0.6788697674939761, |
| "learning_rate": 2.6098818904587014e-05, |
| "loss": 0.362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3478686213493347, |
| "step": 1280, |
| "valid_targets_mean": 3108.2, |
| "valid_targets_min": 1337 |
| }, |
| { |
| "epoch": 3.244949494949495, |
| "grad_norm": 0.7418192989966806, |
| "learning_rate": 2.597873231056679e-05, |
| "loss": 0.342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3505740165710449, |
| "step": 1285, |
| "valid_targets_mean": 2378.4, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 3.257575757575758, |
| "grad_norm": 0.6743259771608354, |
| "learning_rate": 2.585840854939969e-05, |
| "loss": 0.3385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.337390661239624, |
| "step": 1290, |
| "valid_targets_mean": 2974.2, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 3.2702020202020203, |
| "grad_norm": 0.6553868057444038, |
| "learning_rate": 2.5737852394144903e-05, |
| "loss": 0.3231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3390675187110901, |
| "step": 1295, |
| "valid_targets_mean": 2955.1, |
| "valid_targets_min": 1599 |
| }, |
| { |
| "epoch": 3.282828282828283, |
| "grad_norm": 0.6403703744617418, |
| "learning_rate": 2.5617068627080305e-05, |
| "loss": 0.3688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4630083739757538, |
| "step": 1300, |
| "valid_targets_mean": 4076.2, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 3.2954545454545454, |
| "grad_norm": 0.6023984043375903, |
| "learning_rate": 2.5496062039512834e-05, |
| "loss": 0.348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32059431076049805, |
| "step": 1305, |
| "valid_targets_mean": 3375.9, |
| "valid_targets_min": 1878 |
| }, |
| { |
| "epoch": 3.308080808080808, |
| "grad_norm": 0.6396425541446585, |
| "learning_rate": 2.5374837431588322e-05, |
| "loss": 0.3341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3704610764980316, |
| "step": 1310, |
| "valid_targets_mean": 3331.3, |
| "valid_targets_min": 1406 |
| }, |
| { |
| "epoch": 3.320707070707071, |
| "grad_norm": 0.6776583962480702, |
| "learning_rate": 2.525339961210117e-05, |
| "loss": 0.356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2946220636367798, |
| "step": 1315, |
| "valid_targets_mean": 2489.2, |
| "valid_targets_min": 587 |
| }, |
| { |
| "epoch": 3.3333333333333335, |
| "grad_norm": 0.7512035560086019, |
| "learning_rate": 2.5131753398303546e-05, |
| "loss": 0.3612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3226706385612488, |
| "step": 1320, |
| "valid_targets_mean": 2257.8, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 3.345959595959596, |
| "grad_norm": 0.6691736317428321, |
| "learning_rate": 2.5009903615714288e-05, |
| "loss": 0.3713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38169464468955994, |
| "step": 1325, |
| "valid_targets_mean": 3674.4, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 3.3585858585858586, |
| "grad_norm": 0.6529576389515854, |
| "learning_rate": 2.4887855097927515e-05, |
| "loss": 0.3191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3396865725517273, |
| "step": 1330, |
| "valid_targets_mean": 3407.2, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 3.371212121212121, |
| "grad_norm": 0.7154816898888791, |
| "learning_rate": 2.4765612686420855e-05, |
| "loss": 0.3367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.343447744846344, |
| "step": 1335, |
| "valid_targets_mean": 2833.6, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 3.3838383838383836, |
| "grad_norm": 0.6736312101027783, |
| "learning_rate": 2.46431812303634e-05, |
| "loss": 0.378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32376375794410706, |
| "step": 1340, |
| "valid_targets_mean": 2666.4, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 3.3964646464646466, |
| "grad_norm": 0.6475094233289387, |
| "learning_rate": 2.4520565586423364e-05, |
| "loss": 0.3204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29635465145111084, |
| "step": 1345, |
| "valid_targets_mean": 2748.7, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 3.409090909090909, |
| "grad_norm": 0.5843996644681299, |
| "learning_rate": 2.4397770618575402e-05, |
| "loss": 0.3462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3405814468860626, |
| "step": 1350, |
| "valid_targets_mean": 3957.3, |
| "valid_targets_min": 1585 |
| }, |
| { |
| "epoch": 3.4217171717171717, |
| "grad_norm": 0.6569771648498826, |
| "learning_rate": 2.4274801197907665e-05, |
| "loss": 0.3674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35267573595046997, |
| "step": 1355, |
| "valid_targets_mean": 3056.4, |
| "valid_targets_min": 1380 |
| }, |
| { |
| "epoch": 3.4343434343434343, |
| "grad_norm": 0.6278190545664051, |
| "learning_rate": 2.4151662202428613e-05, |
| "loss": 0.3628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3695211410522461, |
| "step": 1360, |
| "valid_targets_mean": 3506.5, |
| "valid_targets_min": 1884 |
| }, |
| { |
| "epoch": 3.446969696969697, |
| "grad_norm": 0.634074126688538, |
| "learning_rate": 2.4028358516873427e-05, |
| "loss": 0.3216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3146069645881653, |
| "step": 1365, |
| "valid_targets_mean": 3289.8, |
| "valid_targets_min": 1669 |
| }, |
| { |
| "epoch": 3.45959595959596, |
| "grad_norm": 0.6801530900407086, |
| "learning_rate": 2.390489503251034e-05, |
| "loss": 0.3597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4268019199371338, |
| "step": 1370, |
| "valid_targets_mean": 3845.6, |
| "valid_targets_min": 1843 |
| }, |
| { |
| "epoch": 3.4722222222222223, |
| "grad_norm": 0.6302056512933344, |
| "learning_rate": 2.3781276646946526e-05, |
| "loss": 0.3483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35302233695983887, |
| "step": 1375, |
| "valid_targets_mean": 3840.2, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 3.484848484848485, |
| "grad_norm": 0.6377742108475873, |
| "learning_rate": 2.3657508263933874e-05, |
| "loss": 0.3612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33783674240112305, |
| "step": 1380, |
| "valid_targets_mean": 3263.4, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 3.4974747474747474, |
| "grad_norm": 0.7042898368764126, |
| "learning_rate": 2.3533594793174426e-05, |
| "loss": 0.3258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3383498191833496, |
| "step": 1385, |
| "valid_targets_mean": 2682.6, |
| "valid_targets_min": 1382 |
| }, |
| { |
| "epoch": 3.51010101010101, |
| "grad_norm": 0.7030408364050017, |
| "learning_rate": 2.3409541150125645e-05, |
| "loss": 0.3557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4075915217399597, |
| "step": 1390, |
| "valid_targets_mean": 3162.8, |
| "valid_targets_min": 1353 |
| }, |
| { |
| "epoch": 3.5227272727272725, |
| "grad_norm": 0.6274505021865276, |
| "learning_rate": 2.3285352255805398e-05, |
| "loss": 0.3496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31670212745666504, |
| "step": 1395, |
| "valid_targets_mean": 3087.0, |
| "valid_targets_min": 392 |
| }, |
| { |
| "epoch": 3.5353535353535355, |
| "grad_norm": 1.2486599391824142, |
| "learning_rate": 2.316103303659678e-05, |
| "loss": 0.3296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36197564005851746, |
| "step": 1400, |
| "valid_targets_mean": 3082.6, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 3.547979797979798, |
| "grad_norm": 0.5371320718863393, |
| "learning_rate": 2.3036588424052672e-05, |
| "loss": 0.351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3815935254096985, |
| "step": 1405, |
| "valid_targets_mean": 4752.9, |
| "valid_targets_min": 1819 |
| }, |
| { |
| "epoch": 3.5606060606060606, |
| "grad_norm": 0.705016854939806, |
| "learning_rate": 2.2912023354700105e-05, |
| "loss": 0.3665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3603851795196533, |
| "step": 1410, |
| "valid_targets_mean": 2926.8, |
| "valid_targets_min": 1512 |
| }, |
| { |
| "epoch": 3.573232323232323, |
| "grad_norm": 0.5984653768510367, |
| "learning_rate": 2.2787342769844444e-05, |
| "loss": 0.3222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3309054374694824, |
| "step": 1415, |
| "valid_targets_mean": 3481.1, |
| "valid_targets_min": 1110 |
| }, |
| { |
| "epoch": 3.5858585858585856, |
| "grad_norm": 0.8191525002477924, |
| "learning_rate": 2.2662551615373402e-05, |
| "loss": 0.3989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44843584299087524, |
| "step": 1420, |
| "valid_targets_mean": 2668.3, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 3.5984848484848486, |
| "grad_norm": 0.6651567018600946, |
| "learning_rate": 2.25376548415608e-05, |
| "loss": 0.3694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3173557221889496, |
| "step": 1425, |
| "valid_targets_mean": 2731.2, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 3.611111111111111, |
| "grad_norm": 0.6266431493382524, |
| "learning_rate": 2.241265740287021e-05, |
| "loss": 0.3443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29255497455596924, |
| "step": 1430, |
| "valid_targets_mean": 2907.2, |
| "valid_targets_min": 1479 |
| }, |
| { |
| "epoch": 3.6237373737373737, |
| "grad_norm": 0.5693607197936612, |
| "learning_rate": 2.2287564257758446e-05, |
| "loss": 0.3977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41386911273002625, |
| "step": 1435, |
| "valid_targets_mean": 4703.8, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 3.6363636363636362, |
| "grad_norm": 0.7080853718994018, |
| "learning_rate": 2.2162380368478836e-05, |
| "loss": 0.3847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3499618172645569, |
| "step": 1440, |
| "valid_targets_mean": 2786.1, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 3.648989898989899, |
| "grad_norm": 0.5548114926983784, |
| "learning_rate": 2.2037110700884395e-05, |
| "loss": 0.3565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25791436433792114, |
| "step": 1445, |
| "valid_targets_mean": 3419.7, |
| "valid_targets_min": 1345 |
| }, |
| { |
| "epoch": 3.6616161616161618, |
| "grad_norm": 0.5977854910500919, |
| "learning_rate": 2.1911760224230824e-05, |
| "loss": 0.3493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33634889125823975, |
| "step": 1450, |
| "valid_targets_mean": 3442.4, |
| "valid_targets_min": 1773 |
| }, |
| { |
| "epoch": 3.6742424242424243, |
| "grad_norm": 0.6796398481161333, |
| "learning_rate": 2.17863339109794e-05, |
| "loss": 0.3525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36308521032333374, |
| "step": 1455, |
| "valid_targets_mean": 3190.7, |
| "valid_targets_min": 1471 |
| }, |
| { |
| "epoch": 3.686868686868687, |
| "grad_norm": 0.6479531096999324, |
| "learning_rate": 2.166083673659973e-05, |
| "loss": 0.336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35041192173957825, |
| "step": 1460, |
| "valid_targets_mean": 3109.9, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 3.6994949494949494, |
| "grad_norm": 0.6190656382920072, |
| "learning_rate": 2.153527367937236e-05, |
| "loss": 0.3489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3769229054450989, |
| "step": 1465, |
| "valid_targets_mean": 3737.9, |
| "valid_targets_min": 1786 |
| }, |
| { |
| "epoch": 3.712121212121212, |
| "grad_norm": 0.6732653753234384, |
| "learning_rate": 2.140964972019132e-05, |
| "loss": 0.3496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3730910122394562, |
| "step": 1470, |
| "valid_targets_mean": 3028.1, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 3.724747474747475, |
| "grad_norm": 0.682620817181734, |
| "learning_rate": 2.128396984236651e-05, |
| "loss": 0.339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37931591272354126, |
| "step": 1475, |
| "valid_targets_mean": 3248.3, |
| "valid_targets_min": 1448 |
| }, |
| { |
| "epoch": 3.7373737373737375, |
| "grad_norm": 1.5193685144502576, |
| "learning_rate": 2.115823903142606e-05, |
| "loss": 0.3605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3566587567329407, |
| "step": 1480, |
| "valid_targets_mean": 3345.8, |
| "valid_targets_min": 603 |
| }, |
| { |
| "epoch": 3.75, |
| "grad_norm": 0.6092501389476551, |
| "learning_rate": 2.1032462274918517e-05, |
| "loss": 0.3393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30876415967941284, |
| "step": 1485, |
| "valid_targets_mean": 3301.3, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 3.7626262626262625, |
| "grad_norm": 0.7276893961486488, |
| "learning_rate": 2.0906644562215037e-05, |
| "loss": 0.3381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3389100432395935, |
| "step": 1490, |
| "valid_targets_mean": 2715.4, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 3.775252525252525, |
| "grad_norm": 0.5858712774395105, |
| "learning_rate": 2.078079088431143e-05, |
| "loss": 0.3767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3030000925064087, |
| "step": 1495, |
| "valid_targets_mean": 3219.7, |
| "valid_targets_min": 2366 |
| }, |
| { |
| "epoch": 3.787878787878788, |
| "grad_norm": 0.6888688838778153, |
| "learning_rate": 2.0654906233630197e-05, |
| "loss": 0.3738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.416027694940567, |
| "step": 1500, |
| "valid_targets_mean": 3128.2, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 2.516722408026756, |
| "grad_norm": 0.662986162649258, |
| "learning_rate": 3.23558282621135e-05, |
| "loss": 0.3218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29847097396850586, |
| "step": 1505, |
| "valid_targets_mean": 3091.0, |
| "valid_targets_min": 508 |
| }, |
| { |
| "epoch": 2.5250836120401337, |
| "grad_norm": 0.6783328257944375, |
| "learning_rate": 3.229014188825108e-05, |
| "loss": 0.3139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3512507975101471, |
| "step": 1510, |
| "valid_targets_mean": 3352.5, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 2.5334448160535117, |
| "grad_norm": 0.6677148404277962, |
| "learning_rate": 3.2224241814261216e-05, |
| "loss": 0.3225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26659291982650757, |
| "step": 1515, |
| "valid_targets_mean": 2794.4, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 2.5418060200668897, |
| "grad_norm": 0.7219771342415074, |
| "learning_rate": 3.215812918600978e-05, |
| "loss": 0.3324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3495546579360962, |
| "step": 1520, |
| "valid_targets_mean": 2987.6, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 2.5501672240802673, |
| "grad_norm": 0.6560298605364091, |
| "learning_rate": 3.209180515305855e-05, |
| "loss": 0.3119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.331092894077301, |
| "step": 1525, |
| "valid_targets_mean": 3713.1, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 2.5585284280936453, |
| "grad_norm": 0.6919955457501047, |
| "learning_rate": 3.2025270868645146e-05, |
| "loss": 0.3497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3320353925228119, |
| "step": 1530, |
| "valid_targets_mean": 3199.7, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 2.5668896321070234, |
| "grad_norm": 0.708863656128023, |
| "learning_rate": 3.195852748966306e-05, |
| "loss": 0.3478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36112624406814575, |
| "step": 1535, |
| "valid_targets_mean": 3085.5, |
| "valid_targets_min": 588 |
| }, |
| { |
| "epoch": 2.5752508361204014, |
| "grad_norm": 0.7471046326039033, |
| "learning_rate": 3.189157617664151e-05, |
| "loss": 0.3075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28388604521751404, |
| "step": 1540, |
| "valid_targets_mean": 2699.7, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 2.5836120401337794, |
| "grad_norm": 0.7471683542567666, |
| "learning_rate": 3.182441809372523e-05, |
| "loss": 0.317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33689889311790466, |
| "step": 1545, |
| "valid_targets_mean": 2698.6, |
| "valid_targets_min": 1551 |
| }, |
| { |
| "epoch": 2.591973244147157, |
| "grad_norm": 0.6750267862750765, |
| "learning_rate": 3.1757054408654266e-05, |
| "loss": 0.3833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2789178192615509, |
| "step": 1550, |
| "valid_targets_mean": 2798.8, |
| "valid_targets_min": 1573 |
| }, |
| { |
| "epoch": 2.600334448160535, |
| "grad_norm": 0.681930396951124, |
| "learning_rate": 3.168948629274367e-05, |
| "loss": 0.3283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3054756820201874, |
| "step": 1555, |
| "valid_targets_mean": 2962.2, |
| "valid_targets_min": 1403 |
| }, |
| { |
| "epoch": 2.608695652173913, |
| "grad_norm": 0.6634403273333718, |
| "learning_rate": 3.1621714920863104e-05, |
| "loss": 0.3259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4073365032672882, |
| "step": 1560, |
| "valid_targets_mean": 4461.2, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 2.617056856187291, |
| "grad_norm": 0.8238005424494197, |
| "learning_rate": 3.155374147141646e-05, |
| "loss": 0.3604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38494405150413513, |
| "step": 1565, |
| "valid_targets_mean": 2640.8, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 2.625418060200669, |
| "grad_norm": 0.7052867973145739, |
| "learning_rate": 3.1485567126321295e-05, |
| "loss": 0.3451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3390483260154724, |
| "step": 1570, |
| "valid_targets_mean": 3285.6, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 2.6337792642140467, |
| "grad_norm": 0.6953845280826801, |
| "learning_rate": 3.1417193070988383e-05, |
| "loss": 0.3313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3528243601322174, |
| "step": 1575, |
| "valid_targets_mean": 3543.2, |
| "valid_targets_min": 1601 |
| }, |
| { |
| "epoch": 2.6421404682274248, |
| "grad_norm": 0.7552847898076053, |
| "learning_rate": 3.134862049430099e-05, |
| "loss": 0.3392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39836952090263367, |
| "step": 1580, |
| "valid_targets_mean": 3433.9, |
| "valid_targets_min": 1805 |
| }, |
| { |
| "epoch": 2.650501672240803, |
| "grad_norm": 1.4277354366593005, |
| "learning_rate": 3.12798505885943e-05, |
| "loss": 0.36, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3085378408432007, |
| "step": 1585, |
| "valid_targets_mean": 3400.1, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 2.6588628762541804, |
| "grad_norm": 0.7410833217029822, |
| "learning_rate": 3.1210884549634624e-05, |
| "loss": 0.3107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28592583537101746, |
| "step": 1590, |
| "valid_targets_mean": 2576.4, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 2.6672240802675584, |
| "grad_norm": 0.8296406296042037, |
| "learning_rate": 3.114172357659861e-05, |
| "loss": 0.3542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.370746374130249, |
| "step": 1595, |
| "valid_targets_mean": 2589.8, |
| "valid_targets_min": 587 |
| }, |
| { |
| "epoch": 2.6755852842809364, |
| "grad_norm": 0.5928853152526612, |
| "learning_rate": 3.107236887205242e-05, |
| "loss": 0.3683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33890628814697266, |
| "step": 1600, |
| "valid_targets_mean": 4613.9, |
| "valid_targets_min": 1582 |
| }, |
| { |
| "epoch": 2.6839464882943145, |
| "grad_norm": 0.7237916757375374, |
| "learning_rate": 3.1002821641930815e-05, |
| "loss": 0.3467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3008784055709839, |
| "step": 1605, |
| "valid_targets_mean": 2820.9, |
| "valid_targets_min": 1351 |
| }, |
| { |
| "epoch": 2.6923076923076925, |
| "grad_norm": 0.6958603576096208, |
| "learning_rate": 3.093308309551616e-05, |
| "loss": 0.3285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26427051424980164, |
| "step": 1610, |
| "valid_targets_mean": 2401.6, |
| "valid_targets_min": 377 |
| }, |
| { |
| "epoch": 2.70066889632107, |
| "grad_norm": 0.7246194414411228, |
| "learning_rate": 3.0863154445417426e-05, |
| "loss": 0.3112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31494617462158203, |
| "step": 1615, |
| "valid_targets_mean": 2992.2, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 2.709030100334448, |
| "grad_norm": 0.6683077048389021, |
| "learning_rate": 3.079303690754908e-05, |
| "loss": 0.3588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46505263447761536, |
| "step": 1620, |
| "valid_targets_mean": 4923.4, |
| "valid_targets_min": 1295 |
| }, |
| { |
| "epoch": 2.717391304347826, |
| "grad_norm": 0.6839193880655342, |
| "learning_rate": 3.072273170110998e-05, |
| "loss": 0.344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3480769693851471, |
| "step": 1625, |
| "valid_targets_mean": 3295.5, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 2.7257525083612038, |
| "grad_norm": 0.6148350220041032, |
| "learning_rate": 3.0652240048562134e-05, |
| "loss": 0.3337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3841598629951477, |
| "step": 1630, |
| "valid_targets_mean": 4531.8, |
| "valid_targets_min": 2092 |
| }, |
| { |
| "epoch": 2.734113712374582, |
| "grad_norm": 0.7604959335941064, |
| "learning_rate": 3.058156317560945e-05, |
| "loss": 0.3097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3188338279724121, |
| "step": 1635, |
| "valid_targets_mean": 2672.3, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 2.74247491638796, |
| "grad_norm": 0.7495694482080785, |
| "learning_rate": 3.0510702311176477e-05, |
| "loss": 0.3385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28397685289382935, |
| "step": 1640, |
| "valid_targets_mean": 2509.3, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 2.750836120401338, |
| "grad_norm": 0.5960363613154568, |
| "learning_rate": 3.043965868738695e-05, |
| "loss": 0.33, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26706498861312866, |
| "step": 1645, |
| "valid_targets_mean": 3699.4, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 2.759197324414716, |
| "grad_norm": 0.6692357148144276, |
| "learning_rate": 3.0368433539542433e-05, |
| "loss": 0.3714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2700284719467163, |
| "step": 1650, |
| "valid_targets_mean": 3072.4, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 2.7675585284280935, |
| "grad_norm": 0.7677279753834415, |
| "learning_rate": 3.029702810610082e-05, |
| "loss": 0.3281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3318488895893097, |
| "step": 1655, |
| "valid_targets_mean": 2859.8, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 2.7759197324414715, |
| "grad_norm": 0.7231622567261902, |
| "learning_rate": 3.0225443628654787e-05, |
| "loss": 0.3182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3072254955768585, |
| "step": 1660, |
| "valid_targets_mean": 3285.6, |
| "valid_targets_min": 1067 |
| }, |
| { |
| "epoch": 2.7842809364548495, |
| "grad_norm": 0.7351401519067079, |
| "learning_rate": 3.0153681351910226e-05, |
| "loss": 0.3046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3622933626174927, |
| "step": 1665, |
| "valid_targets_mean": 3139.9, |
| "valid_targets_min": 1919 |
| }, |
| { |
| "epoch": 2.7926421404682276, |
| "grad_norm": 0.7218998613996677, |
| "learning_rate": 3.0081742523664576e-05, |
| "loss": 0.305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2836865782737732, |
| "step": 1670, |
| "valid_targets_mean": 2875.6, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 2.8010033444816056, |
| "grad_norm": 0.7498483662923942, |
| "learning_rate": 3.0009628394785158e-05, |
| "loss": 0.3279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2725030481815338, |
| "step": 1675, |
| "valid_targets_mean": 2490.9, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 2.809364548494983, |
| "grad_norm": 0.7901928997172852, |
| "learning_rate": 2.9937340219187402e-05, |
| "loss": 0.3407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3297320008277893, |
| "step": 1680, |
| "valid_targets_mean": 2595.1, |
| "valid_targets_min": 1608 |
| }, |
| { |
| "epoch": 2.817725752508361, |
| "grad_norm": 0.6829285663175374, |
| "learning_rate": 2.986487925381304e-05, |
| "loss": 0.3098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28002995252609253, |
| "step": 1685, |
| "valid_targets_mean": 2900.0, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 2.8260869565217392, |
| "grad_norm": 0.7868893655628152, |
| "learning_rate": 2.9792246758608283e-05, |
| "loss": 0.3628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3678167164325714, |
| "step": 1690, |
| "valid_targets_mean": 3206.1, |
| "valid_targets_min": 1573 |
| }, |
| { |
| "epoch": 2.834448160535117, |
| "grad_norm": 0.6961974009885317, |
| "learning_rate": 2.9719443996501858e-05, |
| "loss": 0.3441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3555162250995636, |
| "step": 1695, |
| "valid_targets_mean": 3276.0, |
| "valid_targets_min": 1491 |
| }, |
| { |
| "epoch": 2.842809364548495, |
| "grad_norm": 0.6616306549579406, |
| "learning_rate": 2.9646472233383118e-05, |
| "loss": 0.3263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.307451993227005, |
| "step": 1700, |
| "valid_targets_mean": 3025.1, |
| "valid_targets_min": 508 |
| }, |
| { |
| "epoch": 2.851170568561873, |
| "grad_norm": 0.699054155600686, |
| "learning_rate": 2.9573332738079964e-05, |
| "loss": 0.3428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.325960248708725, |
| "step": 1705, |
| "valid_targets_mean": 3397.9, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 2.859531772575251, |
| "grad_norm": 0.5618995876602438, |
| "learning_rate": 2.9500026782336828e-05, |
| "loss": 0.3321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3432704210281372, |
| "step": 1710, |
| "valid_targets_mean": 5129.1, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 2.867892976588629, |
| "grad_norm": 0.7396609388739099, |
| "learning_rate": 2.942655564079254e-05, |
| "loss": 0.3364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30100107192993164, |
| "step": 1715, |
| "valid_targets_mean": 2780.6, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 2.8762541806020065, |
| "grad_norm": 0.6882252256679291, |
| "learning_rate": 2.9352920590958173e-05, |
| "loss": 0.3636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3655456006526947, |
| "step": 1720, |
| "valid_targets_mean": 3660.6, |
| "valid_targets_min": 1486 |
| }, |
| { |
| "epoch": 2.8846153846153846, |
| "grad_norm": 0.6954294304011069, |
| "learning_rate": 2.927912291319482e-05, |
| "loss": 0.2649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2898782789707184, |
| "step": 1725, |
| "valid_targets_mean": 2949.5, |
| "valid_targets_min": 1417 |
| }, |
| { |
| "epoch": 2.8929765886287626, |
| "grad_norm": 0.7685790812651909, |
| "learning_rate": 2.9205163890691338e-05, |
| "loss": 0.3633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.351645827293396, |
| "step": 1730, |
| "valid_targets_mean": 3392.4, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 2.90133779264214, |
| "grad_norm": 0.6514952351452494, |
| "learning_rate": 2.9131044809442038e-05, |
| "loss": 0.3061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27277517318725586, |
| "step": 1735, |
| "valid_targets_mean": 3230.4, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 2.9096989966555182, |
| "grad_norm": 0.6336596359886507, |
| "learning_rate": 2.9056766958224324e-05, |
| "loss": 0.3282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31338661909103394, |
| "step": 1740, |
| "valid_targets_mean": 3871.8, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 2.9180602006688963, |
| "grad_norm": 0.7074870527746576, |
| "learning_rate": 2.898233162857627e-05, |
| "loss": 0.3159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31244152784347534, |
| "step": 1745, |
| "valid_targets_mean": 3252.4, |
| "valid_targets_min": 1672 |
| }, |
| { |
| "epoch": 2.9264214046822743, |
| "grad_norm": 0.7317476390005567, |
| "learning_rate": 2.8907740114774185e-05, |
| "loss": 0.3326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3308480381965637, |
| "step": 1750, |
| "valid_targets_mean": 2940.5, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 2.9347826086956523, |
| "grad_norm": 0.669207925359114, |
| "learning_rate": 2.8832993713810095e-05, |
| "loss": 0.3291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34635135531425476, |
| "step": 1755, |
| "valid_targets_mean": 3485.1, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 2.94314381270903, |
| "grad_norm": 0.7081348378617047, |
| "learning_rate": 2.8758093725369193e-05, |
| "loss": 0.3508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41460931301116943, |
| "step": 1760, |
| "valid_targets_mean": 3348.2, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 2.951505016722408, |
| "grad_norm": 0.6563436808159772, |
| "learning_rate": 2.868304145180722e-05, |
| "loss": 0.363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43143677711486816, |
| "step": 1765, |
| "valid_targets_mean": 5450.4, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 2.959866220735786, |
| "grad_norm": 1.0813836021947982, |
| "learning_rate": 2.8607838198127886e-05, |
| "loss": 0.3024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3358667194843292, |
| "step": 1770, |
| "valid_targets_mean": 2942.9, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 2.968227424749164, |
| "grad_norm": 0.6535458920771104, |
| "learning_rate": 2.8532485271960088e-05, |
| "loss": 0.3272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30923616886138916, |
| "step": 1775, |
| "valid_targets_mean": 3134.3, |
| "valid_targets_min": 1443 |
| }, |
| { |
| "epoch": 2.976588628762542, |
| "grad_norm": 0.7051449951363025, |
| "learning_rate": 2.8456983983535243e-05, |
| "loss": 0.3081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3197246789932251, |
| "step": 1780, |
| "valid_targets_mean": 3088.7, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 2.9849498327759196, |
| "grad_norm": 0.7514550832469282, |
| "learning_rate": 2.838133564566447e-05, |
| "loss": 0.3221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33178478479385376, |
| "step": 1785, |
| "valid_targets_mean": 2903.9, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 2.9933110367892977, |
| "grad_norm": 0.7487764007212119, |
| "learning_rate": 2.8305541573715775e-05, |
| "loss": 0.355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32397782802581787, |
| "step": 1790, |
| "valid_targets_mean": 2655.2, |
| "valid_targets_min": 364 |
| }, |
| { |
| "epoch": 3.0016722408026757, |
| "grad_norm": 0.697866012772672, |
| "learning_rate": 2.8229603085591178e-05, |
| "loss": 0.3045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24206683039665222, |
| "step": 1795, |
| "valid_targets_mean": 2628.6, |
| "valid_targets_min": 1232 |
| }, |
| { |
| "epoch": 3.0100334448160537, |
| "grad_norm": 0.7292123243657525, |
| "learning_rate": 2.8153521501703803e-05, |
| "loss": 0.3032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32684776186943054, |
| "step": 1800, |
| "valid_targets_mean": 3399.4, |
| "valid_targets_min": 1615 |
| }, |
| { |
| "epoch": 3.0183946488294313, |
| "grad_norm": 0.7473811261850504, |
| "learning_rate": 2.8077298144954904e-05, |
| "loss": 0.2602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2628287672996521, |
| "step": 1805, |
| "valid_targets_mean": 2887.2, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 3.0267558528428093, |
| "grad_norm": 0.7650083502129927, |
| "learning_rate": 2.8000934340710883e-05, |
| "loss": 0.316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30963340401649475, |
| "step": 1810, |
| "valid_targets_mean": 3063.6, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 3.0351170568561874, |
| "grad_norm": 0.7397530221539242, |
| "learning_rate": 2.792443141678022e-05, |
| "loss": 0.304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27429091930389404, |
| "step": 1815, |
| "valid_targets_mean": 2718.4, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 3.0434782608695654, |
| "grad_norm": 0.889361629882369, |
| "learning_rate": 2.784779070339041e-05, |
| "loss": 0.316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3256457448005676, |
| "step": 1820, |
| "valid_targets_mean": 2798.4, |
| "valid_targets_min": 470 |
| }, |
| { |
| "epoch": 3.051839464882943, |
| "grad_norm": 0.6809205141917194, |
| "learning_rate": 2.7771013533164805e-05, |
| "loss": 0.3188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3276858329772949, |
| "step": 1825, |
| "valid_targets_mean": 3351.5, |
| "valid_targets_min": 399 |
| }, |
| { |
| "epoch": 3.060200668896321, |
| "grad_norm": 0.6744548172485136, |
| "learning_rate": 2.7694101241099484e-05, |
| "loss": 0.3659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4031035006046295, |
| "step": 1830, |
| "valid_targets_mean": 4916.2, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 3.068561872909699, |
| "grad_norm": 0.7582120508573842, |
| "learning_rate": 2.7617055164539993e-05, |
| "loss": 0.3349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31827855110168457, |
| "step": 1835, |
| "valid_targets_mean": 2926.5, |
| "valid_targets_min": 2041 |
| }, |
| { |
| "epoch": 3.076923076923077, |
| "grad_norm": 0.8315396768017139, |
| "learning_rate": 2.753987664315813e-05, |
| "loss": 0.3021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35661745071411133, |
| "step": 1840, |
| "valid_targets_mean": 2858.8, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 3.0852842809364547, |
| "grad_norm": 0.7155190185107607, |
| "learning_rate": 2.746256701892861e-05, |
| "loss": 0.3741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3801868259906769, |
| "step": 1845, |
| "valid_targets_mean": 4064.2, |
| "valid_targets_min": 1411 |
| }, |
| { |
| "epoch": 3.0936454849498327, |
| "grad_norm": 0.6741071495612008, |
| "learning_rate": 2.738512763610579e-05, |
| "loss": 0.308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37737980484962463, |
| "step": 1850, |
| "valid_targets_mean": 4971.6, |
| "valid_targets_min": 1956 |
| }, |
| { |
| "epoch": 3.1020066889632107, |
| "grad_norm": 0.7590694014485702, |
| "learning_rate": 2.7307559841200238e-05, |
| "loss": 0.3291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3324778079986572, |
| "step": 1855, |
| "valid_targets_mean": 2946.1, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 3.1103678929765888, |
| "grad_norm": 0.7215558419615479, |
| "learning_rate": 2.7229864982955328e-05, |
| "loss": 0.3186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3469077944755554, |
| "step": 1860, |
| "valid_targets_mean": 3110.1, |
| "valid_targets_min": 1665 |
| }, |
| { |
| "epoch": 3.1187290969899664, |
| "grad_norm": 0.6897412184844943, |
| "learning_rate": 2.7152044412323842e-05, |
| "loss": 0.3075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28832149505615234, |
| "step": 1865, |
| "valid_targets_mean": 3266.5, |
| "valid_targets_min": 1272 |
| }, |
| { |
| "epoch": 3.1270903010033444, |
| "grad_norm": 0.8950983106159963, |
| "learning_rate": 2.7074099482444406e-05, |
| "loss": 0.3128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3346301317214966, |
| "step": 1870, |
| "valid_targets_mean": 2962.5, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 3.1354515050167224, |
| "grad_norm": 0.6829362728624939, |
| "learning_rate": 2.699603154861801e-05, |
| "loss": 0.3217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2530469298362732, |
| "step": 1875, |
| "valid_targets_mean": 3057.2, |
| "valid_targets_min": 1148 |
| }, |
| { |
| "epoch": 3.1438127090301005, |
| "grad_norm": 0.7233648289737619, |
| "learning_rate": 2.6917841968284433e-05, |
| "loss": 0.3161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3072529733181, |
| "step": 1880, |
| "valid_targets_mean": 2967.2, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 3.1521739130434785, |
| "grad_norm": 0.7416457175298982, |
| "learning_rate": 2.6839532100998623e-05, |
| "loss": 0.3185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3872751295566559, |
| "step": 1885, |
| "valid_targets_mean": 3862.7, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 3.160535117056856, |
| "grad_norm": 0.7812518570866998, |
| "learning_rate": 2.6761103308407076e-05, |
| "loss": 0.3277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25746119022369385, |
| "step": 1890, |
| "valid_targets_mean": 2487.5, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 3.168896321070234, |
| "grad_norm": 0.7436986096190392, |
| "learning_rate": 2.668255695422415e-05, |
| "loss": 0.3709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37360888719558716, |
| "step": 1895, |
| "valid_targets_mean": 3813.4, |
| "valid_targets_min": 1554 |
| }, |
| { |
| "epoch": 3.177257525083612, |
| "grad_norm": 0.7142319442876787, |
| "learning_rate": 2.660389440420836e-05, |
| "loss": 0.3068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.272394061088562, |
| "step": 1900, |
| "valid_targets_mean": 2995.9, |
| "valid_targets_min": 1008 |
| }, |
| { |
| "epoch": 3.1856187290969897, |
| "grad_norm": 0.7424793152458009, |
| "learning_rate": 2.6525117026138614e-05, |
| "loss": 0.3392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34922927618026733, |
| "step": 1905, |
| "valid_targets_mean": 3819.7, |
| "valid_targets_min": 1601 |
| }, |
| { |
| "epoch": 3.1939799331103678, |
| "grad_norm": 0.7607562321366768, |
| "learning_rate": 2.644622618979047e-05, |
| "loss": 0.2896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24981051683425903, |
| "step": 1910, |
| "valid_targets_mean": 2548.7, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 3.202341137123746, |
| "grad_norm": 0.6904862318660174, |
| "learning_rate": 2.6367223266912252e-05, |
| "loss": 0.3317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37764304876327515, |
| "step": 1915, |
| "valid_targets_mean": 3910.4, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 3.210702341137124, |
| "grad_norm": 0.8961099343679048, |
| "learning_rate": 2.6288109631201266e-05, |
| "loss": 0.3337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3819909393787384, |
| "step": 1920, |
| "valid_targets_mean": 2620.2, |
| "valid_targets_min": 942 |
| }, |
| { |
| "epoch": 3.219063545150502, |
| "grad_norm": 0.7566386982431123, |
| "learning_rate": 2.6208886658279875e-05, |
| "loss": 0.3137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3507644534111023, |
| "step": 1925, |
| "valid_targets_mean": 3339.7, |
| "valid_targets_min": 1683 |
| }, |
| { |
| "epoch": 3.2274247491638794, |
| "grad_norm": 0.8144566736238488, |
| "learning_rate": 2.6129555725671586e-05, |
| "loss": 0.3041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3747752010822296, |
| "step": 1930, |
| "valid_targets_mean": 2877.8, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 3.2357859531772575, |
| "grad_norm": 0.8094873874087346, |
| "learning_rate": 2.605011821277712e-05, |
| "loss": 0.306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3171420693397522, |
| "step": 1935, |
| "valid_targets_mean": 2959.7, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 3.2441471571906355, |
| "grad_norm": 0.8547392925559153, |
| "learning_rate": 2.597057550085037e-05, |
| "loss": 0.3001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27529996633529663, |
| "step": 1940, |
| "valid_targets_mean": 2264.8, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 3.2525083612040135, |
| "grad_norm": 0.6817740682466431, |
| "learning_rate": 2.589092897297447e-05, |
| "loss": 0.3122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33298245072364807, |
| "step": 1945, |
| "valid_targets_mean": 3641.5, |
| "valid_targets_min": 2028 |
| }, |
| { |
| "epoch": 3.260869565217391, |
| "grad_norm": 0.7178992056677376, |
| "learning_rate": 2.581118001403767e-05, |
| "loss": 0.3346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.298176109790802, |
| "step": 1950, |
| "valid_targets_mean": 2812.1, |
| "valid_targets_min": 1666 |
| }, |
| { |
| "epoch": 3.269230769230769, |
| "grad_norm": 0.821395268384391, |
| "learning_rate": 2.573133001070928e-05, |
| "loss": 0.3032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32294681668281555, |
| "step": 1955, |
| "valid_targets_mean": 2872.3, |
| "valid_targets_min": 1526 |
| }, |
| { |
| "epoch": 3.277591973244147, |
| "grad_norm": 0.7018121583116861, |
| "learning_rate": 2.565138035141558e-05, |
| "loss": 0.3199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32964542508125305, |
| "step": 1960, |
| "valid_targets_mean": 3175.1, |
| "valid_targets_min": 1682 |
| }, |
| { |
| "epoch": 3.2859531772575252, |
| "grad_norm": 1.1803702361445025, |
| "learning_rate": 2.557133242631565e-05, |
| "loss": 0.3063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3171846866607666, |
| "step": 1965, |
| "valid_targets_mean": 3355.6, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 3.294314381270903, |
| "grad_norm": 0.6610850683002595, |
| "learning_rate": 2.549118762727721e-05, |
| "loss": 0.3053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24194839596748352, |
| "step": 1970, |
| "valid_targets_mean": 3080.6, |
| "valid_targets_min": 1573 |
| }, |
| { |
| "epoch": 3.302675585284281, |
| "grad_norm": 0.7255555656749366, |
| "learning_rate": 2.5410947347852436e-05, |
| "loss": 0.3355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4482927620410919, |
| "step": 1975, |
| "valid_targets_mean": 4331.0, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 3.311036789297659, |
| "grad_norm": 0.7459931964816805, |
| "learning_rate": 2.5330612983253667e-05, |
| "loss": 0.3369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28639882802963257, |
| "step": 1980, |
| "valid_targets_mean": 3048.4, |
| "valid_targets_min": 1599 |
| }, |
| { |
| "epoch": 3.319397993311037, |
| "grad_norm": 0.7132568663511498, |
| "learning_rate": 2.5250185930329235e-05, |
| "loss": 0.3194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3665810227394104, |
| "step": 1985, |
| "valid_targets_mean": 3538.0, |
| "valid_targets_min": 1274 |
| }, |
| { |
| "epoch": 3.327759197324415, |
| "grad_norm": 0.8008208379218488, |
| "learning_rate": 2.5169667587539105e-05, |
| "loss": 0.3226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30878740549087524, |
| "step": 1990, |
| "valid_targets_mean": 2999.9, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 3.3361204013377925, |
| "grad_norm": 0.7114926198475543, |
| "learning_rate": 2.5089059354930584e-05, |
| "loss": 0.3253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3151680827140808, |
| "step": 1995, |
| "valid_targets_mean": 3198.5, |
| "valid_targets_min": 1876 |
| }, |
| { |
| "epoch": 3.3444816053511706, |
| "grad_norm": 0.6910899592340489, |
| "learning_rate": 2.5008362634113986e-05, |
| "loss": 0.3158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27248960733413696, |
| "step": 2000, |
| "valid_targets_mean": 3219.5, |
| "valid_targets_min": 1548 |
| }, |
| { |
| "epoch": 3.3528428093645486, |
| "grad_norm": 0.9194983641690248, |
| "learning_rate": 2.4927578828238253e-05, |
| "loss": 0.2827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30196303129196167, |
| "step": 2005, |
| "valid_targets_mean": 2675.1, |
| "valid_targets_min": 1560 |
| }, |
| { |
| "epoch": 3.361204013377926, |
| "grad_norm": 0.7413625053509546, |
| "learning_rate": 2.484670934196654e-05, |
| "loss": 0.3028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2616788148880005, |
| "step": 2010, |
| "valid_targets_mean": 2792.3, |
| "valid_targets_min": 1188 |
| }, |
| { |
| "epoch": 3.369565217391304, |
| "grad_norm": 0.7183291854874223, |
| "learning_rate": 2.476575558145183e-05, |
| "loss": 0.3222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3487267792224884, |
| "step": 2015, |
| "valid_targets_mean": 3637.6, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 3.3779264214046822, |
| "grad_norm": 0.7490283521521003, |
| "learning_rate": 2.468471895431243e-05, |
| "loss": 0.3021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.325644314289093, |
| "step": 2020, |
| "valid_targets_mean": 3182.8, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 3.3862876254180603, |
| "grad_norm": 0.7101402332669482, |
| "learning_rate": 2.4603600869607564e-05, |
| "loss": 0.3267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2660444378852844, |
| "step": 2025, |
| "valid_targets_mean": 2812.0, |
| "valid_targets_min": 1258 |
| }, |
| { |
| "epoch": 3.3946488294314383, |
| "grad_norm": 0.730576453198831, |
| "learning_rate": 2.452240273781281e-05, |
| "loss": 0.3016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26417773962020874, |
| "step": 2030, |
| "valid_targets_mean": 3180.6, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 3.403010033444816, |
| "grad_norm": 0.7181814679922088, |
| "learning_rate": 2.444112597079558e-05, |
| "loss": 0.3162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2812889814376831, |
| "step": 2035, |
| "valid_targets_mean": 3133.4, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 3.411371237458194, |
| "grad_norm": 0.7924112516136512, |
| "learning_rate": 2.435977198179065e-05, |
| "loss": 0.3287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27810171246528625, |
| "step": 2040, |
| "valid_targets_mean": 2717.6, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 3.419732441471572, |
| "grad_norm": 0.707141761893294, |
| "learning_rate": 2.4278342185375467e-05, |
| "loss": 0.3362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31040269136428833, |
| "step": 2045, |
| "valid_targets_mean": 3125.6, |
| "valid_targets_min": 1931 |
| }, |
| { |
| "epoch": 3.42809364548495, |
| "grad_norm": 0.7561619308472627, |
| "learning_rate": 2.4196837997445636e-05, |
| "loss": 0.3243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3123628795146942, |
| "step": 2050, |
| "valid_targets_mean": 3224.0, |
| "valid_targets_min": 1631 |
| }, |
| { |
| "epoch": 3.4364548494983276, |
| "grad_norm": 0.7289170075667627, |
| "learning_rate": 2.4115260835190285e-05, |
| "loss": 0.2989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2535760998725891, |
| "step": 2055, |
| "valid_targets_mean": 3353.6, |
| "valid_targets_min": 1805 |
| }, |
| { |
| "epoch": 3.4448160535117056, |
| "grad_norm": 0.945847336384475, |
| "learning_rate": 2.4033612117067396e-05, |
| "loss": 0.2888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2784852981567383, |
| "step": 2060, |
| "valid_targets_mean": 3911.6, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 3.4531772575250836, |
| "grad_norm": 0.7817559218890252, |
| "learning_rate": 2.395189326277918e-05, |
| "loss": 0.2968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3658587336540222, |
| "step": 2065, |
| "valid_targets_mean": 3038.2, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 3.4615384615384617, |
| "grad_norm": 0.7908249845730267, |
| "learning_rate": 2.3870105693247347e-05, |
| "loss": 0.3314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40112197399139404, |
| "step": 2070, |
| "valid_targets_mean": 3198.5, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 3.4698996655518393, |
| "grad_norm": 0.7869243206602189, |
| "learning_rate": 2.3788250830588437e-05, |
| "loss": 0.3191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2704690992832184, |
| "step": 2075, |
| "valid_targets_mean": 2424.8, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 3.4782608695652173, |
| "grad_norm": 0.7080463514373667, |
| "learning_rate": 2.3706330098089077e-05, |
| "loss": 0.314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3315350413322449, |
| "step": 2080, |
| "valid_targets_mean": 4324.7, |
| "valid_targets_min": 1855 |
| }, |
| { |
| "epoch": 3.4866220735785953, |
| "grad_norm": 0.8218808851621214, |
| "learning_rate": 2.3624344920181243e-05, |
| "loss": 0.2889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3174235224723816, |
| "step": 2085, |
| "valid_targets_mean": 2845.2, |
| "valid_targets_min": 1569 |
| }, |
| { |
| "epoch": 3.4949832775919734, |
| "grad_norm": 0.7054886370767576, |
| "learning_rate": 2.3542296722417452e-05, |
| "loss": 0.3309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3576347529888153, |
| "step": 2090, |
| "valid_targets_mean": 3957.9, |
| "valid_targets_min": 1892 |
| }, |
| { |
| "epoch": 3.5033444816053514, |
| "grad_norm": 0.7737550873720773, |
| "learning_rate": 2.346018693144605e-05, |
| "loss": 0.3147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3562350869178772, |
| "step": 2095, |
| "valid_targets_mean": 3385.3, |
| "valid_targets_min": 1565 |
| }, |
| { |
| "epoch": 3.511705685618729, |
| "grad_norm": 0.793659888489234, |
| "learning_rate": 2.3378016974986326e-05, |
| "loss": 0.3287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3222711384296417, |
| "step": 2100, |
| "valid_targets_mean": 2910.6, |
| "valid_targets_min": 1569 |
| }, |
| { |
| "epoch": 3.520066889632107, |
| "grad_norm": 0.8708230054218504, |
| "learning_rate": 2.3295788281803733e-05, |
| "loss": 0.3126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33255574107170105, |
| "step": 2105, |
| "valid_targets_mean": 3600.3, |
| "valid_targets_min": 1512 |
| }, |
| { |
| "epoch": 3.528428093645485, |
| "grad_norm": 0.7022641595914034, |
| "learning_rate": 2.321350228168505e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3107645511627197, |
| "step": 2110, |
| "valid_targets_mean": 3758.8, |
| "valid_targets_min": 1562 |
| }, |
| { |
| "epoch": 3.5367892976588626, |
| "grad_norm": 0.8652735159983888, |
| "learning_rate": 2.3131160405413472e-05, |
| "loss": 0.2842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26982659101486206, |
| "step": 2115, |
| "valid_targets_mean": 2795.1, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 3.5451505016722407, |
| "grad_norm": 0.656569555739008, |
| "learning_rate": 2.30487640847438e-05, |
| "loss": 0.3267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3019533157348633, |
| "step": 2120, |
| "valid_targets_mean": 3843.1, |
| "valid_targets_min": 1730 |
| }, |
| { |
| "epoch": 3.5535117056856187, |
| "grad_norm": 0.721412813412654, |
| "learning_rate": 2.296631475237749e-05, |
| "loss": 0.3217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.326846718788147, |
| "step": 2125, |
| "valid_targets_mean": 3144.4, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 3.5618729096989967, |
| "grad_norm": 0.8698536209082071, |
| "learning_rate": 2.2883813841937754e-05, |
| "loss": 0.3396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32312431931495667, |
| "step": 2130, |
| "valid_targets_mean": 2314.3, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 3.5702341137123748, |
| "grad_norm": 0.8109874750171677, |
| "learning_rate": 2.2801262787944668e-05, |
| "loss": 0.3159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.298412948846817, |
| "step": 2135, |
| "valid_targets_mean": 3258.5, |
| "valid_targets_min": 1480 |
| }, |
| { |
| "epoch": 3.5785953177257523, |
| "grad_norm": 0.8162989082018804, |
| "learning_rate": 2.2718663025790183e-05, |
| "loss": 0.3138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2839236259460449, |
| "step": 2140, |
| "valid_targets_mean": 2840.1, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 3.5869565217391304, |
| "grad_norm": 0.8038116768717268, |
| "learning_rate": 2.2636015991713167e-05, |
| "loss": 0.3237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3331753611564636, |
| "step": 2145, |
| "valid_targets_mean": 2935.8, |
| "valid_targets_min": 1186 |
| }, |
| { |
| "epoch": 3.5953177257525084, |
| "grad_norm": 0.7739334985662348, |
| "learning_rate": 2.2553323122774487e-05, |
| "loss": 0.2988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3323972821235657, |
| "step": 2150, |
| "valid_targets_mean": 3164.0, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 3.6036789297658864, |
| "grad_norm": 0.7740161292149046, |
| "learning_rate": 2.2470585856831953e-05, |
| "loss": 0.2824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25347644090652466, |
| "step": 2155, |
| "valid_targets_mean": 2834.1, |
| "valid_targets_min": 1341 |
| }, |
| { |
| "epoch": 3.6120401337792645, |
| "grad_norm": 0.6771441745861378, |
| "learning_rate": 2.2387805632515365e-05, |
| "loss": 0.3432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31761401891708374, |
| "step": 2160, |
| "valid_targets_mean": 4497.9, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 3.620401337792642, |
| "grad_norm": 0.7521566633081039, |
| "learning_rate": 2.2304983889201467e-05, |
| "loss": 0.3186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3334948420524597, |
| "step": 2165, |
| "valid_targets_mean": 3627.6, |
| "valid_targets_min": 1882 |
| }, |
| { |
| "epoch": 3.62876254180602, |
| "grad_norm": 0.7031338023674866, |
| "learning_rate": 2.222212206698894e-05, |
| "loss": 0.3302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24446901679039001, |
| "step": 2170, |
| "valid_targets_mean": 2985.4, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 3.637123745819398, |
| "grad_norm": 0.6866912372395072, |
| "learning_rate": 2.2139221606673353e-05, |
| "loss": 0.3618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3053354024887085, |
| "step": 2175, |
| "valid_targets_mean": 3322.4, |
| "valid_targets_min": 1844 |
| }, |
| { |
| "epoch": 3.6454849498327757, |
| "grad_norm": 0.7043379955622305, |
| "learning_rate": 2.2056283949722114e-05, |
| "loss": 0.3045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29806143045425415, |
| "step": 2180, |
| "valid_targets_mean": 3245.2, |
| "valid_targets_min": 1284 |
| }, |
| { |
| "epoch": 3.6538461538461537, |
| "grad_norm": 0.7223387295053122, |
| "learning_rate": 2.197331053824939e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2715410888195038, |
| "step": 2185, |
| "valid_targets_mean": 3403.3, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 3.6622073578595318, |
| "grad_norm": 0.7923524210124755, |
| "learning_rate": 2.1890302814991075e-05, |
| "loss": 0.293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27055805921554565, |
| "step": 2190, |
| "valid_targets_mean": 2505.2, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 3.67056856187291, |
| "grad_norm": 0.9333927510801652, |
| "learning_rate": 2.1807262223279633e-05, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33472126722335815, |
| "step": 2195, |
| "valid_targets_mean": 2667.6, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 3.678929765886288, |
| "grad_norm": 0.7418078632890535, |
| "learning_rate": 2.172419020701907e-05, |
| "loss": 0.3113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2958923280239105, |
| "step": 2200, |
| "valid_targets_mean": 3098.1, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 3.6872909698996654, |
| "grad_norm": 0.8027987445224076, |
| "learning_rate": 2.1641088210659804e-05, |
| "loss": 0.3027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.294519305229187, |
| "step": 2205, |
| "valid_targets_mean": 2970.6, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 3.6956521739130435, |
| "grad_norm": 0.8206281052811005, |
| "learning_rate": 2.155795767917352e-05, |
| "loss": 0.2961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31719639897346497, |
| "step": 2210, |
| "valid_targets_mean": 3145.6, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 3.7040133779264215, |
| "grad_norm": 0.7960144879970568, |
| "learning_rate": 2.14748000580281e-05, |
| "loss": 0.3162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3015314042568207, |
| "step": 2215, |
| "valid_targets_mean": 2424.9, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 3.712374581939799, |
| "grad_norm": 0.7242043132987579, |
| "learning_rate": 2.1391616793162435e-05, |
| "loss": 0.319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29711389541625977, |
| "step": 2220, |
| "valid_targets_mean": 3244.1, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 3.720735785953177, |
| "grad_norm": 0.8514530826111597, |
| "learning_rate": 2.1308409330961308e-05, |
| "loss": 0.309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3484026789665222, |
| "step": 2225, |
| "valid_targets_mean": 3235.6, |
| "valid_targets_min": 509 |
| }, |
| { |
| "epoch": 3.729096989966555, |
| "grad_norm": 0.7964054451384952, |
| "learning_rate": 2.122517911823027e-05, |
| "loss": 0.3255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2610142230987549, |
| "step": 2230, |
| "valid_targets_mean": 2320.4, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 3.737458193979933, |
| "grad_norm": 0.8055361034248192, |
| "learning_rate": 2.114192760217042e-05, |
| "loss": 0.2997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3181573450565338, |
| "step": 2235, |
| "valid_targets_mean": 3128.3, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 3.745819397993311, |
| "grad_norm": 0.7412318158314767, |
| "learning_rate": 2.10586562303533e-05, |
| "loss": 0.2753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2673335671424866, |
| "step": 2240, |
| "valid_targets_mean": 2812.3, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 3.754180602006689, |
| "grad_norm": 0.806735595661349, |
| "learning_rate": 2.0975366450695707e-05, |
| "loss": 0.2901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34919291734695435, |
| "step": 2245, |
| "valid_targets_mean": 2936.5, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 3.762541806020067, |
| "grad_norm": 0.7799986710841482, |
| "learning_rate": 2.0892059711434496e-05, |
| "loss": 0.3019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30157431960105896, |
| "step": 2250, |
| "valid_targets_mean": 2891.5, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 3.770903010033445, |
| "grad_norm": 0.6961704800642899, |
| "learning_rate": 2.0808737461101417e-05, |
| "loss": 0.2889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2948909401893616, |
| "step": 2255, |
| "valid_targets_mean": 3901.8, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 3.779264214046823, |
| "grad_norm": 0.6430882576013616, |
| "learning_rate": 2.0725401148497946e-05, |
| "loss": 0.3453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36942294239997864, |
| "step": 2260, |
| "valid_targets_mean": 4432.6, |
| "valid_targets_min": 2022 |
| }, |
| { |
| "epoch": 3.787625418060201, |
| "grad_norm": 0.9476578148171562, |
| "learning_rate": 2.0642052222670043e-05, |
| "loss": 0.3016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34764429926872253, |
| "step": 2265, |
| "valid_targets_mean": 2577.2, |
| "valid_targets_min": 586 |
| }, |
| { |
| "epoch": 3.7959866220735785, |
| "grad_norm": 0.8377190542394216, |
| "learning_rate": 2.0558692132883008e-05, |
| "loss": 0.31, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3148440420627594, |
| "step": 2270, |
| "valid_targets_mean": 2928.6, |
| "valid_targets_min": 1524 |
| }, |
| { |
| "epoch": 3.8043478260869565, |
| "grad_norm": 0.7674746381928171, |
| "learning_rate": 2.047532232859625e-05, |
| "loss": 0.3163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2882377505302429, |
| "step": 2275, |
| "valid_targets_mean": 3211.1, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 3.8127090301003346, |
| "grad_norm": 0.7603539777572138, |
| "learning_rate": 2.039194425943808e-05, |
| "loss": 0.3297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28924140334129333, |
| "step": 2280, |
| "valid_targets_mean": 2899.9, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 3.821070234113712, |
| "grad_norm": 0.6686475071499299, |
| "learning_rate": 2.0308559375180557e-05, |
| "loss": 0.274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22952501475811005, |
| "step": 2285, |
| "valid_targets_mean": 2880.6, |
| "valid_targets_min": 1364 |
| }, |
| { |
| "epoch": 3.82943143812709, |
| "grad_norm": 0.9368254198322394, |
| "learning_rate": 2.0225169125714193e-05, |
| "loss": 0.3089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3129611909389496, |
| "step": 2290, |
| "valid_targets_mean": 3224.8, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 3.8377926421404682, |
| "grad_norm": 0.8093927362873512, |
| "learning_rate": 2.0141774961022826e-05, |
| "loss": 0.2892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30943459272384644, |
| "step": 2295, |
| "valid_targets_mean": 2797.4, |
| "valid_targets_min": 1188 |
| }, |
| { |
| "epoch": 3.8461538461538463, |
| "grad_norm": 0.8283893332898696, |
| "learning_rate": 2.0058378331158357e-05, |
| "loss": 0.2882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3456169366836548, |
| "step": 2300, |
| "valid_targets_mean": 3146.9, |
| "valid_targets_min": 983 |
| }, |
| { |
| "epoch": 3.8545150501672243, |
| "grad_norm": 0.8137074950993536, |
| "learning_rate": 1.9974980686215546e-05, |
| "loss": 0.2795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24720898270606995, |
| "step": 2305, |
| "valid_targets_mean": 2561.4, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 3.862876254180602, |
| "grad_norm": 0.7732084599764113, |
| "learning_rate": 1.9891583476306814e-05, |
| "loss": 0.327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31134891510009766, |
| "step": 2310, |
| "valid_targets_mean": 2994.1, |
| "valid_targets_min": 377 |
| }, |
| { |
| "epoch": 3.87123745819398, |
| "grad_norm": 0.7919123584972602, |
| "learning_rate": 1.9808188151537008e-05, |
| "loss": 0.2996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25116395950317383, |
| "step": 2315, |
| "valid_targets_mean": 2886.5, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 3.879598662207358, |
| "grad_norm": 0.7406481098660109, |
| "learning_rate": 1.972479616197821e-05, |
| "loss": 0.3043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27166545391082764, |
| "step": 2320, |
| "valid_targets_mean": 3462.1, |
| "valid_targets_min": 1420 |
| }, |
| { |
| "epoch": 3.8879598662207355, |
| "grad_norm": 0.8731416317069042, |
| "learning_rate": 1.96414089576445e-05, |
| "loss": 0.2973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35053551197052, |
| "step": 2325, |
| "valid_targets_mean": 2947.4, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 3.8963210702341136, |
| "grad_norm": 0.7355424472980551, |
| "learning_rate": 1.9558027988466743e-05, |
| "loss": 0.3077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31646502017974854, |
| "step": 2330, |
| "valid_targets_mean": 3953.5, |
| "valid_targets_min": 1805 |
| }, |
| { |
| "epoch": 3.9046822742474916, |
| "grad_norm": 0.7933779157508104, |
| "learning_rate": 1.947465470426741e-05, |
| "loss": 0.3036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2982478141784668, |
| "step": 2335, |
| "valid_targets_mean": 3171.0, |
| "valid_targets_min": 587 |
| }, |
| { |
| "epoch": 3.9130434782608696, |
| "grad_norm": 0.8102903523307262, |
| "learning_rate": 1.9391290554735326e-05, |
| "loss": 0.3092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3341084122657776, |
| "step": 2340, |
| "valid_targets_mean": 2779.8, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 3.9214046822742477, |
| "grad_norm": 0.7472511964464619, |
| "learning_rate": 1.93079369894005e-05, |
| "loss": 0.3187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30373987555503845, |
| "step": 2345, |
| "valid_targets_mean": 3103.1, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 3.9297658862876252, |
| "grad_norm": 0.7947702151134352, |
| "learning_rate": 1.922459545760889e-05, |
| "loss": 0.3175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.363625705242157, |
| "step": 2350, |
| "valid_targets_mean": 3638.0, |
| "valid_targets_min": 1698 |
| }, |
| { |
| "epoch": 3.9381270903010033, |
| "grad_norm": 0.8068716471695595, |
| "learning_rate": 1.914126740849723e-05, |
| "loss": 0.3014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2704453766345978, |
| "step": 2355, |
| "valid_targets_mean": 2755.2, |
| "valid_targets_min": 1140 |
| }, |
| { |
| "epoch": 3.9464882943143813, |
| "grad_norm": 0.8320104780946185, |
| "learning_rate": 1.9057954290967795e-05, |
| "loss": 0.3297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38438886404037476, |
| "step": 2360, |
| "valid_targets_mean": 4250.0, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 3.9548494983277593, |
| "grad_norm": 0.7539305683119704, |
| "learning_rate": 1.897465755366325e-05, |
| "loss": 0.3009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3422359228134155, |
| "step": 2365, |
| "valid_targets_mean": 3382.0, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 3.9632107023411374, |
| "grad_norm": 0.7840574192641151, |
| "learning_rate": 1.8891378644941437e-05, |
| "loss": 0.2832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31690046191215515, |
| "step": 2370, |
| "valid_targets_mean": 3137.6, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 3.971571906354515, |
| "grad_norm": 0.7175563191342146, |
| "learning_rate": 1.88081190128502e-05, |
| "loss": 0.2915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30410125851631165, |
| "step": 2375, |
| "valid_targets_mean": 3167.8, |
| "valid_targets_min": 1180 |
| }, |
| { |
| "epoch": 3.979933110367893, |
| "grad_norm": 0.7773926485050648, |
| "learning_rate": 1.8724880105102196e-05, |
| "loss": 0.2751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2675161361694336, |
| "step": 2380, |
| "valid_targets_mean": 3070.1, |
| "valid_targets_min": 1741 |
| }, |
| { |
| "epoch": 3.988294314381271, |
| "grad_norm": 0.7560734554908822, |
| "learning_rate": 1.8641663369049724e-05, |
| "loss": 0.287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2527911365032196, |
| "step": 2385, |
| "valid_targets_mean": 2798.2, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 3.9966555183946486, |
| "grad_norm": 0.9060459955316458, |
| "learning_rate": 1.8558470251659574e-05, |
| "loss": 0.2824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27911093831062317, |
| "step": 2390, |
| "valid_targets_mean": 2562.9, |
| "valid_targets_min": 633 |
| }, |
| { |
| "epoch": 4.005016722408027, |
| "grad_norm": 0.8594449711299057, |
| "learning_rate": 1.8475302199487848e-05, |
| "loss": 0.309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2793564200401306, |
| "step": 2395, |
| "valid_targets_mean": 3010.3, |
| "valid_targets_min": 1511 |
| }, |
| { |
| "epoch": 4.013377926421405, |
| "grad_norm": 0.8838950374531943, |
| "learning_rate": 1.8392160658654826e-05, |
| "loss": 0.2648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3361824154853821, |
| "step": 2400, |
| "valid_targets_mean": 3615.7, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 4.021739130434782, |
| "grad_norm": 0.7437793364772181, |
| "learning_rate": 1.8309047074819805e-05, |
| "loss": 0.3187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2967781126499176, |
| "step": 2405, |
| "valid_targets_mean": 3316.2, |
| "valid_targets_min": 508 |
| }, |
| { |
| "epoch": 4.030100334448161, |
| "grad_norm": 0.8335679273374376, |
| "learning_rate": 1.822596289315596e-05, |
| "loss": 0.281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29241418838500977, |
| "step": 2410, |
| "valid_targets_mean": 3000.0, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 4.038461538461538, |
| "grad_norm": 0.9450863777551641, |
| "learning_rate": 1.814290955832523e-05, |
| "loss": 0.2639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27432459592819214, |
| "step": 2415, |
| "valid_targets_mean": 2766.5, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 4.046822742474917, |
| "grad_norm": 0.6892365494886082, |
| "learning_rate": 1.8059888514453196e-05, |
| "loss": 0.2743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35358893871307373, |
| "step": 2420, |
| "valid_targets_mean": 4687.2, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 4.055183946488294, |
| "grad_norm": 0.8546396818192133, |
| "learning_rate": 1.7976901205103953e-05, |
| "loss": 0.2409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2732149660587311, |
| "step": 2425, |
| "valid_targets_mean": 2872.1, |
| "valid_targets_min": 1565 |
| }, |
| { |
| "epoch": 4.063545150501672, |
| "grad_norm": 0.9074538701365267, |
| "learning_rate": 1.789394907325504e-05, |
| "loss": 0.2829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27739718556404114, |
| "step": 2430, |
| "valid_targets_mean": 2549.9, |
| "valid_targets_min": 412 |
| }, |
| { |
| "epoch": 4.0719063545150505, |
| "grad_norm": 0.7010499122198948, |
| "learning_rate": 1.7811033561272328e-05, |
| "loss": 0.2805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28559303283691406, |
| "step": 2435, |
| "valid_targets_mean": 4280.4, |
| "valid_targets_min": 1688 |
| }, |
| { |
| "epoch": 4.080267558528428, |
| "grad_norm": 0.7783072544646484, |
| "learning_rate": 1.7728156110884924e-05, |
| "loss": 0.2541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27712807059288025, |
| "step": 2440, |
| "valid_targets_mean": 3133.4, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 4.088628762541806, |
| "grad_norm": 0.8270554308257784, |
| "learning_rate": 1.7645318163160146e-05, |
| "loss": 0.3121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2960726022720337, |
| "step": 2445, |
| "valid_targets_mean": 3287.0, |
| "valid_targets_min": 1298 |
| }, |
| { |
| "epoch": 4.096989966555184, |
| "grad_norm": 0.8001563378250733, |
| "learning_rate": 1.7562521158478432e-05, |
| "loss": 0.279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23369301855564117, |
| "step": 2450, |
| "valid_targets_mean": 3446.6, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 4.105351170568562, |
| "grad_norm": 0.8436159622655983, |
| "learning_rate": 1.7479766536508313e-05, |
| "loss": 0.292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28451332449913025, |
| "step": 2455, |
| "valid_targets_mean": 3320.6, |
| "valid_targets_min": 1505 |
| }, |
| { |
| "epoch": 4.11371237458194, |
| "grad_norm": 0.8511630672848115, |
| "learning_rate": 1.7397055736181366e-05, |
| "loss": 0.2975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2644152343273163, |
| "step": 2460, |
| "valid_targets_mean": 2837.6, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 4.122073578595318, |
| "grad_norm": 0.8329359927809505, |
| "learning_rate": 1.7314390195667193e-05, |
| "loss": 0.2839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27568697929382324, |
| "step": 2465, |
| "valid_targets_mean": 3675.1, |
| "valid_targets_min": 1439 |
| }, |
| { |
| "epoch": 4.130434782608695, |
| "grad_norm": 0.8456711766375431, |
| "learning_rate": 1.723177135234844e-05, |
| "loss": 0.2939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2696060538291931, |
| "step": 2470, |
| "valid_targets_mean": 3198.6, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 4.138795986622074, |
| "grad_norm": 0.8660274510460868, |
| "learning_rate": 1.7149200642795765e-05, |
| "loss": 0.2902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39124855399131775, |
| "step": 2475, |
| "valid_targets_mean": 3618.2, |
| "valid_targets_min": 1647 |
| }, |
| { |
| "epoch": 4.147157190635451, |
| "grad_norm": 0.8805366064387657, |
| "learning_rate": 1.70666795027429e-05, |
| "loss": 0.2943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3205997943878174, |
| "step": 2480, |
| "valid_targets_mean": 3357.6, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 4.15551839464883, |
| "grad_norm": 0.8831645923939866, |
| "learning_rate": 1.6984209367061657e-05, |
| "loss": 0.2741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3723400831222534, |
| "step": 2485, |
| "valid_targets_mean": 4439.7, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 4.1638795986622075, |
| "grad_norm": 0.8033626392233867, |
| "learning_rate": 1.6901791669736974e-05, |
| "loss": 0.2835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23729437589645386, |
| "step": 2490, |
| "valid_targets_mean": 3279.5, |
| "valid_targets_min": 1317 |
| }, |
| { |
| "epoch": 4.172240802675585, |
| "grad_norm": 0.8529045414447846, |
| "learning_rate": 1.6819427843842016e-05, |
| "loss": 0.2724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24402417242527008, |
| "step": 2495, |
| "valid_targets_mean": 2829.3, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 4.1806020066889635, |
| "grad_norm": 0.7772728028989128, |
| "learning_rate": 1.6737119321513224e-05, |
| "loss": 0.3132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3176288604736328, |
| "step": 2500, |
| "valid_targets_mean": 3672.4, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 4.188963210702341, |
| "grad_norm": 0.8338000934996834, |
| "learning_rate": 1.6654867533925418e-05, |
| "loss": 0.2758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2721063494682312, |
| "step": 2505, |
| "valid_targets_mean": 3436.9, |
| "valid_targets_min": 1539 |
| }, |
| { |
| "epoch": 4.197324414715719, |
| "grad_norm": 0.8267713909712678, |
| "learning_rate": 1.6572673911266943e-05, |
| "loss": 0.2976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28024280071258545, |
| "step": 2510, |
| "valid_targets_mean": 3187.4, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 4.205685618729097, |
| "grad_norm": 0.9157546033073007, |
| "learning_rate": 1.6490539882714756e-05, |
| "loss": 0.2999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2485034167766571, |
| "step": 2515, |
| "valid_targets_mean": 2835.7, |
| "valid_targets_min": 1525 |
| }, |
| { |
| "epoch": 4.214046822742475, |
| "grad_norm": 0.9249610301165988, |
| "learning_rate": 1.6408466876409596e-05, |
| "loss": 0.2725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23990267515182495, |
| "step": 2520, |
| "valid_targets_mean": 2692.9, |
| "valid_targets_min": 490 |
| }, |
| { |
| "epoch": 4.222408026755853, |
| "grad_norm": 0.8518340628069135, |
| "learning_rate": 1.6326456319431154e-05, |
| "loss": 0.2999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31082072854042053, |
| "step": 2525, |
| "valid_targets_mean": 3444.6, |
| "valid_targets_min": 1569 |
| }, |
| { |
| "epoch": 4.230769230769231, |
| "grad_norm": 0.9837882931443535, |
| "learning_rate": 1.6244509637773256e-05, |
| "loss": 0.2714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29353979229927063, |
| "step": 2530, |
| "valid_targets_mean": 3000.7, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 4.239130434782608, |
| "grad_norm": 0.8579109041612042, |
| "learning_rate": 1.6162628256319078e-05, |
| "loss": 0.2849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2931848168373108, |
| "step": 2535, |
| "valid_targets_mean": 2974.6, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 4.247491638795987, |
| "grad_norm": 0.7372703580470882, |
| "learning_rate": 1.6080813598816355e-05, |
| "loss": 0.3212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35204175114631653, |
| "step": 2540, |
| "valid_targets_mean": 4623.1, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 4.2558528428093645, |
| "grad_norm": 0.9167357129141266, |
| "learning_rate": 1.599906708785262e-05, |
| "loss": 0.2447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23422318696975708, |
| "step": 2545, |
| "valid_targets_mean": 2499.6, |
| "valid_targets_min": 1144 |
| }, |
| { |
| "epoch": 4.264214046822742, |
| "grad_norm": 0.8898102183876689, |
| "learning_rate": 1.5917390144830488e-05, |
| "loss": 0.2956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.295245885848999, |
| "step": 2550, |
| "valid_targets_mean": 3242.8, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 4.2725752508361206, |
| "grad_norm": 0.9416423066048137, |
| "learning_rate": 1.583578418994294e-05, |
| "loss": 0.2993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23591409623622894, |
| "step": 2555, |
| "valid_targets_mean": 2772.4, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 4.280936454849498, |
| "grad_norm": 0.8396792312207702, |
| "learning_rate": 1.5754250642148592e-05, |
| "loss": 0.2838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2691681385040283, |
| "step": 2560, |
| "valid_targets_mean": 3140.4, |
| "valid_targets_min": 1822 |
| }, |
| { |
| "epoch": 4.289297658862877, |
| "grad_norm": 0.7552376746174522, |
| "learning_rate": 1.5672790919147096e-05, |
| "loss": 0.2648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30901944637298584, |
| "step": 2565, |
| "valid_targets_mean": 3934.4, |
| "valid_targets_min": 1525 |
| }, |
| { |
| "epoch": 4.297658862876254, |
| "grad_norm": 0.9282959640580136, |
| "learning_rate": 1.5591406437354394e-05, |
| "loss": 0.2932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2631564736366272, |
| "step": 2570, |
| "valid_targets_mean": 3684.6, |
| "valid_targets_min": 603 |
| }, |
| { |
| "epoch": 4.306020066889632, |
| "grad_norm": 0.8408763401027246, |
| "learning_rate": 1.5510098611878177e-05, |
| "loss": 0.2522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1855039745569229, |
| "step": 2575, |
| "valid_targets_mean": 2278.2, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 4.31438127090301, |
| "grad_norm": 0.9661559358244203, |
| "learning_rate": 1.542886885649322e-05, |
| "loss": 0.2875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20213311910629272, |
| "step": 2580, |
| "valid_targets_mean": 2565.0, |
| "valid_targets_min": 1622 |
| }, |
| { |
| "epoch": 4.322742474916388, |
| "grad_norm": 0.8691049252102782, |
| "learning_rate": 1.534771858361683e-05, |
| "loss": 0.2705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2871206998825073, |
| "step": 2585, |
| "valid_targets_mean": 3261.2, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 4.331103678929766, |
| "grad_norm": 0.8392260775398249, |
| "learning_rate": 1.5266649204284273e-05, |
| "loss": 0.2793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2738720774650574, |
| "step": 2590, |
| "valid_targets_mean": 3433.5, |
| "valid_targets_min": 1852 |
| }, |
| { |
| "epoch": 4.339464882943144, |
| "grad_norm": 0.8840473177758481, |
| "learning_rate": 1.5185662128124254e-05, |
| "loss": 0.2594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2708375155925751, |
| "step": 2595, |
| "valid_targets_mean": 3278.4, |
| "valid_targets_min": 399 |
| }, |
| { |
| "epoch": 4.3478260869565215, |
| "grad_norm": 0.8804892196325519, |
| "learning_rate": 1.510475876333438e-05, |
| "loss": 0.2994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23639748990535736, |
| "step": 2600, |
| "valid_targets_mean": 2654.6, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 4.3561872909699, |
| "grad_norm": 0.8094688600381953, |
| "learning_rate": 1.5023940516656697e-05, |
| "loss": 0.2935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2887652516365051, |
| "step": 2605, |
| "valid_targets_mean": 3643.9, |
| "valid_targets_min": 2109 |
| }, |
| { |
| "epoch": 4.364548494983278, |
| "grad_norm": 0.9244051200125512, |
| "learning_rate": 1.4943208793353235e-05, |
| "loss": 0.2653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2914060056209564, |
| "step": 2610, |
| "valid_targets_mean": 3336.8, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 4.372909698996655, |
| "grad_norm": 0.7461063611424056, |
| "learning_rate": 1.4862564997181528e-05, |
| "loss": 0.2765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36067837476730347, |
| "step": 2615, |
| "valid_targets_mean": 5280.1, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 4.381270903010034, |
| "grad_norm": 0.9652367742763335, |
| "learning_rate": 1.4782010530370294e-05, |
| "loss": 0.2636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25113189220428467, |
| "step": 2620, |
| "valid_targets_mean": 2949.8, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 4.389632107023411, |
| "grad_norm": 0.8992134459024913, |
| "learning_rate": 1.470154679359495e-05, |
| "loss": 0.2412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24360308051109314, |
| "step": 2625, |
| "valid_targets_mean": 2608.5, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 4.39799331103679, |
| "grad_norm": 0.8220794903907007, |
| "learning_rate": 1.4621175185953322e-05, |
| "loss": 0.277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3220457136631012, |
| "step": 2630, |
| "valid_targets_mean": 4098.1, |
| "valid_targets_min": 403 |
| }, |
| { |
| "epoch": 4.406354515050167, |
| "grad_norm": 0.8521683178016516, |
| "learning_rate": 1.4540897104941307e-05, |
| "loss": 0.2753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3359491527080536, |
| "step": 2635, |
| "valid_targets_mean": 3451.1, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 4.414715719063545, |
| "grad_norm": 0.8796923872304094, |
| "learning_rate": 1.4460713946428553e-05, |
| "loss": 0.2772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24371229112148285, |
| "step": 2640, |
| "valid_targets_mean": 2400.8, |
| "valid_targets_min": 1000 |
| }, |
| { |
| "epoch": 4.423076923076923, |
| "grad_norm": 1.0131860235742853, |
| "learning_rate": 1.4380627104634224e-05, |
| "loss": 0.2554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3007010817527771, |
| "step": 2645, |
| "valid_targets_mean": 2731.2, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 4.431438127090301, |
| "grad_norm": 0.7392458747612428, |
| "learning_rate": 1.4300637972102721e-05, |
| "loss": 0.2702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3089587688446045, |
| "step": 2650, |
| "valid_targets_mean": 4641.4, |
| "valid_targets_min": 1954 |
| }, |
| { |
| "epoch": 4.4397993311036785, |
| "grad_norm": 0.8818880175089461, |
| "learning_rate": 1.4220747939679478e-05, |
| "loss": 0.2579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2619357407093048, |
| "step": 2655, |
| "valid_targets_mean": 3080.8, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 4.448160535117057, |
| "grad_norm": 0.9056508130411561, |
| "learning_rate": 1.414095839648679e-05, |
| "loss": 0.2827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25068965554237366, |
| "step": 2660, |
| "valid_targets_mean": 2617.4, |
| "valid_targets_min": 1481 |
| }, |
| { |
| "epoch": 4.456521739130435, |
| "grad_norm": 0.8935220051791342, |
| "learning_rate": 1.4061270729899663e-05, |
| "loss": 0.2726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26286935806274414, |
| "step": 2665, |
| "valid_targets_mean": 2883.9, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 4.464882943143813, |
| "grad_norm": 0.8961547416267401, |
| "learning_rate": 1.3981686325521647e-05, |
| "loss": 0.2768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29072946310043335, |
| "step": 2670, |
| "valid_targets_mean": 2993.4, |
| "valid_targets_min": 1894 |
| }, |
| { |
| "epoch": 4.473244147157191, |
| "grad_norm": 0.9599671002081342, |
| "learning_rate": 1.3902206567160827e-05, |
| "loss": 0.2455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28398674726486206, |
| "step": 2675, |
| "valid_targets_mean": 2923.8, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 4.481605351170568, |
| "grad_norm": 0.8341406674593823, |
| "learning_rate": 1.3822832836805667e-05, |
| "loss": 0.3141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3429492115974426, |
| "step": 2680, |
| "valid_targets_mean": 3562.8, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 4.489966555183947, |
| "grad_norm": 0.8660387274121687, |
| "learning_rate": 1.3743566514601037e-05, |
| "loss": 0.2615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28438010811805725, |
| "step": 2685, |
| "valid_targets_mean": 3383.6, |
| "valid_targets_min": 1276 |
| }, |
| { |
| "epoch": 4.498327759197324, |
| "grad_norm": 0.8240982742485928, |
| "learning_rate": 1.3664408978824209e-05, |
| "loss": 0.2648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2728864550590515, |
| "step": 2690, |
| "valid_targets_mean": 3949.8, |
| "valid_targets_min": 1505 |
| }, |
| { |
| "epoch": 4.506688963210703, |
| "grad_norm": 0.9047049810271199, |
| "learning_rate": 1.3585361605860863e-05, |
| "loss": 0.2831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2605753540992737, |
| "step": 2695, |
| "valid_targets_mean": 2817.6, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 4.51505016722408, |
| "grad_norm": 0.8397078739499565, |
| "learning_rate": 1.3506425770181211e-05, |
| "loss": 0.2871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24365462362766266, |
| "step": 2700, |
| "valid_targets_mean": 2901.8, |
| "valid_targets_min": 2041 |
| }, |
| { |
| "epoch": 4.523411371237458, |
| "grad_norm": 0.8582678085193816, |
| "learning_rate": 1.342760284431603e-05, |
| "loss": 0.3192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2986323833465576, |
| "step": 2705, |
| "valid_targets_mean": 3100.2, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 4.531772575250836, |
| "grad_norm": 0.7889072695692275, |
| "learning_rate": 1.3348894198832845e-05, |
| "loss": 0.2708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26328298449516296, |
| "step": 2710, |
| "valid_targets_mean": 3108.0, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 4.540133779264214, |
| "grad_norm": 0.742736182328933, |
| "learning_rate": 1.3270301202312075e-05, |
| "loss": 0.2846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37916791439056396, |
| "step": 2715, |
| "valid_targets_mean": 5153.8, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 4.548494983277592, |
| "grad_norm": 0.9919759799813364, |
| "learning_rate": 1.3191825221323246e-05, |
| "loss": 0.2655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30372777581214905, |
| "step": 2720, |
| "valid_targets_mean": 2784.2, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 4.55685618729097, |
| "grad_norm": 0.794724468575154, |
| "learning_rate": 1.311346762040123e-05, |
| "loss": 0.276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2651178538799286, |
| "step": 2725, |
| "valid_targets_mean": 3715.1, |
| "valid_targets_min": 983 |
| }, |
| { |
| "epoch": 4.565217391304348, |
| "grad_norm": 0.9806561211664588, |
| "learning_rate": 1.3035229762022513e-05, |
| "loss": 0.2577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2600407600402832, |
| "step": 2730, |
| "valid_targets_mean": 2778.1, |
| "valid_targets_min": 520 |
| }, |
| { |
| "epoch": 4.573578595317725, |
| "grad_norm": 0.8400790069869569, |
| "learning_rate": 1.2957113006581494e-05, |
| "loss": 0.2809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30648618936538696, |
| "step": 2735, |
| "valid_targets_mean": 3071.6, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 4.581939799331104, |
| "grad_norm": 0.912124026132302, |
| "learning_rate": 1.2879118712366858e-05, |
| "loss": 0.2922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3389705717563629, |
| "step": 2740, |
| "valid_targets_mean": 3479.6, |
| "valid_targets_min": 1737 |
| }, |
| { |
| "epoch": 4.590301003344481, |
| "grad_norm": 0.7136031625832305, |
| "learning_rate": 1.280124823553794e-05, |
| "loss": 0.2648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26324355602264404, |
| "step": 2745, |
| "valid_targets_mean": 4402.9, |
| "valid_targets_min": 1958 |
| }, |
| { |
| "epoch": 4.59866220735786, |
| "grad_norm": 0.8876231778745343, |
| "learning_rate": 1.2723502930101126e-05, |
| "loss": 0.3051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3144656717777252, |
| "step": 2750, |
| "valid_targets_mean": 4292.6, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 4.607023411371237, |
| "grad_norm": 0.9123329157042492, |
| "learning_rate": 1.2645884147886376e-05, |
| "loss": 0.2452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22034093737602234, |
| "step": 2755, |
| "valid_targets_mean": 3341.9, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 4.615384615384615, |
| "grad_norm": 0.8627497975800223, |
| "learning_rate": 1.2568393238523627e-05, |
| "loss": 0.2905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28283166885375977, |
| "step": 2760, |
| "valid_targets_mean": 3059.2, |
| "valid_targets_min": 1435 |
| }, |
| { |
| "epoch": 4.6237458193979935, |
| "grad_norm": 0.8879285250035446, |
| "learning_rate": 1.2491031549419396e-05, |
| "loss": 0.2594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28905028104782104, |
| "step": 2765, |
| "valid_targets_mean": 3173.9, |
| "valid_targets_min": 1069 |
| }, |
| { |
| "epoch": 4.632107023411371, |
| "grad_norm": 0.7869539440700758, |
| "learning_rate": 1.2413800425733324e-05, |
| "loss": 0.2637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23459485173225403, |
| "step": 2770, |
| "valid_targets_mean": 3455.7, |
| "valid_targets_min": 1705 |
| }, |
| { |
| "epoch": 4.6404682274247495, |
| "grad_norm": 0.874081153668911, |
| "learning_rate": 1.2336701210354774e-05, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26058483123779297, |
| "step": 2775, |
| "valid_targets_mean": 3799.4, |
| "valid_targets_min": 2140 |
| }, |
| { |
| "epoch": 4.648829431438127, |
| "grad_norm": 0.8505418138060274, |
| "learning_rate": 1.2259735243879533e-05, |
| "loss": 0.271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2382025420665741, |
| "step": 2780, |
| "valid_targets_mean": 2949.2, |
| "valid_targets_min": 1662 |
| }, |
| { |
| "epoch": 4.657190635451505, |
| "grad_norm": 0.8408719538127842, |
| "learning_rate": 1.2182903864586424e-05, |
| "loss": 0.311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3271663188934326, |
| "step": 2785, |
| "valid_targets_mean": 3384.8, |
| "valid_targets_min": 1772 |
| }, |
| { |
| "epoch": 4.665551839464883, |
| "grad_norm": 0.7906487246754133, |
| "learning_rate": 1.2106208408414101e-05, |
| "loss": 0.261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23760370910167694, |
| "step": 2790, |
| "valid_targets_mean": 3003.1, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 4.673913043478261, |
| "grad_norm": 0.7560469434433705, |
| "learning_rate": 1.202965020893779e-05, |
| "loss": 0.2795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3065562844276428, |
| "step": 2795, |
| "valid_targets_mean": 4305.3, |
| "valid_targets_min": 1436 |
| }, |
| { |
| "epoch": 4.682274247491639, |
| "grad_norm": 0.931404543547185, |
| "learning_rate": 1.1953230597346116e-05, |
| "loss": 0.2814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30321380496025085, |
| "step": 2800, |
| "valid_targets_mean": 3184.8, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 4.690635451505017, |
| "grad_norm": 0.8785086713293649, |
| "learning_rate": 1.1876950902417921e-05, |
| "loss": 0.311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2660791277885437, |
| "step": 2805, |
| "valid_targets_mean": 2884.8, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 4.698996655518394, |
| "grad_norm": 0.8658447278693211, |
| "learning_rate": 1.1800812450499227e-05, |
| "loss": 0.2447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24090614914894104, |
| "step": 2810, |
| "valid_targets_mean": 2715.7, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 4.707357859531773, |
| "grad_norm": 1.0374938153628415, |
| "learning_rate": 1.1724816565480092e-05, |
| "loss": 0.2597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20534390211105347, |
| "step": 2815, |
| "valid_targets_mean": 2147.6, |
| "valid_targets_min": 401 |
| }, |
| { |
| "epoch": 4.7157190635451505, |
| "grad_norm": 0.7920774633218928, |
| "learning_rate": 1.1648964568771661e-05, |
| "loss": 0.2632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18782053887844086, |
| "step": 2820, |
| "valid_targets_mean": 3404.8, |
| "valid_targets_min": 2009 |
| }, |
| { |
| "epoch": 4.724080267558528, |
| "grad_norm": 0.8633417845835815, |
| "learning_rate": 1.157325777928314e-05, |
| "loss": 0.2725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30495747923851013, |
| "step": 2825, |
| "valid_targets_mean": 3513.8, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 4.7324414715719065, |
| "grad_norm": 0.9344722457587161, |
| "learning_rate": 1.149769751339889e-05, |
| "loss": 0.2654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2682046592235565, |
| "step": 2830, |
| "valid_targets_mean": 3535.4, |
| "valid_targets_min": 1574 |
| }, |
| { |
| "epoch": 4.740802675585284, |
| "grad_norm": 0.9085942238263078, |
| "learning_rate": 1.142228508495553e-05, |
| "loss": 0.2743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27757948637008667, |
| "step": 2835, |
| "valid_targets_mean": 2801.4, |
| "valid_targets_min": 1637 |
| }, |
| { |
| "epoch": 4.749163879598662, |
| "grad_norm": 0.9016528116196614, |
| "learning_rate": 1.1347021805219092e-05, |
| "loss": 0.281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24009665846824646, |
| "step": 2840, |
| "valid_targets_mean": 2991.9, |
| "valid_targets_min": 962 |
| }, |
| { |
| "epoch": 4.75752508361204, |
| "grad_norm": 0.8216538528179507, |
| "learning_rate": 1.1271908982862214e-05, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2618323862552643, |
| "step": 2845, |
| "valid_targets_mean": 4103.2, |
| "valid_targets_min": 1949 |
| }, |
| { |
| "epoch": 4.765886287625418, |
| "grad_norm": 1.0231544478271972, |
| "learning_rate": 1.11969479239414e-05, |
| "loss": 0.2577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30647069215774536, |
| "step": 2850, |
| "valid_targets_mean": 2558.7, |
| "valid_targets_min": 364 |
| }, |
| { |
| "epoch": 4.774247491638796, |
| "grad_norm": 2.596885204828478, |
| "learning_rate": 1.1122139931874303e-05, |
| "loss": 0.3129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3939549922943115, |
| "step": 2855, |
| "valid_targets_mean": 4341.0, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 4.782608695652174, |
| "grad_norm": 0.9290067746793299, |
| "learning_rate": 1.104748630741705e-05, |
| "loss": 0.3034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30313026905059814, |
| "step": 2860, |
| "valid_targets_mean": 2781.0, |
| "valid_targets_min": 392 |
| }, |
| { |
| "epoch": 4.790969899665551, |
| "grad_norm": 1.7683165858974776, |
| "learning_rate": 1.0972988348641643e-05, |
| "loss": 0.2548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22824634611606598, |
| "step": 2865, |
| "valid_targets_mean": 2794.6, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 4.79933110367893, |
| "grad_norm": 0.8612735757395678, |
| "learning_rate": 1.0898647350913376e-05, |
| "loss": 0.2637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24694600701332092, |
| "step": 2870, |
| "valid_targets_mean": 3144.4, |
| "valid_targets_min": 1359 |
| }, |
| { |
| "epoch": 4.8076923076923075, |
| "grad_norm": 0.883437344029108, |
| "learning_rate": 1.0824464606868323e-05, |
| "loss": 0.2571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24586498737335205, |
| "step": 2875, |
| "valid_targets_mean": 3431.4, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 4.816053511705686, |
| "grad_norm": 1.0330995770490803, |
| "learning_rate": 1.0750441406390841e-05, |
| "loss": 0.2459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2311995029449463, |
| "step": 2880, |
| "valid_targets_mean": 2488.1, |
| "valid_targets_min": 1242 |
| }, |
| { |
| "epoch": 4.8244147157190636, |
| "grad_norm": 0.958681058026221, |
| "learning_rate": 1.0676579036591167e-05, |
| "loss": 0.2742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2965131998062134, |
| "step": 2885, |
| "valid_targets_mean": 3851.2, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 4.832775919732441, |
| "grad_norm": 0.788119350116846, |
| "learning_rate": 1.0602878781783019e-05, |
| "loss": 0.2932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.328529953956604, |
| "step": 2890, |
| "valid_targets_mean": 3779.6, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 4.84113712374582, |
| "grad_norm": 0.8696431488480126, |
| "learning_rate": 1.0529341923461272e-05, |
| "loss": 0.2744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26618334650993347, |
| "step": 2895, |
| "valid_targets_mean": 3219.2, |
| "valid_targets_min": 1480 |
| }, |
| { |
| "epoch": 4.849498327759197, |
| "grad_norm": 0.9950302873697183, |
| "learning_rate": 1.0455969740279675e-05, |
| "loss": 0.271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28443658351898193, |
| "step": 2900, |
| "valid_targets_mean": 2625.2, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 4.857859531772576, |
| "grad_norm": 0.9363541770349809, |
| "learning_rate": 1.0382763508028615e-05, |
| "loss": 0.256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23824138939380646, |
| "step": 2905, |
| "valid_targets_mean": 2914.6, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 4.866220735785953, |
| "grad_norm": 0.9212980221737899, |
| "learning_rate": 1.0309724499612939e-05, |
| "loss": 0.2566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30664288997650146, |
| "step": 2910, |
| "valid_targets_mean": 3167.0, |
| "valid_targets_min": 1422 |
| }, |
| { |
| "epoch": 4.874581939799331, |
| "grad_norm": 0.9658354985211547, |
| "learning_rate": 1.0236853985029815e-05, |
| "loss": 0.2841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2978072762489319, |
| "step": 2915, |
| "valid_targets_mean": 4677.4, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 4.882943143812709, |
| "grad_norm": 0.8858319243242195, |
| "learning_rate": 1.0164153231346656e-05, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24526861310005188, |
| "step": 2920, |
| "valid_targets_mean": 3126.1, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 4.891304347826087, |
| "grad_norm": 1.0526204864364126, |
| "learning_rate": 1.0091623502679075e-05, |
| "loss": 0.3037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3539399802684784, |
| "step": 2925, |
| "valid_targets_mean": 3289.9, |
| "valid_targets_min": 1212 |
| }, |
| { |
| "epoch": 4.8996655518394645, |
| "grad_norm": 0.885379966379974, |
| "learning_rate": 1.0019266060168929e-05, |
| "loss": 0.2934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30143141746520996, |
| "step": 2930, |
| "valid_targets_mean": 3651.1, |
| "valid_targets_min": 1477 |
| }, |
| { |
| "epoch": 4.908026755852843, |
| "grad_norm": 1.1625828671998966, |
| "learning_rate": 9.947082161962363e-06, |
| "loss": 0.248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24516814947128296, |
| "step": 2935, |
| "valid_targets_mean": 2769.2, |
| "valid_targets_min": 569 |
| }, |
| { |
| "epoch": 4.916387959866221, |
| "grad_norm": 0.8652972290357003, |
| "learning_rate": 9.875073063187947e-06, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26153671741485596, |
| "step": 2940, |
| "valid_targets_mean": 3214.2, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 4.924749163879599, |
| "grad_norm": 0.9078402224774373, |
| "learning_rate": 9.803240015934859e-06, |
| "loss": 0.3063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2811887264251709, |
| "step": 2945, |
| "valid_targets_mean": 3040.2, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 4.933110367892977, |
| "grad_norm": 0.855619293705552, |
| "learning_rate": 9.731584269231094e-06, |
| "loss": 0.2411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24628743529319763, |
| "step": 2950, |
| "valid_targets_mean": 3259.8, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 4.941471571906354, |
| "grad_norm": 0.9213152242653578, |
| "learning_rate": 9.660107069021767e-06, |
| "loss": 0.2783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33864572644233704, |
| "step": 2955, |
| "valid_targets_mean": 3462.7, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 4.949832775919733, |
| "grad_norm": 0.8302602925046146, |
| "learning_rate": 9.588809658147433e-06, |
| "loss": 0.2748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28112542629241943, |
| "step": 2960, |
| "valid_targets_mean": 3587.3, |
| "valid_targets_min": 1509 |
| }, |
| { |
| "epoch": 4.95819397993311, |
| "grad_norm": 0.9191160601073972, |
| "learning_rate": 9.517693276322488e-06, |
| "loss": 0.2888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26543906331062317, |
| "step": 2965, |
| "valid_targets_mean": 2759.7, |
| "valid_targets_min": 520 |
| }, |
| { |
| "epoch": 4.966555183946488, |
| "grad_norm": 0.9353550508600107, |
| "learning_rate": 9.446759160113602e-06, |
| "loss": 0.2826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2775583863258362, |
| "step": 2970, |
| "valid_targets_mean": 2901.1, |
| "valid_targets_min": 1694 |
| }, |
| { |
| "epoch": 4.974916387959866, |
| "grad_norm": 0.9139877304453574, |
| "learning_rate": 9.376008542918227e-06, |
| "loss": 0.2281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19975979626178741, |
| "step": 2975, |
| "valid_targets_mean": 2663.2, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 4.983277591973244, |
| "grad_norm": 0.922883713258425, |
| "learning_rate": 9.305442654943145e-06, |
| "loss": 0.2498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2600483000278473, |
| "step": 2980, |
| "valid_targets_mean": 2795.2, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 4.991638795986622, |
| "grad_norm": 0.9322875420888264, |
| "learning_rate": 9.235062723183076e-06, |
| "loss": 0.2583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2565094232559204, |
| "step": 2985, |
| "valid_targets_mean": 2820.6, |
| "valid_targets_min": 1321 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.7643560224911901, |
| "learning_rate": 9.164869971399359e-06, |
| "loss": 0.2743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3641391396522522, |
| "step": 2990, |
| "valid_targets_mean": 4868.6, |
| "valid_targets_min": 1329 |
| }, |
| { |
| "epoch": 5.008361204013378, |
| "grad_norm": 0.8481755315514735, |
| "learning_rate": 9.094865620098646e-06, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22899624705314636, |
| "step": 2995, |
| "valid_targets_mean": 3174.0, |
| "valid_targets_min": 1965 |
| }, |
| { |
| "epoch": 5.016722408026756, |
| "grad_norm": 0.8188076252143365, |
| "learning_rate": 9.025050886511702e-06, |
| "loss": 0.2747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3067629039287567, |
| "step": 3000, |
| "valid_targets_mean": 4291.9, |
| "valid_targets_min": 1704 |
| }, |
| { |
| "epoch": 5.025083612040134, |
| "grad_norm": 0.8029644241788463, |
| "learning_rate": 8.955426984572228e-06, |
| "loss": 0.2581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3037480115890503, |
| "step": 3005, |
| "valid_targets_mean": 4106.2, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 5.033444816053512, |
| "grad_norm": 0.8661738149420555, |
| "learning_rate": 8.885995124895768e-06, |
| "loss": 0.2402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2674838900566101, |
| "step": 3010, |
| "valid_targets_mean": 3359.9, |
| "valid_targets_min": 1500 |
| }, |
| { |
| "epoch": 5.04180602006689, |
| "grad_norm": 0.9620964614380081, |
| "learning_rate": 8.816756514758634e-06, |
| "loss": 0.2832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2533591389656067, |
| "step": 3015, |
| "valid_targets_mean": 3118.5, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 5.050167224080267, |
| "grad_norm": 0.7541256752914219, |
| "learning_rate": 8.747712358076936e-06, |
| "loss": 0.2311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24237793684005737, |
| "step": 3020, |
| "valid_targets_mean": 4191.6, |
| "valid_targets_min": 1668 |
| }, |
| { |
| "epoch": 5.058528428093646, |
| "grad_norm": 0.9025605491692672, |
| "learning_rate": 8.678863855385646e-06, |
| "loss": 0.2646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33202728629112244, |
| "step": 3025, |
| "valid_targets_mean": 4466.5, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 5.066889632107023, |
| "grad_norm": 0.8425388830294137, |
| "learning_rate": 8.61021220381771e-06, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3084254860877991, |
| "step": 3030, |
| "valid_targets_mean": 4306.9, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 5.075250836120401, |
| "grad_norm": 0.8389860612401873, |
| "learning_rate": 8.54175859708324e-06, |
| "loss": 0.2322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22211232781410217, |
| "step": 3035, |
| "valid_targets_mean": 3588.2, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 5.083612040133779, |
| "grad_norm": 0.9514036120737082, |
| "learning_rate": 8.473504225448765e-06, |
| "loss": 0.257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2409243881702423, |
| "step": 3040, |
| "valid_targets_mean": 2856.7, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 5.091973244147157, |
| "grad_norm": 0.9560659512366602, |
| "learning_rate": 8.405450275716525e-06, |
| "loss": 0.2544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2601991891860962, |
| "step": 3045, |
| "valid_targets_mean": 3723.9, |
| "valid_targets_min": 1569 |
| }, |
| { |
| "epoch": 5.1003344481605355, |
| "grad_norm": 0.9864743563923629, |
| "learning_rate": 8.337597931203836e-06, |
| "loss": 0.239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3188202381134033, |
| "step": 3050, |
| "valid_targets_mean": 3242.7, |
| "valid_targets_min": 1154 |
| }, |
| { |
| "epoch": 5.108695652173913, |
| "grad_norm": 1.1490912764067835, |
| "learning_rate": 8.269948371722518e-06, |
| "loss": 0.2602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21089932322502136, |
| "step": 3055, |
| "valid_targets_mean": 2516.8, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 5.117056856187291, |
| "grad_norm": 0.8194749944721579, |
| "learning_rate": 8.20250277355838e-06, |
| "loss": 0.2787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3658130168914795, |
| "step": 3060, |
| "valid_targets_mean": 4739.9, |
| "valid_targets_min": 1512 |
| }, |
| { |
| "epoch": 5.125418060200669, |
| "grad_norm": 0.9728259830553914, |
| "learning_rate": 8.135262309450764e-06, |
| "loss": 0.2707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27498018741607666, |
| "step": 3065, |
| "valid_targets_mean": 3150.4, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 5.133779264214047, |
| "grad_norm": 1.0179078265962471, |
| "learning_rate": 8.068228148572157e-06, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19528654217720032, |
| "step": 3070, |
| "valid_targets_mean": 2590.3, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 5.142140468227424, |
| "grad_norm": 1.0414753424178975, |
| "learning_rate": 8.001401456507858e-06, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24913433194160461, |
| "step": 3075, |
| "valid_targets_mean": 2828.6, |
| "valid_targets_min": 1509 |
| }, |
| { |
| "epoch": 5.150501672240803, |
| "grad_norm": 0.9673371238498945, |
| "learning_rate": 7.934783395235716e-06, |
| "loss": 0.253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2619754672050476, |
| "step": 3080, |
| "valid_targets_mean": 3273.0, |
| "valid_targets_min": 1547 |
| }, |
| { |
| "epoch": 5.15886287625418, |
| "grad_norm": 1.0777145808692163, |
| "learning_rate": 7.868375123105921e-06, |
| "loss": 0.29, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.241988867521286, |
| "step": 3085, |
| "valid_targets_mean": 2760.0, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 5.167224080267559, |
| "grad_norm": 0.9357681236144693, |
| "learning_rate": 7.802177794820857e-06, |
| "loss": 0.2851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4071310758590698, |
| "step": 3090, |
| "valid_targets_mean": 3665.1, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 5.1755852842809364, |
| "grad_norm": 0.8810724848053256, |
| "learning_rate": 7.736192561415045e-06, |
| "loss": 0.2883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3404349386692047, |
| "step": 3095, |
| "valid_targets_mean": 3941.1, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 5.183946488294314, |
| "grad_norm": 0.9345756552103464, |
| "learning_rate": 7.670420570235113e-06, |
| "loss": 0.2718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20666499435901642, |
| "step": 3100, |
| "valid_targets_mean": 2741.7, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 5.1923076923076925, |
| "grad_norm": 0.89831218286986, |
| "learning_rate": 7.604862964919819e-06, |
| "loss": 0.2531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26516643166542053, |
| "step": 3105, |
| "valid_targets_mean": 3194.3, |
| "valid_targets_min": 1893 |
| }, |
| { |
| "epoch": 5.20066889632107, |
| "grad_norm": 1.0235151109065963, |
| "learning_rate": 7.539520885380242e-06, |
| "loss": 0.2647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23447315394878387, |
| "step": 3110, |
| "valid_targets_mean": 2732.0, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 5.209030100334449, |
| "grad_norm": 1.0527575176171846, |
| "learning_rate": 7.474395467779885e-06, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24746760725975037, |
| "step": 3115, |
| "valid_targets_mean": 3079.3, |
| "valid_targets_min": 1647 |
| }, |
| { |
| "epoch": 5.217391304347826, |
| "grad_norm": 0.8412479852328654, |
| "learning_rate": 7.409487844514946e-06, |
| "loss": 0.2765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2139432430267334, |
| "step": 3120, |
| "valid_targets_mean": 3529.4, |
| "valid_targets_min": 2262 |
| }, |
| { |
| "epoch": 5.225752508361204, |
| "grad_norm": 0.8859243166629239, |
| "learning_rate": 7.344799144194647e-06, |
| "loss": 0.2646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30506086349487305, |
| "step": 3125, |
| "valid_targets_mean": 4511.6, |
| "valid_targets_min": 1709 |
| }, |
| { |
| "epoch": 5.234113712374582, |
| "grad_norm": 0.928318267325103, |
| "learning_rate": 7.280330491621579e-06, |
| "loss": 0.265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25192520022392273, |
| "step": 3130, |
| "valid_targets_mean": 3102.3, |
| "valid_targets_min": 1604 |
| }, |
| { |
| "epoch": 5.24247491638796, |
| "grad_norm": 0.8514180338596942, |
| "learning_rate": 7.2160830077721655e-06, |
| "loss": 0.2806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42115187644958496, |
| "step": 3135, |
| "valid_targets_mean": 4393.4, |
| "valid_targets_min": 2044 |
| }, |
| { |
| "epoch": 5.250836120401337, |
| "grad_norm": 0.8701754054847802, |
| "learning_rate": 7.15205780977716e-06, |
| "loss": 0.2483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23187309503555298, |
| "step": 3140, |
| "valid_targets_mean": 3508.4, |
| "valid_targets_min": 1806 |
| }, |
| { |
| "epoch": 5.259197324414716, |
| "grad_norm": 1.0414461577784981, |
| "learning_rate": 7.0882560109022255e-06, |
| "loss": 0.2487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2434636354446411, |
| "step": 3145, |
| "valid_targets_mean": 2689.4, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 5.2675585284280935, |
| "grad_norm": 0.9992819578511724, |
| "learning_rate": 7.02467872052858e-06, |
| "loss": 0.2108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20966418087482452, |
| "step": 3150, |
| "valid_targets_mean": 3109.2, |
| "valid_targets_min": 1471 |
| }, |
| { |
| "epoch": 5.275919732441472, |
| "grad_norm": 0.9478720751528437, |
| "learning_rate": 6.9613270441337075e-06, |
| "loss": 0.2412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22975382208824158, |
| "step": 3155, |
| "valid_targets_mean": 3196.7, |
| "valid_targets_min": 1774 |
| }, |
| { |
| "epoch": 5.2842809364548495, |
| "grad_norm": 0.8672829908504149, |
| "learning_rate": 6.8982020832721054e-06, |
| "loss": 0.2426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22695282101631165, |
| "step": 3160, |
| "valid_targets_mean": 3513.6, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 5.292642140468227, |
| "grad_norm": 1.022405240131088, |
| "learning_rate": 6.835304935556198e-06, |
| "loss": 0.2525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2423592507839203, |
| "step": 3165, |
| "valid_targets_mean": 3192.9, |
| "valid_targets_min": 1355 |
| }, |
| { |
| "epoch": 5.301003344481606, |
| "grad_norm": 1.081711172053293, |
| "learning_rate": 6.772636694637183e-06, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25607234239578247, |
| "step": 3170, |
| "valid_targets_mean": 2742.1, |
| "valid_targets_min": 1670 |
| }, |
| { |
| "epoch": 5.309364548494983, |
| "grad_norm": 0.959669265454484, |
| "learning_rate": 6.710198450186047e-06, |
| "loss": 0.2657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2445649951696396, |
| "step": 3175, |
| "valid_targets_mean": 2531.1, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 5.317725752508361, |
| "grad_norm": 1.0556452222632704, |
| "learning_rate": 6.6479912878746225e-06, |
| "loss": 0.2698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32292306423187256, |
| "step": 3180, |
| "valid_targets_mean": 3753.7, |
| "valid_targets_min": 1316 |
| }, |
| { |
| "epoch": 5.326086956521739, |
| "grad_norm": 1.110335544316918, |
| "learning_rate": 6.586016289356692e-06, |
| "loss": 0.2582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20516835153102875, |
| "step": 3185, |
| "valid_targets_mean": 2823.1, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 5.334448160535117, |
| "grad_norm": 0.9443496373098136, |
| "learning_rate": 6.524274532249195e-06, |
| "loss": 0.2247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2695116698741913, |
| "step": 3190, |
| "valid_targets_mean": 2830.7, |
| "valid_targets_min": 595 |
| }, |
| { |
| "epoch": 5.342809364548495, |
| "grad_norm": 1.2883459095067469, |
| "learning_rate": 6.462767090113486e-06, |
| "loss": 0.2514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21128371357917786, |
| "step": 3195, |
| "valid_targets_mean": 2801.6, |
| "valid_targets_min": 1972 |
| }, |
| { |
| "epoch": 5.351170568561873, |
| "grad_norm": 0.7305670443838644, |
| "learning_rate": 6.401495032436667e-06, |
| "loss": 0.2613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34377604722976685, |
| "step": 3200, |
| "valid_targets_mean": 5868.9, |
| "valid_targets_min": 1873 |
| }, |
| { |
| "epoch": 5.3595317725752505, |
| "grad_norm": 0.9618080510519665, |
| "learning_rate": 6.34045942461299e-06, |
| "loss": 0.2266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20367145538330078, |
| "step": 3205, |
| "valid_targets_mean": 2934.6, |
| "valid_targets_min": 1274 |
| }, |
| { |
| "epoch": 5.367892976588629, |
| "grad_norm": 0.9183980494977025, |
| "learning_rate": 6.279661327925333e-06, |
| "loss": 0.2591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24812433123588562, |
| "step": 3210, |
| "valid_targets_mean": 3023.1, |
| "valid_targets_min": 1477 |
| }, |
| { |
| "epoch": 5.3762541806020065, |
| "grad_norm": 0.9596558209841023, |
| "learning_rate": 6.219101799526753e-06, |
| "loss": 0.2541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33065247535705566, |
| "step": 3215, |
| "valid_targets_mean": 4098.1, |
| "valid_targets_min": 1177 |
| }, |
| { |
| "epoch": 5.384615384615385, |
| "grad_norm": 1.065383634447373, |
| "learning_rate": 6.158781892422085e-06, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2475639134645462, |
| "step": 3220, |
| "valid_targets_mean": 2772.1, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 5.392976588628763, |
| "grad_norm": 1.044424208460433, |
| "learning_rate": 6.098702655449664e-06, |
| "loss": 0.2439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2278965413570404, |
| "step": 3225, |
| "valid_targets_mean": 2502.4, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 5.40133779264214, |
| "grad_norm": 0.9665704851257386, |
| "learning_rate": 6.038865133263054e-06, |
| "loss": 0.2448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31926289200782776, |
| "step": 3230, |
| "valid_targets_mean": 3628.5, |
| "valid_targets_min": 1750 |
| }, |
| { |
| "epoch": 5.409698996655519, |
| "grad_norm": 0.964435362243508, |
| "learning_rate": 5.9792703663129125e-06, |
| "loss": 0.2289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21948401629924774, |
| "step": 3235, |
| "valid_targets_mean": 2733.2, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 5.418060200668896, |
| "grad_norm": 0.9794403625903487, |
| "learning_rate": 5.919919390828859e-06, |
| "loss": 0.2556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22015729546546936, |
| "step": 3240, |
| "valid_targets_mean": 2922.4, |
| "valid_targets_min": 1575 |
| }, |
| { |
| "epoch": 5.426421404682274, |
| "grad_norm": 0.9982047586124657, |
| "learning_rate": 5.860813238801523e-06, |
| "loss": 0.2553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21148087084293365, |
| "step": 3245, |
| "valid_targets_mean": 3052.9, |
| "valid_targets_min": 1548 |
| }, |
| { |
| "epoch": 5.434782608695652, |
| "grad_norm": 0.8716785695051501, |
| "learning_rate": 5.801952937964537e-06, |
| "loss": 0.2537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23328334093093872, |
| "step": 3250, |
| "valid_targets_mean": 3625.8, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 5.44314381270903, |
| "grad_norm": 1.0317002727776252, |
| "learning_rate": 5.743339511776693e-06, |
| "loss": 0.2525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26123955845832825, |
| "step": 3255, |
| "valid_targets_mean": 3316.4, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 5.451505016722408, |
| "grad_norm": 0.8933485431020612, |
| "learning_rate": 5.684973979404144e-06, |
| "loss": 0.2154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23536235094070435, |
| "step": 3260, |
| "valid_targets_mean": 3289.2, |
| "valid_targets_min": 1411 |
| }, |
| { |
| "epoch": 5.459866220735786, |
| "grad_norm": 0.9330309774110559, |
| "learning_rate": 5.6268573557026865e-06, |
| "loss": 0.274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25734925270080566, |
| "step": 3265, |
| "valid_targets_mean": 3473.9, |
| "valid_targets_min": 1469 |
| }, |
| { |
| "epoch": 5.468227424749164, |
| "grad_norm": 1.0119464981075554, |
| "learning_rate": 5.568990651200108e-06, |
| "loss": 0.2646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2644900977611542, |
| "step": 3270, |
| "valid_targets_mean": 3406.8, |
| "valid_targets_min": 569 |
| }, |
| { |
| "epoch": 5.476588628762542, |
| "grad_norm": 1.0468454697016878, |
| "learning_rate": 5.511374872078616e-06, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29436013102531433, |
| "step": 3275, |
| "valid_targets_mean": 3085.1, |
| "valid_targets_min": 1665 |
| }, |
| { |
| "epoch": 5.48494983277592, |
| "grad_norm": 0.9588401461605252, |
| "learning_rate": 5.454011020157348e-06, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21803942322731018, |
| "step": 3280, |
| "valid_targets_mean": 3367.6, |
| "valid_targets_min": 1776 |
| }, |
| { |
| "epoch": 5.493311036789297, |
| "grad_norm": 0.8920342971378608, |
| "learning_rate": 5.396900092874953e-06, |
| "loss": 0.2525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20749205350875854, |
| "step": 3285, |
| "valid_targets_mean": 3192.9, |
| "valid_targets_min": 1668 |
| }, |
| { |
| "epoch": 5.501672240802676, |
| "grad_norm": 0.8025673440389024, |
| "learning_rate": 5.340043083272239e-06, |
| "loss": 0.2647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25130224227905273, |
| "step": 3290, |
| "valid_targets_mean": 3616.1, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 5.510033444816053, |
| "grad_norm": 1.0290460488107447, |
| "learning_rate": 5.283440979974901e-06, |
| "loss": 0.2353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.255595326423645, |
| "step": 3295, |
| "valid_targets_mean": 3070.9, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 5.518394648829432, |
| "grad_norm": 0.9036243917362351, |
| "learning_rate": 5.227094767176364e-06, |
| "loss": 0.2535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2398861050605774, |
| "step": 3300, |
| "valid_targets_mean": 3360.8, |
| "valid_targets_min": 1448 |
| }, |
| { |
| "epoch": 5.526755852842809, |
| "grad_norm": 0.9707296599929639, |
| "learning_rate": 5.17100542462063e-06, |
| "loss": 0.2485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24867475032806396, |
| "step": 3305, |
| "valid_targets_mean": 3409.8, |
| "valid_targets_min": 1500 |
| }, |
| { |
| "epoch": 5.535117056856187, |
| "grad_norm": 1.0059190414101475, |
| "learning_rate": 5.115173927585264e-06, |
| "loss": 0.2462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20245328545570374, |
| "step": 3310, |
| "valid_targets_mean": 2579.6, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 5.543478260869565, |
| "grad_norm": 1.150440106449695, |
| "learning_rate": 5.059601246864438e-06, |
| "loss": 0.2338, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2849067747592926, |
| "step": 3315, |
| "valid_targets_mean": 3054.2, |
| "valid_targets_min": 1511 |
| }, |
| { |
| "epoch": 5.551839464882943, |
| "grad_norm": 1.082246481751666, |
| "learning_rate": 5.004288348752018e-06, |
| "loss": 0.2211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24570798873901367, |
| "step": 3320, |
| "valid_targets_mean": 3292.1, |
| "valid_targets_min": 1374 |
| }, |
| { |
| "epoch": 5.5602006688963215, |
| "grad_norm": 0.9677466519631982, |
| "learning_rate": 4.949236195024825e-06, |
| "loss": 0.2483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21175232529640198, |
| "step": 3325, |
| "valid_targets_mean": 2859.6, |
| "valid_targets_min": 452 |
| }, |
| { |
| "epoch": 5.568561872909699, |
| "grad_norm": 0.9670337251548189, |
| "learning_rate": 4.894445742925853e-06, |
| "loss": 0.2623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23612819612026215, |
| "step": 3330, |
| "valid_targets_mean": 2778.9, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 5.576923076923077, |
| "grad_norm": 0.9399114769292228, |
| "learning_rate": 4.839917945147647e-06, |
| "loss": 0.2502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24552688002586365, |
| "step": 3335, |
| "valid_targets_mean": 2997.2, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 5.585284280936455, |
| "grad_norm": 0.8414887814395099, |
| "learning_rate": 4.785653749815744e-06, |
| "loss": 0.2561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29480239748954773, |
| "step": 3340, |
| "valid_targets_mean": 4310.2, |
| "valid_targets_min": 1636 |
| }, |
| { |
| "epoch": 5.593645484949833, |
| "grad_norm": 0.7931418317297482, |
| "learning_rate": 4.731654100472178e-06, |
| "loss": 0.2583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3128657341003418, |
| "step": 3345, |
| "valid_targets_mean": 4607.0, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 5.602006688963211, |
| "grad_norm": 0.8840163267997618, |
| "learning_rate": 4.677919936059064e-06, |
| "loss": 0.2558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24446120858192444, |
| "step": 3350, |
| "valid_targets_mean": 3667.1, |
| "valid_targets_min": 1631 |
| }, |
| { |
| "epoch": 5.610367892976589, |
| "grad_norm": 0.9191791952149919, |
| "learning_rate": 4.624452190902304e-06, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2651020884513855, |
| "step": 3355, |
| "valid_targets_mean": 3420.4, |
| "valid_targets_min": 1745 |
| }, |
| { |
| "epoch": 5.618729096989966, |
| "grad_norm": 0.9355892323378777, |
| "learning_rate": 4.571251794695308e-06, |
| "loss": 0.2397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29256555438041687, |
| "step": 3360, |
| "valid_targets_mean": 4212.4, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 5.627090301003345, |
| "grad_norm": 1.0090759936821445, |
| "learning_rate": 4.518319672482845e-06, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2667285203933716, |
| "step": 3365, |
| "valid_targets_mean": 2737.7, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 5.635451505016722, |
| "grad_norm": 1.0171835292538327, |
| "learning_rate": 4.465656744644957e-06, |
| "loss": 0.2726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30735355615615845, |
| "step": 3370, |
| "valid_targets_mean": 3446.8, |
| "valid_targets_min": 1726 |
| }, |
| { |
| "epoch": 5.6438127090301, |
| "grad_norm": 0.9819290282194414, |
| "learning_rate": 4.413263926880935e-06, |
| "loss": 0.2608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20418116450309753, |
| "step": 3375, |
| "valid_targets_mean": 3223.5, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 5.6521739130434785, |
| "grad_norm": 0.9512457595996446, |
| "learning_rate": 4.3611421301934435e-06, |
| "loss": 0.2741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2649402320384979, |
| "step": 3380, |
| "valid_targets_mean": 2930.5, |
| "valid_targets_min": 1139 |
| }, |
| { |
| "epoch": 5.660535117056856, |
| "grad_norm": 0.9658417094141116, |
| "learning_rate": 4.309292260872633e-06, |
| "loss": 0.2548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21503464877605438, |
| "step": 3385, |
| "valid_targets_mean": 2954.3, |
| "valid_targets_min": 1684 |
| }, |
| { |
| "epoch": 5.668896321070234, |
| "grad_norm": 1.0062110489738594, |
| "learning_rate": 4.257715220480405e-06, |
| "loss": 0.2721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2543056011199951, |
| "step": 3390, |
| "valid_targets_mean": 3383.0, |
| "valid_targets_min": 1705 |
| }, |
| { |
| "epoch": 5.677257525083612, |
| "grad_norm": 1.0054767456103721, |
| "learning_rate": 4.206411905834733e-06, |
| "loss": 0.2492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3248503506183624, |
| "step": 3395, |
| "valid_targets_mean": 3018.8, |
| "valid_targets_min": 399 |
| }, |
| { |
| "epoch": 5.68561872909699, |
| "grad_norm": 1.085787300697935, |
| "learning_rate": 4.155383208994055e-06, |
| "loss": 0.2578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24291780591011047, |
| "step": 3400, |
| "valid_targets_mean": 3004.7, |
| "valid_targets_min": 1883 |
| }, |
| { |
| "epoch": 5.693979933110368, |
| "grad_norm": 1.0345601696467057, |
| "learning_rate": 4.10463001724178e-06, |
| "loss": 0.2416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24932274222373962, |
| "step": 3405, |
| "valid_targets_mean": 2949.5, |
| "valid_targets_min": 1622 |
| }, |
| { |
| "epoch": 5.702341137123746, |
| "grad_norm": 0.9908894862017844, |
| "learning_rate": 4.054153213070868e-06, |
| "loss": 0.2495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2516738772392273, |
| "step": 3410, |
| "valid_targets_mean": 3543.2, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 5.710702341137123, |
| "grad_norm": 1.0855149671023934, |
| "learning_rate": 4.003953674168455e-06, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2057594358921051, |
| "step": 3415, |
| "valid_targets_mean": 3033.4, |
| "valid_targets_min": 1026 |
| }, |
| { |
| "epoch": 5.719063545150502, |
| "grad_norm": 0.9852747879835021, |
| "learning_rate": 3.954032273400608e-06, |
| "loss": 0.2406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.266365110874176, |
| "step": 3420, |
| "valid_targets_mean": 3131.4, |
| "valid_targets_min": 1591 |
| }, |
| { |
| "epoch": 5.7274247491638794, |
| "grad_norm": 0.8893474256351308, |
| "learning_rate": 3.904389878797159e-06, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2710364758968353, |
| "step": 3425, |
| "valid_targets_mean": 3534.0, |
| "valid_targets_min": 1096 |
| }, |
| { |
| "epoch": 5.735785953177258, |
| "grad_norm": 0.8715257939471994, |
| "learning_rate": 3.85502735353658e-06, |
| "loss": 0.2492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2547582983970642, |
| "step": 3430, |
| "valid_targets_mean": 3161.2, |
| "valid_targets_min": 1420 |
| }, |
| { |
| "epoch": 5.7441471571906355, |
| "grad_norm": 0.9676813409941313, |
| "learning_rate": 3.8059455559310167e-06, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2646714746952057, |
| "step": 3435, |
| "valid_targets_mean": 3319.5, |
| "valid_targets_min": 1710 |
| }, |
| { |
| "epoch": 5.752508361204013, |
| "grad_norm": 0.8470578522309716, |
| "learning_rate": 3.757145339411332e-06, |
| "loss": 0.229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22734609246253967, |
| "step": 3440, |
| "valid_targets_mean": 4302.4, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 5.760869565217392, |
| "grad_norm": 0.853636864130374, |
| "learning_rate": 3.708627552512276e-06, |
| "loss": 0.2301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20801186561584473, |
| "step": 3445, |
| "valid_targets_mean": 3614.8, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 5.769230769230769, |
| "grad_norm": 0.8787913423829194, |
| "learning_rate": 3.660393038857739e-06, |
| "loss": 0.2541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22825166583061218, |
| "step": 3450, |
| "valid_targets_mean": 3887.0, |
| "valid_targets_min": 1180 |
| }, |
| { |
| "epoch": 5.777591973244148, |
| "grad_norm": 1.1205253969747466, |
| "learning_rate": 3.6124426371460542e-06, |
| "loss": 0.2611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.272126704454422, |
| "step": 3455, |
| "valid_targets_mean": 2778.0, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 5.785953177257525, |
| "grad_norm": 1.0498337049709496, |
| "learning_rate": 3.564777181135466e-06, |
| "loss": 0.2762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2422400861978531, |
| "step": 3460, |
| "valid_targets_mean": 2545.4, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 5.794314381270903, |
| "grad_norm": 1.1993568136310828, |
| "learning_rate": 3.517397499629589e-06, |
| "loss": 0.2378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2053757905960083, |
| "step": 3465, |
| "valid_targets_mean": 3302.1, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 5.802675585284281, |
| "grad_norm": 0.843797327600791, |
| "learning_rate": 3.4703044164630064e-06, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2291642725467682, |
| "step": 3470, |
| "valid_targets_mean": 4161.9, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 5.811036789297659, |
| "grad_norm": 0.8755458954346165, |
| "learning_rate": 3.4234987504869553e-06, |
| "loss": 0.2483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3180461823940277, |
| "step": 3475, |
| "valid_targets_mean": 4406.1, |
| "valid_targets_min": 2243 |
| }, |
| { |
| "epoch": 5.8193979933110365, |
| "grad_norm": 1.0301442813101, |
| "learning_rate": 3.376981315555086e-06, |
| "loss": 0.2767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27760040760040283, |
| "step": 3480, |
| "valid_targets_mean": 2683.6, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 5.827759197324415, |
| "grad_norm": 0.9573217341539905, |
| "learning_rate": 3.3307529205092903e-06, |
| "loss": 0.273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.368574321269989, |
| "step": 3485, |
| "valid_targets_mean": 4355.6, |
| "valid_targets_min": 520 |
| }, |
| { |
| "epoch": 5.8361204013377925, |
| "grad_norm": 1.029121606843474, |
| "learning_rate": 3.2848143691656807e-06, |
| "loss": 0.2549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23345233500003815, |
| "step": 3490, |
| "valid_targets_mean": 2955.6, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 5.84448160535117, |
| "grad_norm": 1.0526837100245612, |
| "learning_rate": 3.239166460300571e-06, |
| "loss": 0.2456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23312462866306305, |
| "step": 3495, |
| "valid_targets_mean": 2799.9, |
| "valid_targets_min": 1173 |
| }, |
| { |
| "epoch": 5.852842809364549, |
| "grad_norm": 0.9555127758551365, |
| "learning_rate": 3.1938099876366047e-06, |
| "loss": 0.2627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2574623227119446, |
| "step": 3500, |
| "valid_targets_mean": 2801.6, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 5.861204013377926, |
| "grad_norm": 1.0434914071493264, |
| "learning_rate": 3.1487457398289645e-06, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2559327781200409, |
| "step": 3505, |
| "valid_targets_mean": 3459.7, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 5.869565217391305, |
| "grad_norm": 1.012926148789505, |
| "learning_rate": 3.1039745004516207e-06, |
| "loss": 0.2417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2865094840526581, |
| "step": 3510, |
| "valid_targets_mean": 3056.8, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 5.877926421404682, |
| "grad_norm": 0.9712574615035141, |
| "learning_rate": 3.0594970479837683e-06, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21085739135742188, |
| "step": 3515, |
| "valid_targets_mean": 2824.9, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 5.88628762541806, |
| "grad_norm": 1.0473259954733953, |
| "learning_rate": 3.015314155796234e-06, |
| "loss": 0.2031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2044457346200943, |
| "step": 3520, |
| "valid_targets_mean": 2760.9, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 5.894648829431438, |
| "grad_norm": 0.9843115195011657, |
| "learning_rate": 2.9714265921380557e-06, |
| "loss": 0.2371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20010721683502197, |
| "step": 3525, |
| "valid_targets_mean": 2771.8, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 5.903010033444816, |
| "grad_norm": 0.8585558006225893, |
| "learning_rate": 2.927835120123128e-06, |
| "loss": 0.2512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3017348051071167, |
| "step": 3530, |
| "valid_targets_mean": 3708.9, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 5.911371237458194, |
| "grad_norm": 1.0365669573233212, |
| "learning_rate": 2.8845404977169057e-06, |
| "loss": 0.2316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24910643696784973, |
| "step": 3535, |
| "valid_targets_mean": 3256.1, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 5.919732441471572, |
| "grad_norm": 1.1977783758414982, |
| "learning_rate": 2.841543477723254e-06, |
| "loss": 0.3115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3304036557674408, |
| "step": 3540, |
| "valid_targets_mean": 4009.1, |
| "valid_targets_min": 1801 |
| }, |
| { |
| "epoch": 5.9280936454849495, |
| "grad_norm": 1.0475636986470853, |
| "learning_rate": 2.7988448077713592e-06, |
| "loss": 0.2254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23120662569999695, |
| "step": 3545, |
| "valid_targets_mean": 2633.4, |
| "valid_targets_min": 1628 |
| }, |
| { |
| "epoch": 5.936454849498328, |
| "grad_norm": 0.8986613684835274, |
| "learning_rate": 2.7564452303027024e-06, |
| "loss": 0.24, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25718823075294495, |
| "step": 3550, |
| "valid_targets_mean": 3136.1, |
| "valid_targets_min": 1648 |
| }, |
| { |
| "epoch": 5.944816053511706, |
| "grad_norm": 0.8828527508561764, |
| "learning_rate": 2.7143454825581714e-06, |
| "loss": 0.2043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.189050555229187, |
| "step": 3555, |
| "valid_targets_mean": 3121.1, |
| "valid_targets_min": 1683 |
| }, |
| { |
| "epoch": 5.953177257525084, |
| "grad_norm": 1.117960588110681, |
| "learning_rate": 2.672546296565237e-06, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24358290433883667, |
| "step": 3560, |
| "valid_targets_mean": 3175.4, |
| "valid_targets_min": 1662 |
| }, |
| { |
| "epoch": 5.961538461538462, |
| "grad_norm": 1.0074867797130804, |
| "learning_rate": 2.6310483991252133e-06, |
| "loss": 0.2442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2374524474143982, |
| "step": 3565, |
| "valid_targets_mean": 2834.6, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 5.969899665551839, |
| "grad_norm": 1.0690795488474825, |
| "learning_rate": 2.589852511800646e-06, |
| "loss": 0.2652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17189118266105652, |
| "step": 3570, |
| "valid_targets_mean": 2602.5, |
| "valid_targets_min": 1331 |
| }, |
| { |
| "epoch": 5.978260869565218, |
| "grad_norm": 0.9971267052649938, |
| "learning_rate": 2.54895935090274e-06, |
| "loss": 0.2497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21394936740398407, |
| "step": 3575, |
| "valid_targets_mean": 2751.8, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 5.986622073578595, |
| "grad_norm": 0.9537557291572413, |
| "learning_rate": 2.508369627478917e-06, |
| "loss": 0.2331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22841092944145203, |
| "step": 3580, |
| "valid_targets_mean": 3169.6, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 5.994983277591973, |
| "grad_norm": 0.9343814378914798, |
| "learning_rate": 2.468084047300452e-06, |
| "loss": 0.2185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2370833456516266, |
| "step": 3585, |
| "valid_targets_mean": 3215.1, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 6.003344481605351, |
| "grad_norm": 0.8238052983578956, |
| "learning_rate": 2.4281033108501873e-06, |
| "loss": 0.2314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2642517685890198, |
| "step": 3590, |
| "valid_targets_mean": 4032.8, |
| "valid_targets_min": 1390 |
| }, |
| { |
| "epoch": 6.011705685618729, |
| "grad_norm": 0.8851781452831197, |
| "learning_rate": 2.3884281133103725e-06, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2074108123779297, |
| "step": 3595, |
| "valid_targets_mean": 3117.4, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 6.0200668896321075, |
| "grad_norm": 1.0191065552656804, |
| "learning_rate": 2.3490591445505715e-06, |
| "loss": 0.2346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20292872190475464, |
| "step": 3600, |
| "valid_targets_mean": 2607.1, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 6.028428093645485, |
| "grad_norm": 0.8274990269440808, |
| "learning_rate": 2.309997089115659e-06, |
| "loss": 0.2578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27467474341392517, |
| "step": 3605, |
| "valid_targets_mean": 4511.8, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 6.036789297658863, |
| "grad_norm": 0.9829693732867127, |
| "learning_rate": 2.271242626213925e-06, |
| "loss": 0.2406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2838166654109955, |
| "step": 3610, |
| "valid_targets_mean": 3051.6, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 6.045150501672241, |
| "grad_norm": 0.9430424383463232, |
| "learning_rate": 2.232796429705253e-06, |
| "loss": 0.2751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2801671028137207, |
| "step": 3615, |
| "valid_targets_mean": 3661.6, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 6.053511705685619, |
| "grad_norm": 0.9799256756829944, |
| "learning_rate": 2.1946591680894145e-06, |
| "loss": 0.2252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21253493428230286, |
| "step": 3620, |
| "valid_targets_mean": 3080.5, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 6.061872909698996, |
| "grad_norm": 0.890449059990666, |
| "learning_rate": 2.1568315044944586e-06, |
| "loss": 0.2279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23232722282409668, |
| "step": 3625, |
| "valid_targets_mean": 3467.1, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 6.070234113712375, |
| "grad_norm": 1.553508951062491, |
| "learning_rate": 2.1193140966651484e-06, |
| "loss": 0.2247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2310488224029541, |
| "step": 3630, |
| "valid_targets_mean": 3239.2, |
| "valid_targets_min": 1426 |
| }, |
| { |
| "epoch": 6.078595317725752, |
| "grad_norm": 1.0015740592300846, |
| "learning_rate": 2.082107596951548e-06, |
| "loss": 0.2417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2560243308544159, |
| "step": 3635, |
| "valid_targets_mean": 3611.4, |
| "valid_targets_min": 1662 |
| }, |
| { |
| "epoch": 6.086956521739131, |
| "grad_norm": 0.9610763495680839, |
| "learning_rate": 2.0452126522976746e-06, |
| "loss": 0.2572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23907433450222015, |
| "step": 3640, |
| "valid_targets_mean": 3443.9, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 6.095317725752508, |
| "grad_norm": 1.0195087469479902, |
| "learning_rate": 2.008629904230237e-06, |
| "loss": 0.2266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21630674600601196, |
| "step": 3645, |
| "valid_targets_mean": 3096.0, |
| "valid_targets_min": 1263 |
| }, |
| { |
| "epoch": 6.103678929765886, |
| "grad_norm": 1.1781421008430892, |
| "learning_rate": 1.972359988847499e-06, |
| "loss": 0.2767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22949744760990143, |
| "step": 3650, |
| "valid_targets_mean": 2490.5, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 6.1120401337792645, |
| "grad_norm": 1.0009259653669014, |
| "learning_rate": 1.9364035368082222e-06, |
| "loss": 0.2501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17091065645217896, |
| "step": 3655, |
| "valid_targets_mean": 2323.1, |
| "valid_targets_min": 1277 |
| }, |
| { |
| "epoch": 6.120401337792642, |
| "grad_norm": 0.9973471406872797, |
| "learning_rate": 1.9007611733206733e-06, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29807907342910767, |
| "step": 3660, |
| "valid_targets_mean": 3280.1, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 6.12876254180602, |
| "grad_norm": 0.9458454127635654, |
| "learning_rate": 1.8654335181317784e-06, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26122528314590454, |
| "step": 3665, |
| "valid_targets_mean": 3286.4, |
| "valid_targets_min": 1471 |
| }, |
| { |
| "epoch": 6.137123745819398, |
| "grad_norm": 0.9302638864213695, |
| "learning_rate": 1.8304211855163311e-06, |
| "loss": 0.2551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30081790685653687, |
| "step": 3670, |
| "valid_targets_mean": 3793.2, |
| "valid_targets_min": 392 |
| }, |
| { |
| "epoch": 6.145484949832776, |
| "grad_norm": 0.9293216572645322, |
| "learning_rate": 1.7957247842663194e-06, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2717227041721344, |
| "step": 3675, |
| "valid_targets_mean": 3530.5, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 6.153846153846154, |
| "grad_norm": 1.0642259780797343, |
| "learning_rate": 1.7613449176803476e-06, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18526840209960938, |
| "step": 3680, |
| "valid_targets_mean": 3227.3, |
| "valid_targets_min": 1819 |
| }, |
| { |
| "epoch": 6.162207357859532, |
| "grad_norm": 1.0950639668119169, |
| "learning_rate": 1.7272821835531295e-06, |
| "loss": 0.2536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23934021592140198, |
| "step": 3685, |
| "valid_targets_mean": 2936.0, |
| "valid_targets_min": 1404 |
| }, |
| { |
| "epoch": 6.170568561872909, |
| "grad_norm": 0.8320781108074271, |
| "learning_rate": 1.693537174165103e-06, |
| "loss": 0.2569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2670717239379883, |
| "step": 3690, |
| "valid_targets_mean": 4768.5, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 6.178929765886288, |
| "grad_norm": 1.0190310935542606, |
| "learning_rate": 1.660110476272132e-06, |
| "loss": 0.2267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1878700852394104, |
| "step": 3695, |
| "valid_targets_mean": 2822.3, |
| "valid_targets_min": 1513 |
| }, |
| { |
| "epoch": 6.187290969899665, |
| "grad_norm": 0.946671940766795, |
| "learning_rate": 1.6270026710952924e-06, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18372738361358643, |
| "step": 3700, |
| "valid_targets_mean": 3202.5, |
| "valid_targets_min": 1844 |
| }, |
| { |
| "epoch": 6.195652173913044, |
| "grad_norm": 1.0311761236131074, |
| "learning_rate": 1.5942143343107953e-06, |
| "loss": 0.2366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1737433671951294, |
| "step": 3705, |
| "valid_targets_mean": 2330.4, |
| "valid_targets_min": 983 |
| }, |
| { |
| "epoch": 6.2040133779264215, |
| "grad_norm": 1.7693463573078112, |
| "learning_rate": 1.5617460360399439e-06, |
| "loss": 0.2312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24771828949451447, |
| "step": 3710, |
| "valid_targets_mean": 2783.2, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 6.212374581939799, |
| "grad_norm": 1.1913402227691237, |
| "learning_rate": 1.529598340839238e-06, |
| "loss": 0.2247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20294560492038727, |
| "step": 3715, |
| "valid_targets_mean": 3321.5, |
| "valid_targets_min": 1623 |
| }, |
| { |
| "epoch": 6.2207357859531776, |
| "grad_norm": 1.1205061236211051, |
| "learning_rate": 1.4977718076905533e-06, |
| "loss": 0.245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20099762082099915, |
| "step": 3720, |
| "valid_targets_mean": 2455.0, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 6.229096989966555, |
| "grad_norm": 0.872701348205632, |
| "learning_rate": 1.4662669899914161e-06, |
| "loss": 0.2251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.240260511636734, |
| "step": 3725, |
| "valid_targets_mean": 4170.6, |
| "valid_targets_min": 587 |
| }, |
| { |
| "epoch": 6.237458193979933, |
| "grad_norm": 1.149500218715332, |
| "learning_rate": 1.4350844355453952e-06, |
| "loss": 0.2167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24577274918556213, |
| "step": 3730, |
| "valid_targets_mean": 2776.9, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 6.245819397993311, |
| "grad_norm": 0.9744589071128174, |
| "learning_rate": 1.404224686552571e-06, |
| "loss": 0.2699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2977054715156555, |
| "step": 3735, |
| "valid_targets_mean": 3161.8, |
| "valid_targets_min": 1420 |
| }, |
| { |
| "epoch": 6.254180602006689, |
| "grad_norm": 1.0622602777455052, |
| "learning_rate": 1.3736882796000983e-06, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2422657608985901, |
| "step": 3740, |
| "valid_targets_mean": 3276.9, |
| "valid_targets_min": 2083 |
| }, |
| { |
| "epoch": 6.262541806020067, |
| "grad_norm": 0.9192780596090956, |
| "learning_rate": 1.3434757456528868e-06, |
| "loss": 0.2165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23593655228614807, |
| "step": 3745, |
| "valid_targets_mean": 3154.8, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 6.270903010033445, |
| "grad_norm": 1.0794767225936577, |
| "learning_rate": 1.3135876100443557e-06, |
| "loss": 0.2451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19183969497680664, |
| "step": 3750, |
| "valid_targets_mean": 2641.8, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 6.2792642140468224, |
| "grad_norm": 1.1069267787089752, |
| "learning_rate": 1.2840243924673202e-06, |
| "loss": 0.2327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19526013731956482, |
| "step": 3755, |
| "valid_targets_mean": 2651.9, |
| "valid_targets_min": 1307 |
| }, |
| { |
| "epoch": 6.287625418060201, |
| "grad_norm": 0.9530346118359216, |
| "learning_rate": 1.2547866069649418e-06, |
| "loss": 0.2508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2443237155675888, |
| "step": 3760, |
| "valid_targets_mean": 2864.8, |
| "valid_targets_min": 1587 |
| }, |
| { |
| "epoch": 6.2959866220735785, |
| "grad_norm": 0.9997194895255284, |
| "learning_rate": 1.225874761921788e-06, |
| "loss": 0.2238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22411714494228363, |
| "step": 3765, |
| "valid_targets_mean": 2974.7, |
| "valid_targets_min": 1770 |
| }, |
| { |
| "epoch": 6.304347826086957, |
| "grad_norm": 0.9257546461579786, |
| "learning_rate": 1.1972893600550007e-06, |
| "loss": 0.271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20396903157234192, |
| "step": 3770, |
| "valid_targets_mean": 3238.4, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 6.312709030100335, |
| "grad_norm": 0.9526741297223604, |
| "learning_rate": 1.1690308984055454e-06, |
| "loss": 0.2326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31394025683403015, |
| "step": 3775, |
| "valid_targets_mean": 3941.2, |
| "valid_targets_min": 1904 |
| }, |
| { |
| "epoch": 6.321070234113712, |
| "grad_norm": 1.0127893431246604, |
| "learning_rate": 1.141099868329576e-06, |
| "loss": 0.2697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2128710150718689, |
| "step": 3780, |
| "valid_targets_mean": 3173.2, |
| "valid_targets_min": 2167 |
| }, |
| { |
| "epoch": 6.329431438127091, |
| "grad_norm": 0.8562910539058333, |
| "learning_rate": 1.1134967554898868e-06, |
| "loss": 0.2487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3077230155467987, |
| "step": 3785, |
| "valid_targets_mean": 3871.0, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 6.337792642140468, |
| "grad_norm": 1.0570481175477418, |
| "learning_rate": 1.0862220398474798e-06, |
| "loss": 0.202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24611452221870422, |
| "step": 3790, |
| "valid_targets_mean": 2720.8, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 6.346153846153846, |
| "grad_norm": 0.9974643589859099, |
| "learning_rate": 1.0592761956531983e-06, |
| "loss": 0.26, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15949031710624695, |
| "step": 3795, |
| "valid_targets_mean": 2890.8, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 6.354515050167224, |
| "grad_norm": 1.0285315175075678, |
| "learning_rate": 1.0326596914395015e-06, |
| "loss": 0.2196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.218702495098114, |
| "step": 3800, |
| "valid_targets_mean": 2983.0, |
| "valid_targets_min": 1307 |
| }, |
| { |
| "epoch": 6.362876254180602, |
| "grad_norm": 1.0391314709729795, |
| "learning_rate": 1.0063729900122943e-06, |
| "loss": 0.2349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22132647037506104, |
| "step": 3805, |
| "valid_targets_mean": 3014.7, |
| "valid_targets_min": 1600 |
| }, |
| { |
| "epoch": 6.3712374581939795, |
| "grad_norm": 1.0732291866174521, |
| "learning_rate": 9.80416548442904e-07, |
| "loss": 0.2359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16350066661834717, |
| "step": 3810, |
| "valid_targets_mean": 2471.2, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 6.379598662207358, |
| "grad_norm": 0.9478207894233418, |
| "learning_rate": 9.547908180601274e-07, |
| "loss": 0.218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2005515992641449, |
| "step": 3815, |
| "valid_targets_mean": 3266.4, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 6.3879598662207355, |
| "grad_norm": 0.9884148175012485, |
| "learning_rate": 9.294962444423672e-07, |
| "loss": 0.2352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18229839205741882, |
| "step": 3820, |
| "valid_targets_mean": 2692.9, |
| "valid_targets_min": 1731 |
| }, |
| { |
| "epoch": 6.396321070234114, |
| "grad_norm": 1.0689420786608823, |
| "learning_rate": 9.045332674099039e-07, |
| "loss": 0.2429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2374996840953827, |
| "step": 3825, |
| "valid_targets_mean": 3234.9, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 6.404682274247492, |
| "grad_norm": 0.9999053556423455, |
| "learning_rate": 8.799023210172319e-07, |
| "loss": 0.2183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2577441334724426, |
| "step": 3830, |
| "valid_targets_mean": 3541.5, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 6.413043478260869, |
| "grad_norm": 1.0162923003110396, |
| "learning_rate": 8.556038335455241e-07, |
| "loss": 0.2354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17862260341644287, |
| "step": 3835, |
| "valid_targets_mean": 3000.1, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 6.421404682274248, |
| "grad_norm": 0.9436887696227507, |
| "learning_rate": 8.316382274951773e-07, |
| "loss": 0.2596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3100453317165375, |
| "step": 3840, |
| "valid_targets_mean": 4021.4, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 6.429765886287625, |
| "grad_norm": 0.9165404614671304, |
| "learning_rate": 8.080059195784829e-07, |
| "loss": 0.2715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29584699869155884, |
| "step": 3845, |
| "valid_targets_mean": 3990.2, |
| "valid_targets_min": 1509 |
| }, |
| { |
| "epoch": 6.438127090301004, |
| "grad_norm": 1.1633047424989935, |
| "learning_rate": 7.847073207123523e-07, |
| "loss": 0.2805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2624181807041168, |
| "step": 3850, |
| "valid_targets_mean": 2811.7, |
| "valid_targets_min": 1472 |
| }, |
| { |
| "epoch": 6.446488294314381, |
| "grad_norm": 0.9983233707225826, |
| "learning_rate": 7.617428360111945e-07, |
| "loss": 0.2271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.281194269657135, |
| "step": 3855, |
| "valid_targets_mean": 3405.9, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 6.454849498327759, |
| "grad_norm": 1.1246524097930575, |
| "learning_rate": 7.391128647798607e-07, |
| "loss": 0.2389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22077451646327972, |
| "step": 3860, |
| "valid_targets_mean": 2505.6, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 6.463210702341137, |
| "grad_norm": 0.886456015080147, |
| "learning_rate": 7.168178005067062e-07, |
| "loss": 0.2656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29799652099609375, |
| "step": 3865, |
| "valid_targets_mean": 3983.9, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 6.471571906354515, |
| "grad_norm": 1.103332362483573, |
| "learning_rate": 6.948580308567532e-07, |
| "loss": 0.2222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2571655511856079, |
| "step": 3870, |
| "valid_targets_mean": 2698.6, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 6.479933110367893, |
| "grad_norm": 1.0813420856710951, |
| "learning_rate": 6.732339376649388e-07, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22849063575267792, |
| "step": 3875, |
| "valid_targets_mean": 2950.5, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 6.488294314381271, |
| "grad_norm": 1.0707482467762934, |
| "learning_rate": 6.519458969294845e-07, |
| "loss": 0.2237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18700650334358215, |
| "step": 3880, |
| "valid_targets_mean": 2505.4, |
| "valid_targets_min": 1004 |
| }, |
| { |
| "epoch": 6.496655518394649, |
| "grad_norm": 0.9136997187616676, |
| "learning_rate": 6.309942788053502e-07, |
| "loss": 0.2166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18983229994773865, |
| "step": 3885, |
| "valid_targets_mean": 2847.4, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 6.505016722408027, |
| "grad_norm": 0.9836787164297042, |
| "learning_rate": 6.103794475978086e-07, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27802348136901855, |
| "step": 3890, |
| "valid_targets_mean": 3571.6, |
| "valid_targets_min": 1766 |
| }, |
| { |
| "epoch": 6.513377926421405, |
| "grad_norm": 1.0040587188078438, |
| "learning_rate": 5.901017617560989e-07, |
| "loss": 0.2256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2178075611591339, |
| "step": 3895, |
| "valid_targets_mean": 3485.3, |
| "valid_targets_min": 1748 |
| }, |
| { |
| "epoch": 6.521739130434782, |
| "grad_norm": 0.9972334739609068, |
| "learning_rate": 5.701615738672073e-07, |
| "loss": 0.2391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2519034743309021, |
| "step": 3900, |
| "valid_targets_mean": 3683.1, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 6.530100334448161, |
| "grad_norm": 1.0048200677550907, |
| "learning_rate": 5.505592306497298e-07, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2037794291973114, |
| "step": 3905, |
| "valid_targets_mean": 2815.6, |
| "valid_targets_min": 1187 |
| }, |
| { |
| "epoch": 6.538461538461538, |
| "grad_norm": 0.9738058489579007, |
| "learning_rate": 5.312950729478327e-07, |
| "loss": 0.2571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1917770355939865, |
| "step": 3910, |
| "valid_targets_mean": 2968.3, |
| "valid_targets_min": 1757 |
| }, |
| { |
| "epoch": 6.546822742474916, |
| "grad_norm": 0.9699331976466884, |
| "learning_rate": 5.123694357253439e-07, |
| "loss": 0.2332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19296962022781372, |
| "step": 3915, |
| "valid_targets_mean": 3587.3, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 6.555183946488294, |
| "grad_norm": 0.9210291981550992, |
| "learning_rate": 4.937826480599195e-07, |
| "loss": 0.239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25981834530830383, |
| "step": 3920, |
| "valid_targets_mean": 3616.3, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 6.563545150501672, |
| "grad_norm": 0.9639041354225487, |
| "learning_rate": 4.755350331373243e-07, |
| "loss": 0.2665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22324317693710327, |
| "step": 3925, |
| "valid_targets_mean": 3426.1, |
| "valid_targets_min": 1477 |
| }, |
| { |
| "epoch": 6.5719063545150505, |
| "grad_norm": 1.0060449285500996, |
| "learning_rate": 4.576269082458118e-07, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18587031960487366, |
| "step": 3930, |
| "valid_targets_mean": 2988.8, |
| "valid_targets_min": 1536 |
| }, |
| { |
| "epoch": 6.580267558528428, |
| "grad_norm": 1.125813362538308, |
| "learning_rate": 4.4005858477060404e-07, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21866926550865173, |
| "step": 3935, |
| "valid_targets_mean": 3366.3, |
| "valid_targets_min": 1060 |
| }, |
| { |
| "epoch": 6.588628762541806, |
| "grad_norm": 1.0628904813820763, |
| "learning_rate": 4.228303681884782e-07, |
| "loss": 0.2324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25543057918548584, |
| "step": 3940, |
| "valid_targets_mean": 3191.6, |
| "valid_targets_min": 1800 |
| }, |
| { |
| "epoch": 6.596989966555184, |
| "grad_norm": 0.9915725733061522, |
| "learning_rate": 4.059425580624576e-07, |
| "loss": 0.2374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28621232509613037, |
| "step": 3945, |
| "valid_targets_mean": 3603.1, |
| "valid_targets_min": 1548 |
| }, |
| { |
| "epoch": 6.605351170568562, |
| "grad_norm": 0.9949146897868569, |
| "learning_rate": 3.893954480366091e-07, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1640351116657257, |
| "step": 3950, |
| "valid_targets_mean": 2460.5, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 6.61371237458194, |
| "grad_norm": 1.111214711835855, |
| "learning_rate": 3.731893258309227e-07, |
| "loss": 0.2271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22030051052570343, |
| "step": 3955, |
| "valid_targets_mean": 2509.4, |
| "valid_targets_min": 553 |
| }, |
| { |
| "epoch": 6.622073578595318, |
| "grad_norm": 1.1676078726615438, |
| "learning_rate": 3.573244732363179e-07, |
| "loss": 0.2437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.243607297539711, |
| "step": 3960, |
| "valid_targets_mean": 3134.6, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 6.630434782608695, |
| "grad_norm": 0.9596071900127525, |
| "learning_rate": 3.4180116610973645e-07, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.280606210231781, |
| "step": 3965, |
| "valid_targets_mean": 3487.9, |
| "valid_targets_min": 1539 |
| }, |
| { |
| "epoch": 6.638795986622074, |
| "grad_norm": 1.0307311782355484, |
| "learning_rate": 3.2661967436936394e-07, |
| "loss": 0.2347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2129300832748413, |
| "step": 3970, |
| "valid_targets_mean": 3150.9, |
| "valid_targets_min": 364 |
| }, |
| { |
| "epoch": 6.647157190635451, |
| "grad_norm": 0.9029900853777432, |
| "learning_rate": 3.117802619899113e-07, |
| "loss": 0.2266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2022523730993271, |
| "step": 3975, |
| "valid_targets_mean": 3131.2, |
| "valid_targets_min": 1462 |
| }, |
| { |
| "epoch": 6.65551839464883, |
| "grad_norm": 0.9353250337198755, |
| "learning_rate": 2.9728318699804525e-07, |
| "loss": 0.2183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26376834511756897, |
| "step": 3980, |
| "valid_targets_mean": 3456.8, |
| "valid_targets_min": 1636 |
| }, |
| { |
| "epoch": 6.6638795986622075, |
| "grad_norm": 1.1365720683226703, |
| "learning_rate": 2.831287014678941e-07, |
| "loss": 0.2141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19698631763458252, |
| "step": 3985, |
| "valid_targets_mean": 2634.6, |
| "valid_targets_min": 569 |
| }, |
| { |
| "epoch": 6.672240802675585, |
| "grad_norm": 0.9037444665225245, |
| "learning_rate": 2.693170515166599e-07, |
| "loss": 0.2162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17331139743328094, |
| "step": 3990, |
| "valid_targets_mean": 3423.4, |
| "valid_targets_min": 2070 |
| }, |
| { |
| "epoch": 6.6806020066889635, |
| "grad_norm": 1.012894148288379, |
| "learning_rate": 2.558484773003445e-07, |
| "loss": 0.2485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2655693292617798, |
| "step": 3995, |
| "valid_targets_mean": 3323.4, |
| "valid_targets_min": 1844 |
| }, |
| { |
| "epoch": 6.688963210702341, |
| "grad_norm": 0.9548388318374232, |
| "learning_rate": 2.427232130095747e-07, |
| "loss": 0.2373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21322210133075714, |
| "step": 4000, |
| "valid_targets_mean": 2801.6, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 6.697324414715719, |
| "grad_norm": 1.0832658905494663, |
| "learning_rate": 2.299414868655281e-07, |
| "loss": 0.2434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2207055389881134, |
| "step": 4005, |
| "valid_targets_mean": 2772.9, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 6.705685618729097, |
| "grad_norm": 0.9005094142183284, |
| "learning_rate": 2.1750352111596707e-07, |
| "loss": 0.24, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24203582108020782, |
| "step": 4010, |
| "valid_targets_mean": 3876.8, |
| "valid_targets_min": 2273 |
| }, |
| { |
| "epoch": 6.714046822742475, |
| "grad_norm": 0.9978940251893587, |
| "learning_rate": 2.0540953203137093e-07, |
| "loss": 0.225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1879318505525589, |
| "step": 4015, |
| "valid_targets_mean": 3497.7, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 6.722408026755852, |
| "grad_norm": 0.9909059278250834, |
| "learning_rate": 1.9365972990117e-07, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1991642862558365, |
| "step": 4020, |
| "valid_targets_mean": 2930.1, |
| "valid_targets_min": 1353 |
| }, |
| { |
| "epoch": 6.730769230769231, |
| "grad_norm": 0.9925673396527694, |
| "learning_rate": 1.8225431903010403e-07, |
| "loss": 0.2172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23669245839118958, |
| "step": 4025, |
| "valid_targets_mean": 2976.0, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 6.739130434782608, |
| "grad_norm": 0.97958659307702, |
| "learning_rate": 1.7119349773466076e-07, |
| "loss": 0.2493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18920472264289856, |
| "step": 4030, |
| "valid_targets_mean": 2922.8, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 6.747491638795987, |
| "grad_norm": 0.9895938981944002, |
| "learning_rate": 1.6047745833962735e-07, |
| "loss": 0.2638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4012299180030823, |
| "step": 4035, |
| "valid_targets_mean": 4044.7, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 6.7558528428093645, |
| "grad_norm": 1.005865202853038, |
| "learning_rate": 1.5010638717474878e-07, |
| "loss": 0.2231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2346489280462265, |
| "step": 4040, |
| "valid_targets_mean": 3234.9, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 6.764214046822742, |
| "grad_norm": 0.9665878862524135, |
| "learning_rate": 1.400804645714815e-07, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20860449969768524, |
| "step": 4045, |
| "valid_targets_mean": 2963.2, |
| "valid_targets_min": 1512 |
| }, |
| { |
| "epoch": 6.7725752508361206, |
| "grad_norm": 0.9073442199596257, |
| "learning_rate": 1.30399864859867e-07, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21425005793571472, |
| "step": 4050, |
| "valid_targets_mean": 4054.4, |
| "valid_targets_min": 970 |
| }, |
| { |
| "epoch": 6.780936454849498, |
| "grad_norm": 1.1395884258364646, |
| "learning_rate": 1.2106475636549654e-07, |
| "loss": 0.2503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2343166172504425, |
| "step": 4055, |
| "valid_targets_mean": 2424.9, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 6.789297658862877, |
| "grad_norm": 1.2355832602043204, |
| "learning_rate": 1.1207530140658452e-07, |
| "loss": 0.247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1832336038351059, |
| "step": 4060, |
| "valid_targets_mean": 2785.1, |
| "valid_targets_min": 1439 |
| }, |
| { |
| "epoch": 6.797658862876254, |
| "grad_norm": 1.0756162811102452, |
| "learning_rate": 1.0343165629114416e-07, |
| "loss": 0.2292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2562386989593506, |
| "step": 4065, |
| "valid_targets_mean": 2926.1, |
| "valid_targets_min": 1110 |
| }, |
| { |
| "epoch": 6.806020066889632, |
| "grad_norm": 1.12479348737203, |
| "learning_rate": 9.513397131427404e-08, |
| "loss": 0.2543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19680562615394592, |
| "step": 4070, |
| "valid_targets_mean": 3050.8, |
| "valid_targets_min": 1505 |
| }, |
| { |
| "epoch": 6.81438127090301, |
| "grad_norm": 1.3027817427113138, |
| "learning_rate": 8.71823907555358e-08, |
| "loss": 0.2794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2448652684688568, |
| "step": 4075, |
| "valid_targets_mean": 3234.3, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 6.822742474916388, |
| "grad_norm": 1.0120756120555998, |
| "learning_rate": 7.957705287645834e-08, |
| "loss": 0.2318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.236515074968338, |
| "step": 4080, |
| "valid_targets_mean": 3107.5, |
| "valid_targets_min": 1469 |
| }, |
| { |
| "epoch": 6.831103678929766, |
| "grad_norm": 1.1643671752495577, |
| "learning_rate": 7.231808991812639e-08, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24128901958465576, |
| "step": 4085, |
| "valid_targets_mean": 2651.4, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 6.839464882943144, |
| "grad_norm": 1.0224383394242054, |
| "learning_rate": 6.540562809887574e-08, |
| "loss": 0.2128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2086195945739746, |
| "step": 4090, |
| "valid_targets_mean": 2881.9, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 6.8478260869565215, |
| "grad_norm": 0.8984874112503329, |
| "learning_rate": 5.8839787612114955e-08, |
| "loss": 0.2302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19981077313423157, |
| "step": 4095, |
| "valid_targets_mean": 3368.8, |
| "valid_targets_min": 1532 |
| }, |
| { |
| "epoch": 6.8561872909699, |
| "grad_norm": 1.1889036672332234, |
| "learning_rate": 5.2620682624213714e-08, |
| "loss": 0.2788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3057703673839569, |
| "step": 4100, |
| "valid_targets_mean": 2838.0, |
| "valid_targets_min": 520 |
| }, |
| { |
| "epoch": 6.864548494983278, |
| "grad_norm": 0.9722791686736607, |
| "learning_rate": 4.6748421272537756e-08, |
| "loss": 0.2356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3012353777885437, |
| "step": 4105, |
| "valid_targets_mean": 3410.2, |
| "valid_targets_min": 401 |
| }, |
| { |
| "epoch": 6.872909698996655, |
| "grad_norm": 0.8439698339063494, |
| "learning_rate": 4.1223105663554806e-08, |
| "loss": 0.2274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22458210587501526, |
| "step": 4110, |
| "valid_targets_mean": 4013.0, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 6.881270903010034, |
| "grad_norm": 0.9937076155434867, |
| "learning_rate": 3.604483187106711e-08, |
| "loss": 0.2557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21647757291793823, |
| "step": 4115, |
| "valid_targets_mean": 2891.7, |
| "valid_targets_min": 1398 |
| }, |
| { |
| "epoch": 6.889632107023411, |
| "grad_norm": 0.9554683145250049, |
| "learning_rate": 3.1213689934537215e-08, |
| "loss": 0.2428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.227905735373497, |
| "step": 4120, |
| "valid_targets_mean": 3056.9, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 6.897993311036789, |
| "grad_norm": 0.9851841831055532, |
| "learning_rate": 2.6729763857522573e-08, |
| "loss": 0.2184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20012471079826355, |
| "step": 4125, |
| "valid_targets_mean": 2812.2, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 6.906354515050167, |
| "grad_norm": 0.9102139042294596, |
| "learning_rate": 2.2593131606216677e-08, |
| "loss": 0.2404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22855457663536072, |
| "step": 4130, |
| "valid_targets_mean": 3411.4, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 6.914715719063545, |
| "grad_norm": 0.9968709409763933, |
| "learning_rate": 1.880386510809018e-08, |
| "loss": 0.2175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24055655300617218, |
| "step": 4135, |
| "valid_targets_mean": 2944.4, |
| "valid_targets_min": 1447 |
| }, |
| { |
| "epoch": 6.923076923076923, |
| "grad_norm": 1.0089101681026145, |
| "learning_rate": 1.536203025064742e-08, |
| "loss": 0.2634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23049476742744446, |
| "step": 4140, |
| "valid_targets_mean": 3192.5, |
| "valid_targets_min": 1745 |
| }, |
| { |
| "epoch": 6.931438127090301, |
| "grad_norm": 1.0054169631158152, |
| "learning_rate": 1.226768688026736e-08, |
| "loss": 0.2575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21784156560897827, |
| "step": 4145, |
| "valid_targets_mean": 2982.2, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 6.9397993311036785, |
| "grad_norm": 1.0500654956007207, |
| "learning_rate": 9.520888801182182e-09, |
| "loss": 0.2275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21303492784500122, |
| "step": 4150, |
| "valid_targets_mean": 2794.8, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 6.948160535117057, |
| "grad_norm": 1.054419064540089, |
| "learning_rate": 7.121683774518051e-09, |
| "loss": 0.2378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17308101058006287, |
| "step": 4155, |
| "valid_targets_mean": 2646.4, |
| "valid_targets_min": 1295 |
| }, |
| { |
| "epoch": 6.956521739130435, |
| "grad_norm": 1.00371154489669, |
| "learning_rate": 5.0701135174890944e-09, |
| "loss": 0.2474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29931163787841797, |
| "step": 4160, |
| "valid_targets_mean": 3849.4, |
| "valid_targets_min": 403 |
| }, |
| { |
| "epoch": 6.964882943143813, |
| "grad_norm": 0.930732845194307, |
| "learning_rate": 3.3662137026535537e-09, |
| "loss": 0.2348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22841259837150574, |
| "step": 4165, |
| "valid_targets_mean": 3192.3, |
| "valid_targets_min": 1398 |
| }, |
| { |
| "epoch": 6.973244147157191, |
| "grad_norm": 0.9699847666900223, |
| "learning_rate": 2.0100139573031584e-09, |
| "loss": 0.2398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2246263176202774, |
| "step": 4170, |
| "valid_targets_mean": 2845.4, |
| "valid_targets_min": 1337 |
| }, |
| { |
| "epoch": 6.981605351170568, |
| "grad_norm": 0.9378995458223955, |
| "learning_rate": 1.0015378629413265e-09, |
| "loss": 0.2268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21635910868644714, |
| "step": 4175, |
| "valid_targets_mean": 2931.9, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 6.989966555183947, |
| "grad_norm": 1.0220155583231438, |
| "learning_rate": 3.4080295488347903e-10, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2119850516319275, |
| "step": 4180, |
| "valid_targets_mean": 2728.2, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 6.998327759197324, |
| "grad_norm": 0.9751477515928492, |
| "learning_rate": 2.7820721939519902e-11, |
| "loss": 0.231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21303658187389374, |
| "step": 4185, |
| "valid_targets_mean": 3151.9, |
| "valid_targets_min": 1522 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22936706244945526, |
| "step": 4186, |
| "total_flos": 791537577689088.0, |
| "train_loss": 0.17696809689205084, |
| "train_runtime": 13311.7439, |
| "train_samples_per_second": 5.027, |
| "train_steps_per_second": 0.314, |
| "valid_targets_mean": 3387.6, |
| "valid_targets_min": 1204 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4186, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 791537577689088.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|