| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4585, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.007639419404125287, |
| "grad_norm": 8.56353259226621, |
| "learning_rate": 3.4858387799564276e-07, |
| "loss": 0.9853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.485528826713562, |
| "step": 5, |
| "valid_targets_mean": 3401.8, |
| "valid_targets_min": 1382 |
| }, |
| { |
| "epoch": 0.015278838808250574, |
| "grad_norm": 8.131404212301335, |
| "learning_rate": 7.843137254901962e-07, |
| "loss": 1.0071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47187474370002747, |
| "step": 10, |
| "valid_targets_mean": 2919.4, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 0.02291825821237586, |
| "grad_norm": 7.290663279109773, |
| "learning_rate": 1.2200435729847495e-06, |
| "loss": 1.0029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3917523920536041, |
| "step": 15, |
| "valid_targets_mean": 2336.1, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 0.030557677616501147, |
| "grad_norm": 6.253781799061595, |
| "learning_rate": 1.655773420479303e-06, |
| "loss": 0.959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6743544936180115, |
| "step": 20, |
| "valid_targets_mean": 3415.9, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 0.03819709702062643, |
| "grad_norm": 4.392892259108477, |
| "learning_rate": 2.0915032679738565e-06, |
| "loss": 0.9939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3614335358142853, |
| "step": 25, |
| "valid_targets_mean": 2495.8, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 0.04583651642475172, |
| "grad_norm": 3.431018980960601, |
| "learning_rate": 2.5272331154684097e-06, |
| "loss": 0.922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5053595304489136, |
| "step": 30, |
| "valid_targets_mean": 4036.6, |
| "valid_targets_min": 1478 |
| }, |
| { |
| "epoch": 0.053475935828877004, |
| "grad_norm": 3.153409826158592, |
| "learning_rate": 2.962962962962963e-06, |
| "loss": 0.9547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3868003785610199, |
| "step": 35, |
| "valid_targets_mean": 2478.8, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 0.061115355233002294, |
| "grad_norm": 2.0831272022034146, |
| "learning_rate": 3.398692810457517e-06, |
| "loss": 0.8596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4014698266983032, |
| "step": 40, |
| "valid_targets_mean": 4233.2, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 0.06875477463712758, |
| "grad_norm": 1.6667591827402235, |
| "learning_rate": 3.83442265795207e-06, |
| "loss": 0.8571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4750503897666931, |
| "step": 45, |
| "valid_targets_mean": 3809.9, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 0.07639419404125286, |
| "grad_norm": 1.3493811705230785, |
| "learning_rate": 4.270152505446624e-06, |
| "loss": 0.8804, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3598395884037018, |
| "step": 50, |
| "valid_targets_mean": 2505.9, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 0.08403361344537816, |
| "grad_norm": 1.5469719000738422, |
| "learning_rate": 4.705882352941177e-06, |
| "loss": 0.8181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3857227563858032, |
| "step": 55, |
| "valid_targets_mean": 2302.5, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 0.09167303284950344, |
| "grad_norm": 1.2108296473201847, |
| "learning_rate": 5.14161220043573e-06, |
| "loss": 0.8229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6197760105133057, |
| "step": 60, |
| "valid_targets_mean": 3091.4, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 0.09931245225362872, |
| "grad_norm": 0.9602992602617543, |
| "learning_rate": 5.577342047930284e-06, |
| "loss": 0.7262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3339218497276306, |
| "step": 65, |
| "valid_targets_mean": 3060.6, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 0.10695187165775401, |
| "grad_norm": 0.987631773029606, |
| "learning_rate": 6.0130718954248365e-06, |
| "loss": 0.8129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4006999731063843, |
| "step": 70, |
| "valid_targets_mean": 3960.8, |
| "valid_targets_min": 455 |
| }, |
| { |
| "epoch": 0.11459129106187929, |
| "grad_norm": 0.9293072024847869, |
| "learning_rate": 6.4488017429193905e-06, |
| "loss": 0.7625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42446625232696533, |
| "step": 75, |
| "valid_targets_mean": 3102.1, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 0.12223071046600459, |
| "grad_norm": 0.8519810844732746, |
| "learning_rate": 6.8845315904139445e-06, |
| "loss": 0.7621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34469449520111084, |
| "step": 80, |
| "valid_targets_mean": 3108.2, |
| "valid_targets_min": 1559 |
| }, |
| { |
| "epoch": 0.12987012987012986, |
| "grad_norm": 0.7340258302490502, |
| "learning_rate": 7.320261437908497e-06, |
| "loss": 0.7235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3129647672176361, |
| "step": 85, |
| "valid_targets_mean": 3680.9, |
| "valid_targets_min": 2358 |
| }, |
| { |
| "epoch": 0.13750954927425516, |
| "grad_norm": 0.7217579014723088, |
| "learning_rate": 7.755991285403051e-06, |
| "loss": 0.7184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22861731052398682, |
| "step": 90, |
| "valid_targets_mean": 2556.1, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 0.14514896867838045, |
| "grad_norm": 0.7843685287405917, |
| "learning_rate": 8.191721132897605e-06, |
| "loss": 0.714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2588593661785126, |
| "step": 95, |
| "valid_targets_mean": 2526.9, |
| "valid_targets_min": 1296 |
| }, |
| { |
| "epoch": 0.15278838808250572, |
| "grad_norm": 0.835309959958566, |
| "learning_rate": 8.627450980392157e-06, |
| "loss": 0.7336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29795417189598083, |
| "step": 100, |
| "valid_targets_mean": 2311.1, |
| "valid_targets_min": 962 |
| }, |
| { |
| "epoch": 0.16042780748663102, |
| "grad_norm": 0.8939656344358561, |
| "learning_rate": 9.063180827886711e-06, |
| "loss": 0.6585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.355358362197876, |
| "step": 105, |
| "valid_targets_mean": 2767.4, |
| "valid_targets_min": 1885 |
| }, |
| { |
| "epoch": 0.16806722689075632, |
| "grad_norm": 0.7765567561351433, |
| "learning_rate": 9.498910675381264e-06, |
| "loss": 0.7021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3594488501548767, |
| "step": 110, |
| "valid_targets_mean": 3382.8, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 0.17570664629488159, |
| "grad_norm": 0.699526469363576, |
| "learning_rate": 9.934640522875818e-06, |
| "loss": 0.6992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4037782847881317, |
| "step": 115, |
| "valid_targets_mean": 4486.2, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 0.18334606569900688, |
| "grad_norm": 0.8794463842026947, |
| "learning_rate": 1.037037037037037e-05, |
| "loss": 0.7356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3373746871948242, |
| "step": 120, |
| "valid_targets_mean": 2458.4, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 0.19098548510313215, |
| "grad_norm": 0.676206262993347, |
| "learning_rate": 1.0806100217864926e-05, |
| "loss": 0.6595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30680835247039795, |
| "step": 125, |
| "valid_targets_mean": 3827.6, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 0.19862490450725745, |
| "grad_norm": 0.7688052056049358, |
| "learning_rate": 1.1241830065359478e-05, |
| "loss": 0.698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26999378204345703, |
| "step": 130, |
| "valid_targets_mean": 2575.5, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 0.20626432391138275, |
| "grad_norm": 0.7755987352317165, |
| "learning_rate": 1.167755991285403e-05, |
| "loss": 0.6742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.330909788608551, |
| "step": 135, |
| "valid_targets_mean": 3124.4, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 0.21390374331550802, |
| "grad_norm": 0.7903556123351976, |
| "learning_rate": 1.2113289760348586e-05, |
| "loss": 0.6659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38125163316726685, |
| "step": 140, |
| "valid_targets_mean": 3087.4, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 0.2215431627196333, |
| "grad_norm": 0.7589506946645384, |
| "learning_rate": 1.2549019607843138e-05, |
| "loss": 0.6921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36488616466522217, |
| "step": 145, |
| "valid_targets_mean": 4247.0, |
| "valid_targets_min": 1868 |
| }, |
| { |
| "epoch": 0.22918258212375858, |
| "grad_norm": 0.6894437269697314, |
| "learning_rate": 1.298474945533769e-05, |
| "loss": 0.6682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2953642010688782, |
| "step": 150, |
| "valid_targets_mean": 3034.4, |
| "valid_targets_min": 1694 |
| }, |
| { |
| "epoch": 0.23682200152788388, |
| "grad_norm": 0.9478585705238028, |
| "learning_rate": 1.3420479302832245e-05, |
| "loss": 0.6625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3361087143421173, |
| "step": 155, |
| "valid_targets_mean": 1931.2, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 0.24446142093200918, |
| "grad_norm": 0.6983921245328072, |
| "learning_rate": 1.3856209150326799e-05, |
| "loss": 0.6769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39449670910835266, |
| "step": 160, |
| "valid_targets_mean": 4291.1, |
| "valid_targets_min": 976 |
| }, |
| { |
| "epoch": 0.25210084033613445, |
| "grad_norm": 0.7642774492217729, |
| "learning_rate": 1.4291938997821353e-05, |
| "loss": 0.6664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3134499788284302, |
| "step": 165, |
| "valid_targets_mean": 2839.6, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 0.2597402597402597, |
| "grad_norm": 0.7000875293679036, |
| "learning_rate": 1.4727668845315905e-05, |
| "loss": 0.635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41188955307006836, |
| "step": 170, |
| "valid_targets_mean": 3929.6, |
| "valid_targets_min": 1889 |
| }, |
| { |
| "epoch": 0.26737967914438504, |
| "grad_norm": 0.860459609848493, |
| "learning_rate": 1.5163398692810458e-05, |
| "loss": 0.6856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4588810205459595, |
| "step": 175, |
| "valid_targets_mean": 3703.8, |
| "valid_targets_min": 1237 |
| }, |
| { |
| "epoch": 0.2750190985485103, |
| "grad_norm": 1.9304398390219022, |
| "learning_rate": 1.559912854030501e-05, |
| "loss": 0.6345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32375526428222656, |
| "step": 180, |
| "valid_targets_mean": 3939.1, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 0.2826585179526356, |
| "grad_norm": 0.8170199929994688, |
| "learning_rate": 1.6034858387799567e-05, |
| "loss": 0.6095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33352822065353394, |
| "step": 185, |
| "valid_targets_mean": 3359.6, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 0.2902979373567609, |
| "grad_norm": 0.6978579891276123, |
| "learning_rate": 1.647058823529412e-05, |
| "loss": 0.6729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40702342987060547, |
| "step": 190, |
| "valid_targets_mean": 3593.4, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 0.2979373567608862, |
| "grad_norm": 1.0173308675163864, |
| "learning_rate": 1.6906318082788672e-05, |
| "loss": 0.6387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4305134415626526, |
| "step": 195, |
| "valid_targets_mean": 2495.9, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 0.30557677616501144, |
| "grad_norm": 0.6720245226873705, |
| "learning_rate": 1.7342047930283224e-05, |
| "loss": 0.631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26800355315208435, |
| "step": 200, |
| "valid_targets_mean": 2775.8, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 0.31321619556913677, |
| "grad_norm": 0.7925807789036575, |
| "learning_rate": 1.7777777777777777e-05, |
| "loss": 0.6251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26368221640586853, |
| "step": 205, |
| "valid_targets_mean": 3823.2, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 0.32085561497326204, |
| "grad_norm": 0.8482490987351864, |
| "learning_rate": 1.8213507625272332e-05, |
| "loss": 0.6464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3924250304698944, |
| "step": 210, |
| "valid_targets_mean": 3340.0, |
| "valid_targets_min": 1014 |
| }, |
| { |
| "epoch": 0.3284950343773873, |
| "grad_norm": 0.7587944111803762, |
| "learning_rate": 1.8649237472766885e-05, |
| "loss": 0.6271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2620357275009155, |
| "step": 215, |
| "valid_targets_mean": 2859.0, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 0.33613445378151263, |
| "grad_norm": 0.7364341217962659, |
| "learning_rate": 1.908496732026144e-05, |
| "loss": 0.6122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3173060417175293, |
| "step": 220, |
| "valid_targets_mean": 3238.9, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 0.3437738731856379, |
| "grad_norm": 0.6987727914802906, |
| "learning_rate": 1.9520697167755993e-05, |
| "loss": 0.6125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30513855814933777, |
| "step": 225, |
| "valid_targets_mean": 3986.5, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 0.35141329258976317, |
| "grad_norm": 0.7226588989043562, |
| "learning_rate": 1.9956427015250545e-05, |
| "loss": 0.6279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33299773931503296, |
| "step": 230, |
| "valid_targets_mean": 3696.0, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 0.35905271199388844, |
| "grad_norm": 0.8158650358729972, |
| "learning_rate": 2.0392156862745097e-05, |
| "loss": 0.6654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32044363021850586, |
| "step": 235, |
| "valid_targets_mean": 3097.4, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 0.36669213139801377, |
| "grad_norm": 0.7088614261293413, |
| "learning_rate": 2.0827886710239653e-05, |
| "loss": 0.6017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2543582618236542, |
| "step": 240, |
| "valid_targets_mean": 2256.9, |
| "valid_targets_min": 1559 |
| }, |
| { |
| "epoch": 0.37433155080213903, |
| "grad_norm": 0.6151357812054147, |
| "learning_rate": 2.126361655773421e-05, |
| "loss": 0.6515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1985795795917511, |
| "step": 245, |
| "valid_targets_mean": 3318.6, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 0.3819709702062643, |
| "grad_norm": 0.7937566667562097, |
| "learning_rate": 2.1699346405228758e-05, |
| "loss": 0.6187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3406463861465454, |
| "step": 250, |
| "valid_targets_mean": 3448.1, |
| "valid_targets_min": 2067 |
| }, |
| { |
| "epoch": 0.38961038961038963, |
| "grad_norm": 0.6298445900787324, |
| "learning_rate": 2.2135076252723313e-05, |
| "loss": 0.5786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29489225149154663, |
| "step": 255, |
| "valid_targets_mean": 3681.2, |
| "valid_targets_min": 1220 |
| }, |
| { |
| "epoch": 0.3972498090145149, |
| "grad_norm": 0.8201725710279596, |
| "learning_rate": 2.257080610021787e-05, |
| "loss": 0.6133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3263534903526306, |
| "step": 260, |
| "valid_targets_mean": 3468.8, |
| "valid_targets_min": 466 |
| }, |
| { |
| "epoch": 0.40488922841864017, |
| "grad_norm": 0.7501412935238757, |
| "learning_rate": 2.3006535947712418e-05, |
| "loss": 0.6471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30918407440185547, |
| "step": 265, |
| "valid_targets_mean": 4111.1, |
| "valid_targets_min": 1461 |
| }, |
| { |
| "epoch": 0.4125286478227655, |
| "grad_norm": 0.7932880947679686, |
| "learning_rate": 2.3442265795206974e-05, |
| "loss": 0.635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38556236028671265, |
| "step": 270, |
| "valid_targets_mean": 3402.2, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 0.42016806722689076, |
| "grad_norm": 0.7336631307032824, |
| "learning_rate": 2.387799564270153e-05, |
| "loss": 0.6027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2884320020675659, |
| "step": 275, |
| "valid_targets_mean": 3283.2, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 0.42780748663101603, |
| "grad_norm": 0.7987572249200825, |
| "learning_rate": 2.431372549019608e-05, |
| "loss": 0.5793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.303595632314682, |
| "step": 280, |
| "valid_targets_mean": 3274.4, |
| "valid_targets_min": 1782 |
| }, |
| { |
| "epoch": 0.43544690603514136, |
| "grad_norm": 0.7921872393026232, |
| "learning_rate": 2.4749455337690634e-05, |
| "loss": 0.6192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34139686822891235, |
| "step": 285, |
| "valid_targets_mean": 3101.2, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 0.4430863254392666, |
| "grad_norm": 0.745571535038673, |
| "learning_rate": 2.5185185185185187e-05, |
| "loss": 0.628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32645875215530396, |
| "step": 290, |
| "valid_targets_mean": 3515.2, |
| "valid_targets_min": 608 |
| }, |
| { |
| "epoch": 0.4507257448433919, |
| "grad_norm": 0.7733455760458197, |
| "learning_rate": 2.562091503267974e-05, |
| "loss": 0.6153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41803407669067383, |
| "step": 295, |
| "valid_targets_mean": 3754.2, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 0.45836516424751717, |
| "grad_norm": 0.8925987187590559, |
| "learning_rate": 2.6056644880174295e-05, |
| "loss": 0.6203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3707024157047272, |
| "step": 300, |
| "valid_targets_mean": 2850.6, |
| "valid_targets_min": 1689 |
| }, |
| { |
| "epoch": 0.4660045836516425, |
| "grad_norm": 0.8036647475977927, |
| "learning_rate": 2.6492374727668847e-05, |
| "loss": 0.6258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2339508831501007, |
| "step": 305, |
| "valid_targets_mean": 2463.9, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 0.47364400305576776, |
| "grad_norm": 0.7031610335825725, |
| "learning_rate": 2.6928104575163403e-05, |
| "loss": 0.6027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25344857573509216, |
| "step": 310, |
| "valid_targets_mean": 2872.8, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 0.48128342245989303, |
| "grad_norm": 0.7480718215833951, |
| "learning_rate": 2.736383442265795e-05, |
| "loss": 0.6064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21547476947307587, |
| "step": 315, |
| "valid_targets_mean": 2392.2, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 0.48892284186401835, |
| "grad_norm": 0.8331408619239437, |
| "learning_rate": 2.7799564270152507e-05, |
| "loss": 0.6047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2768464684486389, |
| "step": 320, |
| "valid_targets_mean": 2553.5, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 0.4965622612681436, |
| "grad_norm": 0.8087367473209722, |
| "learning_rate": 2.8235294117647063e-05, |
| "loss": 0.6213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26989734172821045, |
| "step": 325, |
| "valid_targets_mean": 3067.9, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 0.5042016806722689, |
| "grad_norm": 0.7776781031068692, |
| "learning_rate": 2.8671023965141612e-05, |
| "loss": 0.5847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27393457293510437, |
| "step": 330, |
| "valid_targets_mean": 2845.4, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 0.5118411000763942, |
| "grad_norm": 0.8248214347980428, |
| "learning_rate": 2.9106753812636168e-05, |
| "loss": 0.6142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2886251211166382, |
| "step": 335, |
| "valid_targets_mean": 3156.9, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 0.5194805194805194, |
| "grad_norm": 0.7871145452467468, |
| "learning_rate": 2.9542483660130724e-05, |
| "loss": 0.6064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22021612524986267, |
| "step": 340, |
| "valid_targets_mean": 1920.1, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 0.5271199388846448, |
| "grad_norm": 0.6598524132491371, |
| "learning_rate": 2.9978213507625272e-05, |
| "loss": 0.5969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3316832184791565, |
| "step": 345, |
| "valid_targets_mean": 4670.0, |
| "valid_targets_min": 1362 |
| }, |
| { |
| "epoch": 0.5347593582887701, |
| "grad_norm": 0.7714969570983577, |
| "learning_rate": 3.0413943355119828e-05, |
| "loss": 0.5802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3330127000808716, |
| "step": 350, |
| "valid_targets_mean": 3081.5, |
| "valid_targets_min": 1703 |
| }, |
| { |
| "epoch": 0.5423987776928954, |
| "grad_norm": 0.7754477862247269, |
| "learning_rate": 3.0849673202614384e-05, |
| "loss": 0.6115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28545576333999634, |
| "step": 355, |
| "valid_targets_mean": 2166.5, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 0.5500381970970206, |
| "grad_norm": 0.9165516616675281, |
| "learning_rate": 3.1285403050108936e-05, |
| "loss": 0.5981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3413655459880829, |
| "step": 360, |
| "valid_targets_mean": 2802.4, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 0.5576776165011459, |
| "grad_norm": 0.7628767779169452, |
| "learning_rate": 3.172113289760349e-05, |
| "loss": 0.5909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37848758697509766, |
| "step": 365, |
| "valid_targets_mean": 3536.0, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 0.5653170359052712, |
| "grad_norm": 0.6456443237893429, |
| "learning_rate": 3.215686274509804e-05, |
| "loss": 0.5739, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23117348551750183, |
| "step": 370, |
| "valid_targets_mean": 3513.4, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 0.5729564553093965, |
| "grad_norm": 0.7131390860118433, |
| "learning_rate": 3.259259259259259e-05, |
| "loss": 0.5903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28896501660346985, |
| "step": 375, |
| "valid_targets_mean": 3813.5, |
| "valid_targets_min": 1767 |
| }, |
| { |
| "epoch": 0.5805958747135218, |
| "grad_norm": 0.7059247357677485, |
| "learning_rate": 3.3028322440087146e-05, |
| "loss": 0.5981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2769196033477783, |
| "step": 380, |
| "valid_targets_mean": 3733.4, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 0.5882352941176471, |
| "grad_norm": 0.7099487325643025, |
| "learning_rate": 3.3464052287581705e-05, |
| "loss": 0.574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2509758472442627, |
| "step": 385, |
| "valid_targets_mean": 3110.4, |
| "valid_targets_min": 1557 |
| }, |
| { |
| "epoch": 0.5958747135217723, |
| "grad_norm": 0.73751067378954, |
| "learning_rate": 3.389978213507625e-05, |
| "loss": 0.5929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2418426275253296, |
| "step": 390, |
| "valid_targets_mean": 2331.1, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 0.6035141329258976, |
| "grad_norm": 0.6947985101021568, |
| "learning_rate": 3.433551198257081e-05, |
| "loss": 0.6145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24075086414813995, |
| "step": 395, |
| "valid_targets_mean": 3555.6, |
| "valid_targets_min": 1443 |
| }, |
| { |
| "epoch": 0.6111535523300229, |
| "grad_norm": 0.6913463347195935, |
| "learning_rate": 3.477124183006536e-05, |
| "loss": 0.5987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3037499189376831, |
| "step": 400, |
| "valid_targets_mean": 4055.1, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 0.6187929717341482, |
| "grad_norm": 0.790293928960079, |
| "learning_rate": 3.5206971677559914e-05, |
| "loss": 0.572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2849627733230591, |
| "step": 405, |
| "valid_targets_mean": 3600.0, |
| "valid_targets_min": 2347 |
| }, |
| { |
| "epoch": 0.6264323911382735, |
| "grad_norm": 0.7315439623965397, |
| "learning_rate": 3.5642701525054466e-05, |
| "loss": 0.5668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3170517086982727, |
| "step": 410, |
| "valid_targets_mean": 3977.9, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 0.6340718105423988, |
| "grad_norm": 0.7687583162677026, |
| "learning_rate": 3.6078431372549025e-05, |
| "loss": 0.6283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3087868094444275, |
| "step": 415, |
| "valid_targets_mean": 2945.9, |
| "valid_targets_min": 1360 |
| }, |
| { |
| "epoch": 0.6417112299465241, |
| "grad_norm": 0.7628238951175478, |
| "learning_rate": 3.651416122004358e-05, |
| "loss": 0.5964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33389556407928467, |
| "step": 420, |
| "valid_targets_mean": 3730.8, |
| "valid_targets_min": 1417 |
| }, |
| { |
| "epoch": 0.6493506493506493, |
| "grad_norm": 0.6695423107998377, |
| "learning_rate": 3.694989106753813e-05, |
| "loss": 0.5885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22009310126304626, |
| "step": 425, |
| "valid_targets_mean": 3358.6, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 0.6569900687547746, |
| "grad_norm": 0.82620661841163, |
| "learning_rate": 3.738562091503268e-05, |
| "loss": 0.5811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26666954159736633, |
| "step": 430, |
| "valid_targets_mean": 2360.4, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 0.6646294881588999, |
| "grad_norm": 0.6929939957736985, |
| "learning_rate": 3.7821350762527235e-05, |
| "loss": 0.5774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22594678401947021, |
| "step": 435, |
| "valid_targets_mean": 2447.9, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 0.6722689075630253, |
| "grad_norm": 0.7019484401785123, |
| "learning_rate": 3.825708061002179e-05, |
| "loss": 0.5808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3131728768348694, |
| "step": 440, |
| "valid_targets_mean": 3665.8, |
| "valid_targets_min": 253 |
| }, |
| { |
| "epoch": 0.6799083269671505, |
| "grad_norm": 0.6685256141352108, |
| "learning_rate": 3.8692810457516346e-05, |
| "loss": 0.5552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2552865147590637, |
| "step": 445, |
| "valid_targets_mean": 3354.5, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 0.6875477463712758, |
| "grad_norm": 0.7265392876508043, |
| "learning_rate": 3.91285403050109e-05, |
| "loss": 0.5729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2652282118797302, |
| "step": 450, |
| "valid_targets_mean": 2713.8, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 0.6951871657754011, |
| "grad_norm": 0.6360107272199381, |
| "learning_rate": 3.956427015250545e-05, |
| "loss": 0.6083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2762466073036194, |
| "step": 455, |
| "valid_targets_mean": 4311.1, |
| "valid_targets_min": 1273 |
| }, |
| { |
| "epoch": 0.7028265851795263, |
| "grad_norm": 0.671880392414106, |
| "learning_rate": 4e-05, |
| "loss": 0.5937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2647872865200043, |
| "step": 460, |
| "valid_targets_mean": 3698.0, |
| "valid_targets_min": 1609 |
| }, |
| { |
| "epoch": 0.7104660045836516, |
| "grad_norm": 0.6591072439688226, |
| "learning_rate": 3.999985506249457e-05, |
| "loss": 0.5958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27107876539230347, |
| "step": 465, |
| "valid_targets_mean": 3154.5, |
| "valid_targets_min": 1080 |
| }, |
| { |
| "epoch": 0.7181054239877769, |
| "grad_norm": 0.779690577173135, |
| "learning_rate": 3.9999420252078994e-05, |
| "loss": 0.5721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27595773339271545, |
| "step": 470, |
| "valid_targets_mean": 3683.6, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 0.7257448433919023, |
| "grad_norm": 0.6772343189565297, |
| "learning_rate": 3.9998695575055276e-05, |
| "loss": 0.5944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38341811299324036, |
| "step": 475, |
| "valid_targets_mean": 4689.9, |
| "valid_targets_min": 1562 |
| }, |
| { |
| "epoch": 0.7333842627960275, |
| "grad_norm": 0.8079543845936882, |
| "learning_rate": 3.9997681041926714e-05, |
| "loss": 0.5551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.338105171918869, |
| "step": 480, |
| "valid_targets_mean": 2228.9, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 0.7410236822001528, |
| "grad_norm": 0.6586142611830866, |
| "learning_rate": 3.99963766673977e-05, |
| "loss": 0.5536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2373753786087036, |
| "step": 485, |
| "valid_targets_mean": 3322.0, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 0.7486631016042781, |
| "grad_norm": 0.7147237521146843, |
| "learning_rate": 3.999478247037352e-05, |
| "loss": 0.5756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3543473482131958, |
| "step": 490, |
| "valid_targets_mean": 4644.6, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 0.7563025210084033, |
| "grad_norm": 0.7867926605712047, |
| "learning_rate": 3.999289847396006e-05, |
| "loss": 0.6146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33008497953414917, |
| "step": 495, |
| "valid_targets_mean": 3087.8, |
| "valid_targets_min": 1208 |
| }, |
| { |
| "epoch": 0.7639419404125286, |
| "grad_norm": 0.6172355973475613, |
| "learning_rate": 3.9990724705463495e-05, |
| "loss": 0.5805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37864190340042114, |
| "step": 500, |
| "valid_targets_mean": 5465.1, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 0.771581359816654, |
| "grad_norm": 0.7480683025973461, |
| "learning_rate": 3.998826119638989e-05, |
| "loss": 0.5759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2788500487804413, |
| "step": 505, |
| "valid_targets_mean": 3069.6, |
| "valid_targets_min": 1494 |
| }, |
| { |
| "epoch": 0.7792207792207793, |
| "grad_norm": 0.7137435243602375, |
| "learning_rate": 3.998550798244472e-05, |
| "loss": 0.5894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3722362518310547, |
| "step": 510, |
| "valid_targets_mean": 3935.2, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 0.7868601986249045, |
| "grad_norm": 0.7133729047894137, |
| "learning_rate": 3.9982465103532386e-05, |
| "loss": 0.5479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29172253608703613, |
| "step": 515, |
| "valid_targets_mean": 3255.4, |
| "valid_targets_min": 1224 |
| }, |
| { |
| "epoch": 0.7944996180290298, |
| "grad_norm": 0.8123949372956061, |
| "learning_rate": 3.997913260375562e-05, |
| "loss": 0.5928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29111629724502563, |
| "step": 520, |
| "valid_targets_mean": 2608.0, |
| "valid_targets_min": 1413 |
| }, |
| { |
| "epoch": 0.8021390374331551, |
| "grad_norm": 0.7607753286866613, |
| "learning_rate": 3.9975510531414835e-05, |
| "loss": 0.5838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3003314435482025, |
| "step": 525, |
| "valid_targets_mean": 3636.6, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 0.8097784568372803, |
| "grad_norm": 0.7593775820169156, |
| "learning_rate": 3.997159893900745e-05, |
| "loss": 0.5411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2764055132865906, |
| "step": 530, |
| "valid_targets_mean": 2633.2, |
| "valid_targets_min": 1343 |
| }, |
| { |
| "epoch": 0.8174178762414056, |
| "grad_norm": 0.7550291803600192, |
| "learning_rate": 3.9967397883227104e-05, |
| "loss": 0.5935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2789875566959381, |
| "step": 535, |
| "valid_targets_mean": 2900.9, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 0.825057295645531, |
| "grad_norm": 0.6099292035548061, |
| "learning_rate": 3.9962907424962856e-05, |
| "loss": 0.5777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2896302044391632, |
| "step": 540, |
| "valid_targets_mean": 4579.8, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 0.8326967150496563, |
| "grad_norm": 0.6670417720845128, |
| "learning_rate": 3.995812762929829e-05, |
| "loss": 0.6051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20029598474502563, |
| "step": 545, |
| "valid_targets_mean": 2811.9, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 0.8403361344537815, |
| "grad_norm": 0.9488128832161037, |
| "learning_rate": 3.995305856551057e-05, |
| "loss": 0.5861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22825755178928375, |
| "step": 550, |
| "valid_targets_mean": 2501.6, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 0.8479755538579068, |
| "grad_norm": 0.6086366642647173, |
| "learning_rate": 3.994770030706944e-05, |
| "loss": 0.5494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3427432179450989, |
| "step": 555, |
| "valid_targets_mean": 5665.4, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 0.8556149732620321, |
| "grad_norm": 0.70513202037968, |
| "learning_rate": 3.994205293163616e-05, |
| "loss": 0.5937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29944777488708496, |
| "step": 560, |
| "valid_targets_mean": 3229.2, |
| "valid_targets_min": 1980 |
| }, |
| { |
| "epoch": 0.8632543926661573, |
| "grad_norm": 0.9851639022765896, |
| "learning_rate": 3.9936116521062376e-05, |
| "loss": 0.5482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28550928831100464, |
| "step": 565, |
| "valid_targets_mean": 3211.6, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 0.8708938120702827, |
| "grad_norm": 0.7534779579928215, |
| "learning_rate": 3.992989116138895e-05, |
| "loss": 0.5766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2996383011341095, |
| "step": 570, |
| "valid_targets_mean": 3115.0, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 0.878533231474408, |
| "grad_norm": 0.7458527629855309, |
| "learning_rate": 3.99233769428447e-05, |
| "loss": 0.5918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23829689621925354, |
| "step": 575, |
| "valid_targets_mean": 2372.4, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 0.8861726508785333, |
| "grad_norm": 0.7068928044009853, |
| "learning_rate": 3.991657395984507e-05, |
| "loss": 0.5691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30755138397216797, |
| "step": 580, |
| "valid_targets_mean": 3072.1, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 0.8938120702826585, |
| "grad_norm": 0.7004756487633861, |
| "learning_rate": 3.99094823109908e-05, |
| "loss": 0.602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21224084496498108, |
| "step": 585, |
| "valid_targets_mean": 2138.5, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 0.9014514896867838, |
| "grad_norm": 0.681477572048519, |
| "learning_rate": 3.990210209906649e-05, |
| "loss": 0.5667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23268462717533112, |
| "step": 590, |
| "valid_targets_mean": 3107.2, |
| "valid_targets_min": 2053 |
| }, |
| { |
| "epoch": 0.9090909090909091, |
| "grad_norm": 1.0438675359941987, |
| "learning_rate": 3.989443343103908e-05, |
| "loss": 0.5745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3275293707847595, |
| "step": 595, |
| "valid_targets_mean": 3463.5, |
| "valid_targets_min": 1444 |
| }, |
| { |
| "epoch": 0.9167303284950343, |
| "grad_norm": 0.7400160340371931, |
| "learning_rate": 3.9886476418056336e-05, |
| "loss": 0.5671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3153223991394043, |
| "step": 600, |
| "valid_targets_mean": 3044.6, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 0.9243697478991597, |
| "grad_norm": 0.6652294370667957, |
| "learning_rate": 3.987823117544522e-05, |
| "loss": 0.5372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.389309823513031, |
| "step": 605, |
| "valid_targets_mean": 4362.6, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 0.932009167303285, |
| "grad_norm": 0.6212675682208829, |
| "learning_rate": 3.986969782271022e-05, |
| "loss": 0.5665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21082836389541626, |
| "step": 610, |
| "valid_targets_mean": 3255.6, |
| "valid_targets_min": 1697 |
| }, |
| { |
| "epoch": 0.9396485867074102, |
| "grad_norm": 0.6862137461635358, |
| "learning_rate": 3.986087648353162e-05, |
| "loss": 0.6083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2789027988910675, |
| "step": 615, |
| "valid_targets_mean": 2877.1, |
| "valid_targets_min": 469 |
| }, |
| { |
| "epoch": 0.9472880061115355, |
| "grad_norm": 0.6028470891869618, |
| "learning_rate": 3.985176728576371e-05, |
| "loss": 0.5559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2874605655670166, |
| "step": 620, |
| "valid_targets_mean": 4492.4, |
| "valid_targets_min": 2143 |
| }, |
| { |
| "epoch": 0.9549274255156608, |
| "grad_norm": 0.7101556487572386, |
| "learning_rate": 3.984237036143293e-05, |
| "loss": 0.5598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23973211646080017, |
| "step": 625, |
| "valid_targets_mean": 2781.4, |
| "valid_targets_min": 1607 |
| }, |
| { |
| "epoch": 0.9625668449197861, |
| "grad_norm": 0.6406876645725995, |
| "learning_rate": 3.9832685846735965e-05, |
| "loss": 0.5471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23441874980926514, |
| "step": 630, |
| "valid_targets_mean": 3437.4, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 0.9702062643239114, |
| "grad_norm": 0.8179086861154274, |
| "learning_rate": 3.982271388203775e-05, |
| "loss": 0.601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24605703353881836, |
| "step": 635, |
| "valid_targets_mean": 2201.5, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 0.9778456837280367, |
| "grad_norm": 0.7379654548504041, |
| "learning_rate": 3.981245461186945e-05, |
| "loss": 0.5831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2373408079147339, |
| "step": 640, |
| "valid_targets_mean": 1922.5, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 0.985485103132162, |
| "grad_norm": 0.6325975201384703, |
| "learning_rate": 3.980190818492637e-05, |
| "loss": 0.563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22413653135299683, |
| "step": 645, |
| "valid_targets_mean": 2914.0, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 0.9931245225362872, |
| "grad_norm": 0.7202033071183617, |
| "learning_rate": 3.979107475406579e-05, |
| "loss": 0.6126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4340353012084961, |
| "step": 650, |
| "valid_targets_mean": 3802.1, |
| "valid_targets_min": 1421 |
| }, |
| { |
| "epoch": 1.0, |
| "grad_norm": 1.1116558746504048, |
| "learning_rate": 3.977995447630475e-05, |
| "loss": 0.5592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5354721546173096, |
| "step": 655, |
| "valid_targets_mean": 2106.2, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 1.0076394194041254, |
| "grad_norm": 0.6522118231154711, |
| "learning_rate": 3.9768547512817794e-05, |
| "loss": 0.5855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2696242332458496, |
| "step": 660, |
| "valid_targets_mean": 2601.8, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 1.0152788388082505, |
| "grad_norm": 0.7282006050891634, |
| "learning_rate": 3.9756854028934604e-05, |
| "loss": 0.5707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30138200521469116, |
| "step": 665, |
| "valid_targets_mean": 3397.9, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 1.022918258212376, |
| "grad_norm": 0.6705684638682171, |
| "learning_rate": 3.974487419413761e-05, |
| "loss": 0.5371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26151737570762634, |
| "step": 670, |
| "valid_targets_mean": 3653.8, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 1.030557677616501, |
| "grad_norm": 0.723948374365064, |
| "learning_rate": 3.973260818205955e-05, |
| "loss": 0.5463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3313744366168976, |
| "step": 675, |
| "valid_targets_mean": 3186.4, |
| "valid_targets_min": 1538 |
| }, |
| { |
| "epoch": 1.0381970970206265, |
| "grad_norm": 0.7836642368648493, |
| "learning_rate": 3.972005617048094e-05, |
| "loss": 0.5226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37249183654785156, |
| "step": 680, |
| "valid_targets_mean": 3745.6, |
| "valid_targets_min": 1744 |
| }, |
| { |
| "epoch": 1.0458365164247516, |
| "grad_norm": 0.6689920597254674, |
| "learning_rate": 3.970721834132751e-05, |
| "loss": 0.5186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.237932026386261, |
| "step": 685, |
| "valid_targets_mean": 2938.4, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 1.053475935828877, |
| "grad_norm": 0.6766713408339188, |
| "learning_rate": 3.969409488066756e-05, |
| "loss": 0.5645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27513009309768677, |
| "step": 690, |
| "valid_targets_mean": 3106.2, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 1.0611153552330024, |
| "grad_norm": 0.7249242616575575, |
| "learning_rate": 3.9680685978709254e-05, |
| "loss": 0.5285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3080906271934509, |
| "step": 695, |
| "valid_targets_mean": 3352.1, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 1.0687547746371275, |
| "grad_norm": 0.6371623942622592, |
| "learning_rate": 3.966699182979785e-05, |
| "loss": 0.5529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2962953448295593, |
| "step": 700, |
| "valid_targets_mean": 4250.9, |
| "valid_targets_min": 1290 |
| }, |
| { |
| "epoch": 1.076394194041253, |
| "grad_norm": 0.7676470422260585, |
| "learning_rate": 3.965301263241296e-05, |
| "loss": 0.5641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2619950473308563, |
| "step": 705, |
| "valid_targets_mean": 2716.8, |
| "valid_targets_min": 1882 |
| }, |
| { |
| "epoch": 1.084033613445378, |
| "grad_norm": 0.6587402474304499, |
| "learning_rate": 3.963874858916556e-05, |
| "loss": 0.5408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28987687826156616, |
| "step": 710, |
| "valid_targets_mean": 3787.6, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 1.0916730328495035, |
| "grad_norm": 0.6913158304836163, |
| "learning_rate": 3.9624199906795136e-05, |
| "loss": 0.5436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28918856382369995, |
| "step": 715, |
| "valid_targets_mean": 4839.6, |
| "valid_targets_min": 1376 |
| }, |
| { |
| "epoch": 1.0993124522536286, |
| "grad_norm": 0.703709027064511, |
| "learning_rate": 3.960936679616667e-05, |
| "loss": 0.5102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26379460096359253, |
| "step": 720, |
| "valid_targets_mean": 3043.2, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 1.106951871657754, |
| "grad_norm": 0.5380096123166979, |
| "learning_rate": 3.959424947226756e-05, |
| "loss": 0.5143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24659261107444763, |
| "step": 725, |
| "valid_targets_mean": 4539.6, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 1.1145912910618794, |
| "grad_norm": 0.6464956071511203, |
| "learning_rate": 3.957884815420453e-05, |
| "loss": 0.5857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19127747416496277, |
| "step": 730, |
| "valid_targets_mean": 2436.2, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 1.1222307104660045, |
| "grad_norm": 0.7029816183033232, |
| "learning_rate": 3.956316306520044e-05, |
| "loss": 0.5619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28624215722084045, |
| "step": 735, |
| "valid_targets_mean": 3306.8, |
| "valid_targets_min": 1178 |
| }, |
| { |
| "epoch": 1.12987012987013, |
| "grad_norm": 0.6838882183908288, |
| "learning_rate": 3.9547194432591066e-05, |
| "loss": 0.5111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3031734824180603, |
| "step": 740, |
| "valid_targets_mean": 3253.0, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 1.137509549274255, |
| "grad_norm": 0.6539220963516174, |
| "learning_rate": 3.9530942487821785e-05, |
| "loss": 0.5282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22544610500335693, |
| "step": 745, |
| "valid_targets_mean": 2679.9, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 1.1451489686783805, |
| "grad_norm": 0.6232994419948458, |
| "learning_rate": 3.951440746644422e-05, |
| "loss": 0.5659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22838760912418365, |
| "step": 750, |
| "valid_targets_mean": 3408.6, |
| "valid_targets_min": 1703 |
| }, |
| { |
| "epoch": 1.1527883880825058, |
| "grad_norm": 0.7040726919722308, |
| "learning_rate": 3.949758960811284e-05, |
| "loss": 0.5475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23174643516540527, |
| "step": 755, |
| "valid_targets_mean": 2185.2, |
| "valid_targets_min": 430 |
| }, |
| { |
| "epoch": 1.160427807486631, |
| "grad_norm": 0.6789214431654883, |
| "learning_rate": 3.9480489156581514e-05, |
| "loss": 0.521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28578507900238037, |
| "step": 760, |
| "valid_targets_mean": 3754.8, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 1.1680672268907564, |
| "grad_norm": 0.7733782691321108, |
| "learning_rate": 3.94631063596999e-05, |
| "loss": 0.5316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2440919578075409, |
| "step": 765, |
| "valid_targets_mean": 2929.8, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 1.1757066462948815, |
| "grad_norm": 0.6473357152162962, |
| "learning_rate": 3.9445441469409924e-05, |
| "loss": 0.5058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3352232277393341, |
| "step": 770, |
| "valid_targets_mean": 4502.8, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 1.183346065699007, |
| "grad_norm": 0.7669883434486255, |
| "learning_rate": 3.94274947417421e-05, |
| "loss": 0.5436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27057844400405884, |
| "step": 775, |
| "valid_targets_mean": 3110.5, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 1.190985485103132, |
| "grad_norm": 0.7542936395101697, |
| "learning_rate": 3.9409266436811824e-05, |
| "loss": 0.5254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21778935194015503, |
| "step": 780, |
| "valid_targets_mean": 4820.9, |
| "valid_targets_min": 2305 |
| }, |
| { |
| "epoch": 1.1986249045072574, |
| "grad_norm": 0.7606927697328497, |
| "learning_rate": 3.9390756818815605e-05, |
| "loss": 0.5343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33282411098480225, |
| "step": 785, |
| "valid_targets_mean": 2609.5, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 1.2062643239113828, |
| "grad_norm": 0.7384013328069043, |
| "learning_rate": 3.937196615602722e-05, |
| "loss": 0.5432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34026217460632324, |
| "step": 790, |
| "valid_targets_mean": 3617.6, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 1.213903743315508, |
| "grad_norm": 0.7436645557686744, |
| "learning_rate": 3.9352894720793844e-05, |
| "loss": 0.5174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2270776778459549, |
| "step": 795, |
| "valid_targets_mean": 2522.6, |
| "valid_targets_min": 1883 |
| }, |
| { |
| "epoch": 1.2215431627196334, |
| "grad_norm": 0.7123365313732616, |
| "learning_rate": 3.9333542789532116e-05, |
| "loss": 0.5672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3193785548210144, |
| "step": 800, |
| "valid_targets_mean": 3023.6, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 1.2291825821237585, |
| "grad_norm": 0.7643663765177652, |
| "learning_rate": 3.9313910642724084e-05, |
| "loss": 0.518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1887185126543045, |
| "step": 805, |
| "valid_targets_mean": 1951.9, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 1.236822001527884, |
| "grad_norm": 0.6346468679822354, |
| "learning_rate": 3.92939985649132e-05, |
| "loss": 0.5205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29271286725997925, |
| "step": 810, |
| "valid_targets_mean": 4557.6, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 1.244461420932009, |
| "grad_norm": 0.6343394889103051, |
| "learning_rate": 3.927380684470016e-05, |
| "loss": 0.5072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1973128616809845, |
| "step": 815, |
| "valid_targets_mean": 2726.2, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 1.2521008403361344, |
| "grad_norm": 0.6630789556378238, |
| "learning_rate": 3.9253335774738693e-05, |
| "loss": 0.5256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32815930247306824, |
| "step": 820, |
| "valid_targets_mean": 3497.5, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 1.2597402597402598, |
| "grad_norm": 0.6526796753186936, |
| "learning_rate": 3.92325856517314e-05, |
| "loss": 0.5265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2999138832092285, |
| "step": 825, |
| "valid_targets_mean": 3903.5, |
| "valid_targets_min": 1335 |
| }, |
| { |
| "epoch": 1.267379679144385, |
| "grad_norm": 0.7827981591665036, |
| "learning_rate": 3.9211556776425374e-05, |
| "loss": 0.5689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3150915205478668, |
| "step": 830, |
| "valid_targets_mean": 2640.9, |
| "valid_targets_min": 1350 |
| }, |
| { |
| "epoch": 1.2750190985485104, |
| "grad_norm": 0.7247020902846159, |
| "learning_rate": 3.919024945360791e-05, |
| "loss": 0.5661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33880436420440674, |
| "step": 835, |
| "valid_targets_mean": 3613.6, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 1.2826585179526355, |
| "grad_norm": 0.6163344529726824, |
| "learning_rate": 3.916866399210201e-05, |
| "loss": 0.5022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2479287087917328, |
| "step": 840, |
| "valid_targets_mean": 3889.8, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 1.290297937356761, |
| "grad_norm": 0.5806538155279558, |
| "learning_rate": 3.9146800704761976e-05, |
| "loss": 0.5273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31038084626197815, |
| "step": 845, |
| "valid_targets_mean": 4618.4, |
| "valid_targets_min": 1615 |
| }, |
| { |
| "epoch": 1.2979373567608863, |
| "grad_norm": 0.6961922232392995, |
| "learning_rate": 3.912465990846884e-05, |
| "loss": 0.539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.347188800573349, |
| "step": 850, |
| "valid_targets_mean": 3624.2, |
| "valid_targets_min": 1515 |
| }, |
| { |
| "epoch": 1.3055767761650114, |
| "grad_norm": 0.710377247785307, |
| "learning_rate": 3.910224192412578e-05, |
| "loss": 0.542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3642812967300415, |
| "step": 855, |
| "valid_targets_mean": 3940.1, |
| "valid_targets_min": 1113 |
| }, |
| { |
| "epoch": 1.3132161955691368, |
| "grad_norm": 0.7270203911442068, |
| "learning_rate": 3.9079547076653466e-05, |
| "loss": 0.5641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16767947375774384, |
| "step": 860, |
| "valid_targets_mean": 1617.4, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 1.320855614973262, |
| "grad_norm": 0.6324169969165148, |
| "learning_rate": 3.9056575694985356e-05, |
| "loss": 0.5432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20532405376434326, |
| "step": 865, |
| "valid_targets_mean": 3589.0, |
| "valid_targets_min": 1289 |
| }, |
| { |
| "epoch": 1.3284950343773874, |
| "grad_norm": 0.8074126717640064, |
| "learning_rate": 3.903332811206293e-05, |
| "loss": 0.5787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3212442398071289, |
| "step": 870, |
| "valid_targets_mean": 3137.5, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 1.3361344537815127, |
| "grad_norm": 0.6871709684384119, |
| "learning_rate": 3.900980466483085e-05, |
| "loss": 0.5364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2149738073348999, |
| "step": 875, |
| "valid_targets_mean": 2576.8, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 1.343773873185638, |
| "grad_norm": 0.6932421836403329, |
| "learning_rate": 3.89860056942321e-05, |
| "loss": 0.5189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2367231249809265, |
| "step": 880, |
| "valid_targets_mean": 2527.0, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 1.351413292589763, |
| "grad_norm": 0.6497125710859505, |
| "learning_rate": 3.896193154520302e-05, |
| "loss": 0.5318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3200853168964386, |
| "step": 885, |
| "valid_targets_mean": 4165.2, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 1.3590527119938884, |
| "grad_norm": 0.7278203456258373, |
| "learning_rate": 3.8937582566668324e-05, |
| "loss": 0.515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1707996428012848, |
| "step": 890, |
| "valid_targets_mean": 2198.4, |
| "valid_targets_min": 1103 |
| }, |
| { |
| "epoch": 1.3666921313980138, |
| "grad_norm": 0.6901081116464821, |
| "learning_rate": 3.891295911153601e-05, |
| "loss": 0.5303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2586451470851898, |
| "step": 895, |
| "valid_targets_mean": 3480.6, |
| "valid_targets_min": 496 |
| }, |
| { |
| "epoch": 1.374331550802139, |
| "grad_norm": 0.75802472802529, |
| "learning_rate": 3.888806153669233e-05, |
| "loss": 0.5403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3226444125175476, |
| "step": 900, |
| "valid_targets_mean": 3047.5, |
| "valid_targets_min": 1296 |
| }, |
| { |
| "epoch": 1.3819709702062644, |
| "grad_norm": 0.7026070572178644, |
| "learning_rate": 3.88628902029965e-05, |
| "loss": 0.5463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2279137670993805, |
| "step": 905, |
| "valid_targets_mean": 2393.0, |
| "valid_targets_min": 970 |
| }, |
| { |
| "epoch": 1.3896103896103895, |
| "grad_norm": 0.7385335795568237, |
| "learning_rate": 3.883744547527555e-05, |
| "loss": 0.5348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23169125616550446, |
| "step": 910, |
| "valid_targets_mean": 2278.2, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 1.397249809014515, |
| "grad_norm": 0.6321022169220797, |
| "learning_rate": 3.881172772231903e-05, |
| "loss": 0.5418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22475971281528473, |
| "step": 915, |
| "valid_targets_mean": 3198.1, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 1.4048892284186403, |
| "grad_norm": 0.61696149669697, |
| "learning_rate": 3.878573731687362e-05, |
| "loss": 0.572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22539305686950684, |
| "step": 920, |
| "valid_targets_mean": 3476.6, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 1.4125286478227654, |
| "grad_norm": 0.7842361184386845, |
| "learning_rate": 3.8759474635637785e-05, |
| "loss": 0.529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2607775926589966, |
| "step": 925, |
| "valid_targets_mean": 2646.8, |
| "valid_targets_min": 469 |
| }, |
| { |
| "epoch": 1.4201680672268908, |
| "grad_norm": 0.7454444565263518, |
| "learning_rate": 3.8732940059256276e-05, |
| "loss": 0.5537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2992340326309204, |
| "step": 930, |
| "valid_targets_mean": 2702.8, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 1.427807486631016, |
| "grad_norm": 0.6734402228717832, |
| "learning_rate": 3.870613397231462e-05, |
| "loss": 0.5306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26427602767944336, |
| "step": 935, |
| "valid_targets_mean": 3468.4, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 1.4354469060351414, |
| "grad_norm": 0.6807817371217704, |
| "learning_rate": 3.867905676333354e-05, |
| "loss": 0.5311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2101900577545166, |
| "step": 940, |
| "valid_targets_mean": 2051.8, |
| "valid_targets_min": 1237 |
| }, |
| { |
| "epoch": 1.4430863254392667, |
| "grad_norm": 0.7057342976825963, |
| "learning_rate": 3.8651708824763384e-05, |
| "loss": 0.5346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1674555391073227, |
| "step": 945, |
| "valid_targets_mean": 2166.4, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 1.450725744843392, |
| "grad_norm": 0.7101649627528165, |
| "learning_rate": 3.862409055297831e-05, |
| "loss": 0.5648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19412991404533386, |
| "step": 950, |
| "valid_targets_mean": 2372.6, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 1.458365164247517, |
| "grad_norm": 0.7124796816451234, |
| "learning_rate": 3.8596202348270695e-05, |
| "loss": 0.525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34211790561676025, |
| "step": 955, |
| "valid_targets_mean": 3600.6, |
| "valid_targets_min": 1749 |
| }, |
| { |
| "epoch": 1.4660045836516424, |
| "grad_norm": 0.6495231524844639, |
| "learning_rate": 3.85680446148452e-05, |
| "loss": 0.5238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2449973225593567, |
| "step": 960, |
| "valid_targets_mean": 3596.6, |
| "valid_targets_min": 1903 |
| }, |
| { |
| "epoch": 1.4736440030557678, |
| "grad_norm": 0.7385068351743556, |
| "learning_rate": 3.853961776081299e-05, |
| "loss": 0.558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2591915726661682, |
| "step": 965, |
| "valid_targets_mean": 2599.1, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 1.481283422459893, |
| "grad_norm": 0.6640970141796577, |
| "learning_rate": 3.8510922198185805e-05, |
| "loss": 0.5318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2822009325027466, |
| "step": 970, |
| "valid_targets_mean": 3411.0, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 1.4889228418640184, |
| "grad_norm": 0.728614551507354, |
| "learning_rate": 3.8481958342869966e-05, |
| "loss": 0.5603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47605425119400024, |
| "step": 975, |
| "valid_targets_mean": 4951.6, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 1.4965622612681435, |
| "grad_norm": 0.5670458089086574, |
| "learning_rate": 3.8452726614660364e-05, |
| "loss": 0.4938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.246848464012146, |
| "step": 980, |
| "valid_targets_mean": 3967.6, |
| "valid_targets_min": 1739 |
| }, |
| { |
| "epoch": 1.504201680672269, |
| "grad_norm": 0.5967985021594041, |
| "learning_rate": 3.8423227437234385e-05, |
| "loss": 0.5159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21474456787109375, |
| "step": 985, |
| "valid_targets_mean": 3238.4, |
| "valid_targets_min": 1693 |
| }, |
| { |
| "epoch": 1.5118411000763943, |
| "grad_norm": 0.5896858060191866, |
| "learning_rate": 3.8393461238145737e-05, |
| "loss": 0.5241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27799534797668457, |
| "step": 990, |
| "valid_targets_mean": 3818.8, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 1.5194805194805194, |
| "grad_norm": 0.6403716120248297, |
| "learning_rate": 3.83634284488183e-05, |
| "loss": 0.5646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.310907781124115, |
| "step": 995, |
| "valid_targets_mean": 4377.5, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 1.5271199388846448, |
| "grad_norm": 0.6576858777363869, |
| "learning_rate": 3.833312950453981e-05, |
| "loss": 0.558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18086987733840942, |
| "step": 1000, |
| "valid_targets_mean": 2679.1, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 1.53475935828877, |
| "grad_norm": 0.6264938830245572, |
| "learning_rate": 3.830256484445562e-05, |
| "loss": 0.5231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24808485805988312, |
| "step": 1005, |
| "valid_targets_mean": 3809.2, |
| "valid_targets_min": 1573 |
| }, |
| { |
| "epoch": 1.5423987776928954, |
| "grad_norm": 0.6947851643347049, |
| "learning_rate": 3.827173491156228e-05, |
| "loss": 0.5597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3576025068759918, |
| "step": 1010, |
| "valid_targets_mean": 3728.4, |
| "valid_targets_min": 1797 |
| }, |
| { |
| "epoch": 1.5500381970970207, |
| "grad_norm": 0.6065532261217823, |
| "learning_rate": 3.824064015270116e-05, |
| "loss": 0.5225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29614564776420593, |
| "step": 1015, |
| "valid_targets_mean": 3743.4, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 1.557677616501146, |
| "grad_norm": 0.737923563809332, |
| "learning_rate": 3.820928101855193e-05, |
| "loss": 0.5736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3168005049228668, |
| "step": 1020, |
| "valid_targets_mean": 2394.5, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 1.565317035905271, |
| "grad_norm": 0.692425445994189, |
| "learning_rate": 3.817765796362606e-05, |
| "loss": 0.518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30288469791412354, |
| "step": 1025, |
| "valid_targets_mean": 3822.5, |
| "valid_targets_min": 1556 |
| }, |
| { |
| "epoch": 1.5729564553093964, |
| "grad_norm": 0.7094886326492358, |
| "learning_rate": 3.814577144626021e-05, |
| "loss": 0.5404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22933900356292725, |
| "step": 1030, |
| "valid_targets_mean": 2317.1, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 1.5805958747135218, |
| "grad_norm": 0.7336132414342458, |
| "learning_rate": 3.811362192860962e-05, |
| "loss": 0.5613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.260783851146698, |
| "step": 1035, |
| "valid_targets_mean": 2234.9, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 1.5882352941176472, |
| "grad_norm": 0.6472450868846049, |
| "learning_rate": 3.808120987664137e-05, |
| "loss": 0.5421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3125843405723572, |
| "step": 1040, |
| "valid_targets_mean": 3125.6, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 1.5958747135217723, |
| "grad_norm": 0.6464488415033857, |
| "learning_rate": 3.804853576012767e-05, |
| "loss": 0.5357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17949353158473969, |
| "step": 1045, |
| "valid_targets_mean": 2726.9, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 1.6035141329258975, |
| "grad_norm": 0.6816461927909948, |
| "learning_rate": 3.8015600052638994e-05, |
| "loss": 0.5328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2890270948410034, |
| "step": 1050, |
| "valid_targets_mean": 2916.8, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 1.6111535523300229, |
| "grad_norm": 0.7078659804169987, |
| "learning_rate": 3.798240323153729e-05, |
| "loss": 0.5186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2691645324230194, |
| "step": 1055, |
| "valid_targets_mean": 2478.0, |
| "valid_targets_min": 1475 |
| }, |
| { |
| "epoch": 1.6187929717341483, |
| "grad_norm": 0.5989882393105532, |
| "learning_rate": 3.7948945777968986e-05, |
| "loss": 0.5433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26992538571357727, |
| "step": 1060, |
| "valid_targets_mean": 3086.0, |
| "valid_targets_min": 1187 |
| }, |
| { |
| "epoch": 1.6264323911382736, |
| "grad_norm": 0.7037135548541353, |
| "learning_rate": 3.7915228176858076e-05, |
| "loss": 0.5291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1986842006444931, |
| "step": 1065, |
| "valid_targets_mean": 2687.5, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 1.6340718105423988, |
| "grad_norm": 0.6048821928261803, |
| "learning_rate": 3.788125091689906e-05, |
| "loss": 0.5656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23728778958320618, |
| "step": 1070, |
| "valid_targets_mean": 3255.9, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 1.641711229946524, |
| "grad_norm": 0.5355816192539666, |
| "learning_rate": 3.7847014490549865e-05, |
| "loss": 0.5188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24673610925674438, |
| "step": 1075, |
| "valid_targets_mean": 4140.5, |
| "valid_targets_min": 1148 |
| }, |
| { |
| "epoch": 1.6493506493506493, |
| "grad_norm": 0.636731420373111, |
| "learning_rate": 3.7812519394024714e-05, |
| "loss": 0.5173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28254377841949463, |
| "step": 1080, |
| "valid_targets_mean": 4065.0, |
| "valid_targets_min": 1622 |
| }, |
| { |
| "epoch": 1.6569900687547747, |
| "grad_norm": 0.584619470678609, |
| "learning_rate": 3.777776612728693e-05, |
| "loss": 0.5399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24916572868824005, |
| "step": 1085, |
| "valid_targets_mean": 3729.6, |
| "valid_targets_min": 1112 |
| }, |
| { |
| "epoch": 1.6646294881588999, |
| "grad_norm": 0.6309053969396224, |
| "learning_rate": 3.77427551940417e-05, |
| "loss": 0.5159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24699068069458008, |
| "step": 1090, |
| "valid_targets_mean": 3228.4, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 1.6722689075630253, |
| "grad_norm": 0.6306346754741646, |
| "learning_rate": 3.770748710172874e-05, |
| "loss": 0.5214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23530437052249908, |
| "step": 1095, |
| "valid_targets_mean": 3177.8, |
| "valid_targets_min": 1167 |
| }, |
| { |
| "epoch": 1.6799083269671504, |
| "grad_norm": 0.6802201791843018, |
| "learning_rate": 3.7671962361515e-05, |
| "loss": 0.5302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31233322620391846, |
| "step": 1100, |
| "valid_targets_mean": 3288.9, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 1.6875477463712758, |
| "grad_norm": 0.7477194331243122, |
| "learning_rate": 3.76361814882872e-05, |
| "loss": 0.516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23209503293037415, |
| "step": 1105, |
| "valid_targets_mean": 2395.2, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 1.6951871657754012, |
| "grad_norm": 0.6286405393933542, |
| "learning_rate": 3.760014500064437e-05, |
| "loss": 0.5525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3077746331691742, |
| "step": 1110, |
| "valid_targets_mean": 4294.1, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 1.7028265851795263, |
| "grad_norm": 0.6815312970337704, |
| "learning_rate": 3.75638534208904e-05, |
| "loss": 0.5417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21405085921287537, |
| "step": 1115, |
| "valid_targets_mean": 2392.6, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 1.7104660045836515, |
| "grad_norm": 0.5689062532951552, |
| "learning_rate": 3.7527307275026375e-05, |
| "loss": 0.4856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.196921706199646, |
| "step": 1120, |
| "valid_targets_mean": 3016.2, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 1.7181054239877769, |
| "grad_norm": 0.4857698883011697, |
| "learning_rate": 3.749050709274303e-05, |
| "loss": 0.5104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22700002789497375, |
| "step": 1125, |
| "valid_targets_mean": 4638.6, |
| "valid_targets_min": 1595 |
| }, |
| { |
| "epoch": 1.7257448433919023, |
| "grad_norm": 0.6172079732872118, |
| "learning_rate": 3.7453453407413017e-05, |
| "loss": 0.5307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24322380125522614, |
| "step": 1130, |
| "valid_targets_mean": 2821.2, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 1.7333842627960276, |
| "grad_norm": 0.6090536328384808, |
| "learning_rate": 3.7416146756083206e-05, |
| "loss": 0.5621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2388569712638855, |
| "step": 1135, |
| "valid_targets_mean": 3844.5, |
| "valid_targets_min": 1783 |
| }, |
| { |
| "epoch": 1.7410236822001528, |
| "grad_norm": 0.5783456560647274, |
| "learning_rate": 3.7378587679466905e-05, |
| "loss": 0.5091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17862531542778015, |
| "step": 1140, |
| "valid_targets_mean": 3060.9, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 1.748663101604278, |
| "grad_norm": 0.5769716592236767, |
| "learning_rate": 3.7340776721936e-05, |
| "loss": 0.5564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37400296330451965, |
| "step": 1145, |
| "valid_targets_mean": 4793.1, |
| "valid_targets_min": 2782 |
| }, |
| { |
| "epoch": 1.7563025210084033, |
| "grad_norm": 0.5706577300432857, |
| "learning_rate": 3.730271443151307e-05, |
| "loss": 0.5301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25871527194976807, |
| "step": 1150, |
| "valid_targets_mean": 3715.6, |
| "valid_targets_min": 1506 |
| }, |
| { |
| "epoch": 1.7639419404125287, |
| "grad_norm": 0.7272691515910408, |
| "learning_rate": 3.726440135986346e-05, |
| "loss": 0.5295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2796229422092438, |
| "step": 1155, |
| "valid_targets_mean": 2538.6, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 1.771581359816654, |
| "grad_norm": 0.6317299325267872, |
| "learning_rate": 3.722583806228727e-05, |
| "loss": 0.5332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30438125133514404, |
| "step": 1160, |
| "valid_targets_mean": 3455.2, |
| "valid_targets_min": 1715 |
| }, |
| { |
| "epoch": 1.7792207792207793, |
| "grad_norm": 0.6091979304515164, |
| "learning_rate": 3.7187025097711325e-05, |
| "loss": 0.5465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19755399227142334, |
| "step": 1165, |
| "valid_targets_mean": 2997.4, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 1.7868601986249044, |
| "grad_norm": 0.7220416396847499, |
| "learning_rate": 3.714796302868105e-05, |
| "loss": 0.5383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3491123914718628, |
| "step": 1170, |
| "valid_targets_mean": 3392.4, |
| "valid_targets_min": 1653 |
| }, |
| { |
| "epoch": 1.7944996180290298, |
| "grad_norm": 0.5964619045278258, |
| "learning_rate": 3.710865242135231e-05, |
| "loss": 0.5371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24358564615249634, |
| "step": 1175, |
| "valid_targets_mean": 3734.4, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 1.8021390374331552, |
| "grad_norm": 0.5873635920467295, |
| "learning_rate": 3.7069093845483265e-05, |
| "loss": 0.5058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24197137355804443, |
| "step": 1180, |
| "valid_targets_mean": 3604.4, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 1.8097784568372803, |
| "grad_norm": 0.6984507077197806, |
| "learning_rate": 3.702928787442603e-05, |
| "loss": 0.506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37548327445983887, |
| "step": 1185, |
| "valid_targets_mean": 3504.6, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 1.8174178762414055, |
| "grad_norm": 0.7830323580644593, |
| "learning_rate": 3.698923508511843e-05, |
| "loss": 0.5523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2729473412036896, |
| "step": 1190, |
| "valid_targets_mean": 2126.0, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 1.8250572956455309, |
| "grad_norm": 0.5967750220721146, |
| "learning_rate": 3.69489360580756e-05, |
| "loss": 0.509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21153341233730316, |
| "step": 1195, |
| "valid_targets_mean": 3077.9, |
| "valid_targets_min": 253 |
| }, |
| { |
| "epoch": 1.8326967150496563, |
| "grad_norm": 0.5605236353838795, |
| "learning_rate": 3.690839137738159e-05, |
| "loss": 0.4913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2955290675163269, |
| "step": 1200, |
| "valid_targets_mean": 4730.1, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 1.8403361344537816, |
| "grad_norm": 0.6085256947878469, |
| "learning_rate": 3.6867601630680866e-05, |
| "loss": 0.555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29254335165023804, |
| "step": 1205, |
| "valid_targets_mean": 4159.6, |
| "valid_targets_min": 1517 |
| }, |
| { |
| "epoch": 1.8479755538579068, |
| "grad_norm": 0.7044349997653415, |
| "learning_rate": 3.682656740916986e-05, |
| "loss": 0.5505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3043631911277771, |
| "step": 1210, |
| "valid_targets_mean": 3770.8, |
| "valid_targets_min": 1189 |
| }, |
| { |
| "epoch": 1.855614973262032, |
| "grad_norm": 0.6550764600527469, |
| "learning_rate": 3.678528930758834e-05, |
| "loss": 0.5594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3247641623020172, |
| "step": 1215, |
| "valid_targets_mean": 3556.6, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 1.8632543926661573, |
| "grad_norm": 0.7190327175451237, |
| "learning_rate": 3.674376792421081e-05, |
| "loss": 0.5401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3061503469944, |
| "step": 1220, |
| "valid_targets_mean": 2849.2, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 1.8708938120702827, |
| "grad_norm": 0.6887939667732077, |
| "learning_rate": 3.670200386083784e-05, |
| "loss": 0.5286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3267863392829895, |
| "step": 1225, |
| "valid_targets_mean": 3191.8, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 1.878533231474408, |
| "grad_norm": 0.6379586545313669, |
| "learning_rate": 3.665999772278736e-05, |
| "loss": 0.5662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39808523654937744, |
| "step": 1230, |
| "valid_targets_mean": 4236.0, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 1.8861726508785333, |
| "grad_norm": 0.6902444540079928, |
| "learning_rate": 3.661775011888584e-05, |
| "loss": 0.5345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24210360646247864, |
| "step": 1235, |
| "valid_targets_mean": 3590.6, |
| "valid_targets_min": 2191 |
| }, |
| { |
| "epoch": 1.8938120702826584, |
| "grad_norm": 0.6622678829508013, |
| "learning_rate": 3.657526166145952e-05, |
| "loss": 0.4882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25689786672592163, |
| "step": 1240, |
| "valid_targets_mean": 2681.5, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 1.9014514896867838, |
| "grad_norm": 0.6762001298834552, |
| "learning_rate": 3.65325329663255e-05, |
| "loss": 0.5019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23240089416503906, |
| "step": 1245, |
| "valid_targets_mean": 3059.0, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 1.9090909090909092, |
| "grad_norm": 0.7264235125054589, |
| "learning_rate": 3.648956465278284e-05, |
| "loss": 0.5196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22812113165855408, |
| "step": 1250, |
| "valid_targets_mean": 2430.2, |
| "valid_targets_min": 515 |
| }, |
| { |
| "epoch": 1.9167303284950343, |
| "grad_norm": 0.6846670975363754, |
| "learning_rate": 3.6446357343603536e-05, |
| "loss": 0.5425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2963109612464905, |
| "step": 1255, |
| "valid_targets_mean": 3483.8, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 1.9243697478991597, |
| "grad_norm": 0.727888807975606, |
| "learning_rate": 3.6402911665023565e-05, |
| "loss": 0.5057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29520994424819946, |
| "step": 1260, |
| "valid_targets_mean": 3465.0, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 1.9320091673032849, |
| "grad_norm": 0.6640837422377913, |
| "learning_rate": 3.6359228246733744e-05, |
| "loss": 0.5472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34408777952194214, |
| "step": 1265, |
| "valid_targets_mean": 4042.9, |
| "valid_targets_min": 1297 |
| }, |
| { |
| "epoch": 1.9396485867074102, |
| "grad_norm": 0.6476482043969682, |
| "learning_rate": 3.631530772187065e-05, |
| "loss": 0.5313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2760136127471924, |
| "step": 1270, |
| "valid_targets_mean": 3540.1, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 1.9472880061115356, |
| "grad_norm": 0.6467092573010441, |
| "learning_rate": 3.627115072700741e-05, |
| "loss": 0.4999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32210585474967957, |
| "step": 1275, |
| "valid_targets_mean": 3878.0, |
| "valid_targets_min": 1552 |
| }, |
| { |
| "epoch": 1.9549274255156608, |
| "grad_norm": 0.5803166137506185, |
| "learning_rate": 3.6226757902144495e-05, |
| "loss": 0.5491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33720919489860535, |
| "step": 1280, |
| "valid_targets_mean": 4619.9, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 1.962566844919786, |
| "grad_norm": 0.5328390011256504, |
| "learning_rate": 3.618212989070043e-05, |
| "loss": 0.513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18014609813690186, |
| "step": 1285, |
| "valid_targets_mean": 3435.1, |
| "valid_targets_min": 2096 |
| }, |
| { |
| "epoch": 1.9702062643239113, |
| "grad_norm": 0.6854626615968217, |
| "learning_rate": 3.613726733950248e-05, |
| "loss": 0.5191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34878984093666077, |
| "step": 1290, |
| "valid_targets_mean": 3824.2, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 1.9778456837280367, |
| "grad_norm": 0.5949832136294794, |
| "learning_rate": 3.609217089877728e-05, |
| "loss": 0.5531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1724492311477661, |
| "step": 1295, |
| "valid_targets_mean": 2781.6, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 1.985485103132162, |
| "grad_norm": 0.8455545653427853, |
| "learning_rate": 3.604684122214138e-05, |
| "loss": 0.5478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2157420665025711, |
| "step": 1300, |
| "valid_targets_mean": 1768.0, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 1.9931245225362872, |
| "grad_norm": 0.6959760784864205, |
| "learning_rate": 3.600127896659181e-05, |
| "loss": 0.5442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2532881200313568, |
| "step": 1305, |
| "valid_targets_mean": 2938.0, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 2.0, |
| "grad_norm": 0.9358773564606009, |
| "learning_rate": 3.5955484792496536e-05, |
| "loss": 0.4938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5185206532478333, |
| "step": 1310, |
| "valid_targets_mean": 3101.2, |
| "valid_targets_min": 1261 |
| }, |
| { |
| "epoch": 2.0076394194041254, |
| "grad_norm": 0.5317421829410245, |
| "learning_rate": 3.5909459363584895e-05, |
| "loss": 0.4783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2319856882095337, |
| "step": 1315, |
| "valid_targets_mean": 4424.4, |
| "valid_targets_min": 1783 |
| }, |
| { |
| "epoch": 2.0152788388082508, |
| "grad_norm": 0.7259614209577792, |
| "learning_rate": 3.5863203346937974e-05, |
| "loss": 0.4646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2661840319633484, |
| "step": 1320, |
| "valid_targets_mean": 3145.4, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 2.0229182582123757, |
| "grad_norm": 0.6866135582932625, |
| "learning_rate": 3.5816717412978935e-05, |
| "loss": 0.4872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.274208664894104, |
| "step": 1325, |
| "valid_targets_mean": 4005.1, |
| "valid_targets_min": 1327 |
| }, |
| { |
| "epoch": 2.030557677616501, |
| "grad_norm": 0.6107569519174747, |
| "learning_rate": 3.577000223546331e-05, |
| "loss": 0.4855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2812064290046692, |
| "step": 1330, |
| "valid_targets_mean": 4395.8, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 2.0381970970206265, |
| "grad_norm": 0.5841200969185655, |
| "learning_rate": 3.5723058491469226e-05, |
| "loss": 0.4616, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18964403867721558, |
| "step": 1335, |
| "valid_targets_mean": 2951.0, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 2.045836516424752, |
| "grad_norm": 0.7731622386210697, |
| "learning_rate": 3.56758868613876e-05, |
| "loss": 0.5099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22586776316165924, |
| "step": 1340, |
| "valid_targets_mean": 2463.9, |
| "valid_targets_min": 455 |
| }, |
| { |
| "epoch": 2.053475935828877, |
| "grad_norm": 0.8201482091316316, |
| "learning_rate": 3.5628488028912284e-05, |
| "loss": 0.5191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2765929102897644, |
| "step": 1345, |
| "valid_targets_mean": 2273.8, |
| "valid_targets_min": 976 |
| }, |
| { |
| "epoch": 2.061115355233002, |
| "grad_norm": 0.7559956865117078, |
| "learning_rate": 3.558086268103011e-05, |
| "loss": 0.4767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2768942713737488, |
| "step": 1350, |
| "valid_targets_mean": 3333.4, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 2.0687547746371275, |
| "grad_norm": 0.7010684764079771, |
| "learning_rate": 3.5533011508011e-05, |
| "loss": 0.4833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20257258415222168, |
| "step": 1355, |
| "valid_targets_mean": 3312.2, |
| "valid_targets_min": 407 |
| }, |
| { |
| "epoch": 2.076394194041253, |
| "grad_norm": 0.660599060190917, |
| "learning_rate": 3.548493520339792e-05, |
| "loss": 0.5111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21439898014068604, |
| "step": 1360, |
| "valid_targets_mean": 2463.9, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 2.0840336134453783, |
| "grad_norm": 0.7722765277601109, |
| "learning_rate": 3.5436634463996834e-05, |
| "loss": 0.507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2662246823310852, |
| "step": 1365, |
| "valid_targets_mean": 2362.0, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 2.0916730328495032, |
| "grad_norm": 0.6657604945302164, |
| "learning_rate": 3.538810998986661e-05, |
| "loss": 0.5495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2910098731517792, |
| "step": 1370, |
| "valid_targets_mean": 3378.8, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 2.0993124522536286, |
| "grad_norm": 0.6146058220275632, |
| "learning_rate": 3.533936248430887e-05, |
| "loss": 0.5278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2327723503112793, |
| "step": 1375, |
| "valid_targets_mean": 3400.5, |
| "valid_targets_min": 1404 |
| }, |
| { |
| "epoch": 2.106951871657754, |
| "grad_norm": 0.6323389179006582, |
| "learning_rate": 3.52903926538578e-05, |
| "loss": 0.4977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18094557523727417, |
| "step": 1380, |
| "valid_targets_mean": 3219.0, |
| "valid_targets_min": 1275 |
| }, |
| { |
| "epoch": 2.1145912910618794, |
| "grad_norm": 0.6714237005424043, |
| "learning_rate": 3.524120120826991e-05, |
| "loss": 0.5114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.261186420917511, |
| "step": 1385, |
| "valid_targets_mean": 2986.6, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 2.1222307104660048, |
| "grad_norm": 0.7168232477241365, |
| "learning_rate": 3.519178886051374e-05, |
| "loss": 0.4868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24357938766479492, |
| "step": 1390, |
| "valid_targets_mean": 3561.8, |
| "valid_targets_min": 1220 |
| }, |
| { |
| "epoch": 2.1298701298701297, |
| "grad_norm": 0.7179444771168448, |
| "learning_rate": 3.514215632675953e-05, |
| "loss": 0.4773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2347637414932251, |
| "step": 1395, |
| "valid_targets_mean": 3083.2, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 2.137509549274255, |
| "grad_norm": 0.8502474110018483, |
| "learning_rate": 3.509230432636884e-05, |
| "loss": 0.5114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30212515592575073, |
| "step": 1400, |
| "valid_targets_mean": 2405.1, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 2.1451489686783805, |
| "grad_norm": 0.619094616956861, |
| "learning_rate": 3.504223358188414e-05, |
| "loss": 0.4978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3284362554550171, |
| "step": 1405, |
| "valid_targets_mean": 4827.5, |
| "valid_targets_min": 1327 |
| }, |
| { |
| "epoch": 2.152788388082506, |
| "grad_norm": 0.7128343442681825, |
| "learning_rate": 3.4991944819018295e-05, |
| "loss": 0.4943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23888735473155975, |
| "step": 1410, |
| "valid_targets_mean": 3042.6, |
| "valid_targets_min": 1196 |
| }, |
| { |
| "epoch": 2.160427807486631, |
| "grad_norm": 0.5834794683505667, |
| "learning_rate": 3.4941438766644094e-05, |
| "loss": 0.4697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22566252946853638, |
| "step": 1415, |
| "valid_targets_mean": 4167.9, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 2.168067226890756, |
| "grad_norm": 0.5505262571807923, |
| "learning_rate": 3.489071615678366e-05, |
| "loss": 0.4957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29685625433921814, |
| "step": 1420, |
| "valid_targets_mean": 5135.1, |
| "valid_targets_min": 1375 |
| }, |
| { |
| "epoch": 2.1757066462948815, |
| "grad_norm": 0.6704037109861748, |
| "learning_rate": 3.483977772459786e-05, |
| "loss": 0.4863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3806396424770355, |
| "step": 1425, |
| "valid_targets_mean": 4908.2, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 2.183346065699007, |
| "grad_norm": 0.6015955329730339, |
| "learning_rate": 3.478862420837561e-05, |
| "loss": 0.4905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22024193406105042, |
| "step": 1430, |
| "valid_targets_mean": 3537.0, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 2.1909854851031323, |
| "grad_norm": 0.8149409610415594, |
| "learning_rate": 3.473725634952321e-05, |
| "loss": 0.5062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24890246987342834, |
| "step": 1435, |
| "valid_targets_mean": 2094.8, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 2.1986249045072572, |
| "grad_norm": 0.729224011887746, |
| "learning_rate": 3.4685674892553604e-05, |
| "loss": 0.4551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2595076262950897, |
| "step": 1440, |
| "valid_targets_mean": 3288.8, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 2.2062643239113826, |
| "grad_norm": 0.6441248015278864, |
| "learning_rate": 3.463388058507556e-05, |
| "loss": 0.4455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1921394020318985, |
| "step": 1445, |
| "valid_targets_mean": 2419.9, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 2.213903743315508, |
| "grad_norm": 0.6762838196132268, |
| "learning_rate": 3.458187417778284e-05, |
| "loss": 0.4922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27211958169937134, |
| "step": 1450, |
| "valid_targets_mean": 3996.0, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 2.2215431627196334, |
| "grad_norm": 0.6261428817660788, |
| "learning_rate": 3.452965642444334e-05, |
| "loss": 0.4853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1550438106060028, |
| "step": 1455, |
| "valid_targets_mean": 2566.4, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 2.2291825821237587, |
| "grad_norm": 0.7408606958154191, |
| "learning_rate": 3.447722808188816e-05, |
| "loss": 0.4831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18380820751190186, |
| "step": 1460, |
| "valid_targets_mean": 2003.5, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 2.2368220015278837, |
| "grad_norm": 0.7861802803128333, |
| "learning_rate": 3.442458991000062e-05, |
| "loss": 0.5236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2023487538099289, |
| "step": 1465, |
| "valid_targets_mean": 1830.8, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 2.244461420932009, |
| "grad_norm": 0.7124589412998297, |
| "learning_rate": 3.437174267170524e-05, |
| "loss": 0.5182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2585378885269165, |
| "step": 1470, |
| "valid_targets_mean": 2549.2, |
| "valid_targets_min": 438 |
| }, |
| { |
| "epoch": 2.2521008403361344, |
| "grad_norm": 0.6812098409271231, |
| "learning_rate": 3.4318687132956714e-05, |
| "loss": 0.4896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2898828387260437, |
| "step": 1475, |
| "valid_targets_mean": 4216.2, |
| "valid_targets_min": 1290 |
| }, |
| { |
| "epoch": 2.25974025974026, |
| "grad_norm": 0.7132327272659739, |
| "learning_rate": 3.426542406272879e-05, |
| "loss": 0.4805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22709037363529205, |
| "step": 1480, |
| "valid_targets_mean": 2697.4, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 2.267379679144385, |
| "grad_norm": 0.7185720305215236, |
| "learning_rate": 3.4211954233003115e-05, |
| "loss": 0.5131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2051008939743042, |
| "step": 1485, |
| "valid_targets_mean": 2768.2, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 2.27501909854851, |
| "grad_norm": 0.7435166801422771, |
| "learning_rate": 3.415827841875807e-05, |
| "loss": 0.4764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28377318382263184, |
| "step": 1490, |
| "valid_targets_mean": 3350.2, |
| "valid_targets_min": 1131 |
| }, |
| { |
| "epoch": 2.2826585179526355, |
| "grad_norm": 0.6818694893959436, |
| "learning_rate": 3.4104397397957495e-05, |
| "loss": 0.5384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2481977641582489, |
| "step": 1495, |
| "valid_targets_mean": 3382.8, |
| "valid_targets_min": 1961 |
| }, |
| { |
| "epoch": 2.290297937356761, |
| "grad_norm": 0.6664430457664224, |
| "learning_rate": 3.405031195153949e-05, |
| "loss": 0.4798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2219395637512207, |
| "step": 1500, |
| "valid_targets_mean": 2843.5, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 2.2979373567608863, |
| "grad_norm": 0.52820138423304, |
| "learning_rate": 3.399602286340503e-05, |
| "loss": 0.4687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22768482565879822, |
| "step": 1505, |
| "valid_targets_mean": 5526.1, |
| "valid_targets_min": 1584 |
| }, |
| { |
| "epoch": 2.3055767761650117, |
| "grad_norm": 0.7120542733941014, |
| "learning_rate": 3.394153092040658e-05, |
| "loss": 0.5092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29083842039108276, |
| "step": 1510, |
| "valid_targets_mean": 3225.1, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 2.3132161955691366, |
| "grad_norm": 0.6870040097106018, |
| "learning_rate": 3.3886836912336796e-05, |
| "loss": 0.5131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23260729014873505, |
| "step": 1515, |
| "valid_targets_mean": 2770.1, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 2.320855614973262, |
| "grad_norm": 0.7055648665859806, |
| "learning_rate": 3.383194163191698e-05, |
| "loss": 0.475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26753556728363037, |
| "step": 1520, |
| "valid_targets_mean": 3388.2, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 2.3284950343773874, |
| "grad_norm": 0.7916496584586002, |
| "learning_rate": 3.3776845874785624e-05, |
| "loss": 0.5013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2454243004322052, |
| "step": 1525, |
| "valid_targets_mean": 2547.4, |
| "valid_targets_min": 1427 |
| }, |
| { |
| "epoch": 2.3361344537815127, |
| "grad_norm": 0.7908259705075075, |
| "learning_rate": 3.37215504394869e-05, |
| "loss": 0.4798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2940301299095154, |
| "step": 1530, |
| "valid_targets_mean": 3533.6, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 2.343773873185638, |
| "grad_norm": 0.6546979140910963, |
| "learning_rate": 3.366605612745906e-05, |
| "loss": 0.4925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26727956533432007, |
| "step": 1535, |
| "valid_targets_mean": 3162.8, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 2.351413292589763, |
| "grad_norm": 0.6783177043359304, |
| "learning_rate": 3.3610363743022795e-05, |
| "loss": 0.4864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21130970120429993, |
| "step": 1540, |
| "valid_targets_mean": 3205.9, |
| "valid_targets_min": 1889 |
| }, |
| { |
| "epoch": 2.3590527119938884, |
| "grad_norm": 0.6555047268489784, |
| "learning_rate": 3.3554474093369656e-05, |
| "loss": 0.5, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31021979451179504, |
| "step": 1545, |
| "valid_targets_mean": 3555.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 2.366692131398014, |
| "grad_norm": 0.7305711433653311, |
| "learning_rate": 3.349838798855027e-05, |
| "loss": 0.5091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.331775963306427, |
| "step": 1550, |
| "valid_targets_mean": 3734.6, |
| "valid_targets_min": 411 |
| }, |
| { |
| "epoch": 2.374331550802139, |
| "grad_norm": 0.559575508819546, |
| "learning_rate": 3.3442106241462645e-05, |
| "loss": 0.4559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19253335893154144, |
| "step": 1555, |
| "valid_targets_mean": 2387.5, |
| "valid_targets_min": 688 |
| }, |
| { |
| "epoch": 2.381970970206264, |
| "grad_norm": 0.7849640314141061, |
| "learning_rate": 3.338562966784038e-05, |
| "loss": 0.5004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22845134139060974, |
| "step": 1560, |
| "valid_targets_mean": 2045.8, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 2.3896103896103895, |
| "grad_norm": 0.8097550048727009, |
| "learning_rate": 3.3328959086240876e-05, |
| "loss": 0.494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21622112393379211, |
| "step": 1565, |
| "valid_targets_mean": 2250.2, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 2.397249809014515, |
| "grad_norm": 0.6803709574881871, |
| "learning_rate": 3.3272095318033376e-05, |
| "loss": 0.519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2511165738105774, |
| "step": 1570, |
| "valid_targets_mean": 2622.2, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 2.4048892284186403, |
| "grad_norm": 0.6712742285853818, |
| "learning_rate": 3.321503918738716e-05, |
| "loss": 0.4903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16048851609230042, |
| "step": 1575, |
| "valid_targets_mean": 2250.4, |
| "valid_targets_min": 1503 |
| }, |
| { |
| "epoch": 2.4125286478227657, |
| "grad_norm": 0.677457396605636, |
| "learning_rate": 3.315779152125955e-05, |
| "loss": 0.4936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17943637073040009, |
| "step": 1580, |
| "valid_targets_mean": 1933.6, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 2.4201680672268906, |
| "grad_norm": 0.5901481064339373, |
| "learning_rate": 3.310035314938394e-05, |
| "loss": 0.4993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22970394790172577, |
| "step": 1585, |
| "valid_targets_mean": 3705.9, |
| "valid_targets_min": 1259 |
| }, |
| { |
| "epoch": 2.427807486631016, |
| "grad_norm": 0.5963861967566215, |
| "learning_rate": 3.304272490425777e-05, |
| "loss": 0.4882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2982090711593628, |
| "step": 1590, |
| "valid_targets_mean": 5054.9, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 2.4354469060351414, |
| "grad_norm": 0.7130398946256007, |
| "learning_rate": 3.2984907621130435e-05, |
| "loss": 0.5389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35128599405288696, |
| "step": 1595, |
| "valid_targets_mean": 3656.8, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 2.4430863254392667, |
| "grad_norm": 0.6176299158495442, |
| "learning_rate": 3.292690213799122e-05, |
| "loss": 0.5318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24622666835784912, |
| "step": 1600, |
| "valid_targets_mean": 3358.4, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 2.4507257448433917, |
| "grad_norm": 0.5981587869828613, |
| "learning_rate": 3.286870929555713e-05, |
| "loss": 0.5288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2027554214000702, |
| "step": 1605, |
| "valid_targets_mean": 3590.0, |
| "valid_targets_min": 1349 |
| }, |
| { |
| "epoch": 2.458365164247517, |
| "grad_norm": 0.5744990440096281, |
| "learning_rate": 3.281032993726071e-05, |
| "loss": 0.4947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1916375458240509, |
| "step": 1610, |
| "valid_targets_mean": 3543.8, |
| "valid_targets_min": 1484 |
| }, |
| { |
| "epoch": 2.4660045836516424, |
| "grad_norm": 0.7430996004414889, |
| "learning_rate": 3.275176490923781e-05, |
| "loss": 0.4733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26889270544052124, |
| "step": 1615, |
| "valid_targets_mean": 3089.4, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 2.473644003055768, |
| "grad_norm": 0.7037506079471908, |
| "learning_rate": 3.269301506031534e-05, |
| "loss": 0.4731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25602343678474426, |
| "step": 1620, |
| "valid_targets_mean": 2495.0, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 2.481283422459893, |
| "grad_norm": 0.5842797711033675, |
| "learning_rate": 3.2634081241998954e-05, |
| "loss": 0.5177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2861538231372833, |
| "step": 1625, |
| "valid_targets_mean": 5589.2, |
| "valid_targets_min": 2931 |
| }, |
| { |
| "epoch": 2.488922841864018, |
| "grad_norm": 0.7575350211022752, |
| "learning_rate": 3.257496430846071e-05, |
| "loss": 0.525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2269067019224167, |
| "step": 1630, |
| "valid_targets_mean": 2871.0, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 2.4965622612681435, |
| "grad_norm": 0.6181133672275352, |
| "learning_rate": 3.251566511652669e-05, |
| "loss": 0.4685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24582752585411072, |
| "step": 1635, |
| "valid_targets_mean": 3053.4, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 2.504201680672269, |
| "grad_norm": 0.64742145917169, |
| "learning_rate": 3.245618452566461e-05, |
| "loss": 0.4816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3426717519760132, |
| "step": 1640, |
| "valid_targets_mean": 4025.6, |
| "valid_targets_min": 1175 |
| }, |
| { |
| "epoch": 2.5118411000763943, |
| "grad_norm": 0.6635442839695538, |
| "learning_rate": 3.23965233979713e-05, |
| "loss": 0.5, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17027682065963745, |
| "step": 1645, |
| "valid_targets_mean": 2165.4, |
| "valid_targets_min": 1113 |
| }, |
| { |
| "epoch": 2.5194805194805197, |
| "grad_norm": 0.5660316698532355, |
| "learning_rate": 3.233668259816026e-05, |
| "loss": 0.5077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22779259085655212, |
| "step": 1650, |
| "valid_targets_mean": 4539.5, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 2.5271199388846446, |
| "grad_norm": 0.6224770591422036, |
| "learning_rate": 3.227666299354912e-05, |
| "loss": 0.5, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22263994812965393, |
| "step": 1655, |
| "valid_targets_mean": 3727.9, |
| "valid_targets_min": 1163 |
| }, |
| { |
| "epoch": 2.53475935828877, |
| "grad_norm": 0.6907752213015932, |
| "learning_rate": 3.221646545404706e-05, |
| "loss": 0.506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3159465193748474, |
| "step": 1660, |
| "valid_targets_mean": 4150.0, |
| "valid_targets_min": 1808 |
| }, |
| { |
| "epoch": 2.5423987776928954, |
| "grad_norm": 0.7191273755219711, |
| "learning_rate": 3.21560908521422e-05, |
| "loss": 0.4704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25996077060699463, |
| "step": 1665, |
| "valid_targets_mean": 2863.5, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 2.5500381970970207, |
| "grad_norm": 0.680261011638979, |
| "learning_rate": 3.209554006288895e-05, |
| "loss": 0.4741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3104439377784729, |
| "step": 1670, |
| "valid_targets_mean": 4482.5, |
| "valid_targets_min": 1247 |
| }, |
| { |
| "epoch": 2.557677616501146, |
| "grad_norm": 0.6432998240930168, |
| "learning_rate": 3.203481396389535e-05, |
| "loss": 0.5118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2836974263191223, |
| "step": 1675, |
| "valid_targets_mean": 3161.0, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 2.565317035905271, |
| "grad_norm": 0.6448940137147883, |
| "learning_rate": 3.1973913435310335e-05, |
| "loss": 0.4825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20341014862060547, |
| "step": 1680, |
| "valid_targets_mean": 2595.0, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 2.5729564553093964, |
| "grad_norm": 0.6826751568198045, |
| "learning_rate": 3.1912839359810974e-05, |
| "loss": 0.5003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23161211609840393, |
| "step": 1685, |
| "valid_targets_mean": 2430.1, |
| "valid_targets_min": 1225 |
| }, |
| { |
| "epoch": 2.580595874713522, |
| "grad_norm": 0.704783143383557, |
| "learning_rate": 3.185159262258967e-05, |
| "loss": 0.4805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29678064584732056, |
| "step": 1690, |
| "valid_targets_mean": 3600.0, |
| "valid_targets_min": 1446 |
| }, |
| { |
| "epoch": 2.588235294117647, |
| "grad_norm": 0.5753956792109161, |
| "learning_rate": 3.179017411134137e-05, |
| "loss": 0.4918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.268524706363678, |
| "step": 1695, |
| "valid_targets_mean": 4652.6, |
| "valid_targets_min": 1717 |
| }, |
| { |
| "epoch": 2.5958747135217726, |
| "grad_norm": 0.7042435298107268, |
| "learning_rate": 3.172858471625065e-05, |
| "loss": 0.4995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21800410747528076, |
| "step": 1700, |
| "valid_targets_mean": 2551.8, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 2.6035141329258975, |
| "grad_norm": 0.6748037272112359, |
| "learning_rate": 3.166682532997883e-05, |
| "loss": 0.4978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30926668643951416, |
| "step": 1705, |
| "valid_targets_mean": 4062.9, |
| "valid_targets_min": 1157 |
| }, |
| { |
| "epoch": 2.611153552330023, |
| "grad_norm": 0.6581058243085496, |
| "learning_rate": 3.160489684765105e-05, |
| "loss": 0.4732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15238752961158752, |
| "step": 1710, |
| "valid_targets_mean": 2951.8, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 2.6187929717341483, |
| "grad_norm": 0.5961485901668413, |
| "learning_rate": 3.154280016684329e-05, |
| "loss": 0.4727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28147566318511963, |
| "step": 1715, |
| "valid_targets_mean": 4090.0, |
| "valid_targets_min": 1696 |
| }, |
| { |
| "epoch": 2.6264323911382736, |
| "grad_norm": 0.6635627417191078, |
| "learning_rate": 3.148053618756936e-05, |
| "loss": 0.4939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27265307307243347, |
| "step": 1720, |
| "valid_targets_mean": 3721.9, |
| "valid_targets_min": 1634 |
| }, |
| { |
| "epoch": 2.634071810542399, |
| "grad_norm": 0.7282926360608749, |
| "learning_rate": 3.141810581226782e-05, |
| "loss": 0.4862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.312755286693573, |
| "step": 1725, |
| "valid_targets_mean": 3535.2, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 2.641711229946524, |
| "grad_norm": 0.6956213326065784, |
| "learning_rate": 3.135550994578897e-05, |
| "loss": 0.4809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2344173789024353, |
| "step": 1730, |
| "valid_targets_mean": 3056.6, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 2.6493506493506493, |
| "grad_norm": 0.6031654478325641, |
| "learning_rate": 3.129274949538169e-05, |
| "loss": 0.5099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2556261122226715, |
| "step": 1735, |
| "valid_targets_mean": 3144.1, |
| "valid_targets_min": 1791 |
| }, |
| { |
| "epoch": 2.6569900687547747, |
| "grad_norm": 0.6706862876679621, |
| "learning_rate": 3.122982537068028e-05, |
| "loss": 0.4703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28426307439804077, |
| "step": 1740, |
| "valid_targets_mean": 4114.6, |
| "valid_targets_min": 1840 |
| }, |
| { |
| "epoch": 2.6646294881588997, |
| "grad_norm": 0.6346741898139652, |
| "learning_rate": 3.1166738483691305e-05, |
| "loss": 0.4571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2778932452201843, |
| "step": 1745, |
| "valid_targets_mean": 4111.8, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 2.6722689075630255, |
| "grad_norm": 0.8266245480740433, |
| "learning_rate": 3.110348974878038e-05, |
| "loss": 0.4965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2906370162963867, |
| "step": 1750, |
| "valid_targets_mean": 2386.2, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 2.6799083269671504, |
| "grad_norm": 0.6638752682144674, |
| "learning_rate": 3.104008008265888e-05, |
| "loss": 0.4863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27586424350738525, |
| "step": 1755, |
| "valid_targets_mean": 3002.8, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 2.687547746371276, |
| "grad_norm": 0.5942821754327564, |
| "learning_rate": 3.09765104043707e-05, |
| "loss": 0.4809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20257282257080078, |
| "step": 1760, |
| "valid_targets_mean": 3590.9, |
| "valid_targets_min": 1851 |
| }, |
| { |
| "epoch": 2.695187165775401, |
| "grad_norm": 0.5927687488678979, |
| "learning_rate": 3.0912781635278886e-05, |
| "loss": 0.4641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1888626366853714, |
| "step": 1765, |
| "valid_targets_mean": 3535.0, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 2.702826585179526, |
| "grad_norm": 0.7947503911879893, |
| "learning_rate": 3.0848894699052326e-05, |
| "loss": 0.507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21330304443836212, |
| "step": 1770, |
| "valid_targets_mean": 3395.4, |
| "valid_targets_min": 1866 |
| }, |
| { |
| "epoch": 2.7104660045836515, |
| "grad_norm": 0.5926029230343366, |
| "learning_rate": 3.0784850521652336e-05, |
| "loss": 0.4636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1835680454969406, |
| "step": 1775, |
| "valid_targets_mean": 3637.9, |
| "valid_targets_min": 833 |
| }, |
| { |
| "epoch": 2.718105423987777, |
| "grad_norm": 0.6649422002748281, |
| "learning_rate": 3.072065003131925e-05, |
| "loss": 0.4696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3594931364059448, |
| "step": 1780, |
| "valid_targets_mean": 3790.4, |
| "valid_targets_min": 2012 |
| }, |
| { |
| "epoch": 2.7257448433919023, |
| "grad_norm": 0.9506459102901791, |
| "learning_rate": 3.0656294158558954e-05, |
| "loss": 0.5542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2790099084377289, |
| "step": 1785, |
| "valid_targets_mean": 3921.5, |
| "valid_targets_min": 2246 |
| }, |
| { |
| "epoch": 2.7333842627960276, |
| "grad_norm": 0.7082670183686091, |
| "learning_rate": 3.059178383612941e-05, |
| "loss": 0.4799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25146788358688354, |
| "step": 1790, |
| "valid_targets_mean": 2553.1, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 2.7410236822001526, |
| "grad_norm": 0.706151992610167, |
| "learning_rate": 3.052711999902715e-05, |
| "loss": 0.477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32185858488082886, |
| "step": 1795, |
| "valid_targets_mean": 3541.9, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 2.748663101604278, |
| "grad_norm": 0.6419423098815215, |
| "learning_rate": 3.0462303584473692e-05, |
| "loss": 0.5119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.327781081199646, |
| "step": 1800, |
| "valid_targets_mean": 4346.9, |
| "valid_targets_min": 2177 |
| }, |
| { |
| "epoch": 2.7563025210084033, |
| "grad_norm": 0.8570229225472685, |
| "learning_rate": 3.039733553190198e-05, |
| "loss": 0.4682, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14253611862659454, |
| "step": 1805, |
| "valid_targets_mean": 1997.4, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 2.7639419404125287, |
| "grad_norm": 0.7558810429065274, |
| "learning_rate": 3.0332216782942763e-05, |
| "loss": 0.4915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2567565441131592, |
| "step": 1810, |
| "valid_targets_mean": 2702.4, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 2.771581359816654, |
| "grad_norm": 0.5963411952289389, |
| "learning_rate": 3.0266948281410943e-05, |
| "loss": 0.4823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1956261396408081, |
| "step": 1815, |
| "valid_targets_mean": 3508.9, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 2.779220779220779, |
| "grad_norm": 0.6388646518127971, |
| "learning_rate": 3.020153097329189e-05, |
| "loss": 0.4715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21967804431915283, |
| "step": 1820, |
| "valid_targets_mean": 3618.1, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 2.7868601986249044, |
| "grad_norm": 0.6146109467059201, |
| "learning_rate": 3.013596580672777e-05, |
| "loss": 0.4841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20610034465789795, |
| "step": 1825, |
| "valid_targets_mean": 3072.5, |
| "valid_targets_min": 1280 |
| }, |
| { |
| "epoch": 2.79449961802903, |
| "grad_norm": 0.8220069533572829, |
| "learning_rate": 3.0070253732003736e-05, |
| "loss": 0.5067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.287387490272522, |
| "step": 1830, |
| "valid_targets_mean": 2372.0, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 2.802139037433155, |
| "grad_norm": 0.6060216832677047, |
| "learning_rate": 3.0004395701534208e-05, |
| "loss": 0.5046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1976098269224167, |
| "step": 1835, |
| "valid_targets_mean": 3524.0, |
| "valid_targets_min": 1211 |
| }, |
| { |
| "epoch": 2.8097784568372806, |
| "grad_norm": 0.6533429306985723, |
| "learning_rate": 2.9938392669849053e-05, |
| "loss": 0.4447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26395583152770996, |
| "step": 1840, |
| "valid_targets_mean": 3673.1, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 2.8174178762414055, |
| "grad_norm": 0.7125496744028057, |
| "learning_rate": 2.9872245593579752e-05, |
| "loss": 0.494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25991716980934143, |
| "step": 1845, |
| "valid_targets_mean": 2532.6, |
| "valid_targets_min": 1158 |
| }, |
| { |
| "epoch": 2.825057295645531, |
| "grad_norm": 0.6313460986453029, |
| "learning_rate": 2.9805955431445514e-05, |
| "loss": 0.4549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2249601185321808, |
| "step": 1850, |
| "valid_targets_mean": 4385.2, |
| "valid_targets_min": 1337 |
| }, |
| { |
| "epoch": 2.8326967150496563, |
| "grad_norm": 0.6358505528090321, |
| "learning_rate": 2.973952314423943e-05, |
| "loss": 0.4566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28464820981025696, |
| "step": 1855, |
| "valid_targets_mean": 4168.4, |
| "valid_targets_min": 1499 |
| }, |
| { |
| "epoch": 2.8403361344537816, |
| "grad_norm": 0.7230163206181031, |
| "learning_rate": 2.9672949694814485e-05, |
| "loss": 0.4829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24439480900764465, |
| "step": 1860, |
| "valid_targets_mean": 2667.0, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 2.847975553857907, |
| "grad_norm": 0.6704723628046145, |
| "learning_rate": 2.9606236048069655e-05, |
| "loss": 0.5093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18326005339622498, |
| "step": 1865, |
| "valid_targets_mean": 2370.1, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 2.855614973262032, |
| "grad_norm": 0.6270630791742493, |
| "learning_rate": 2.9539383170935888e-05, |
| "loss": 0.5206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20464631915092468, |
| "step": 1870, |
| "valid_targets_mean": 2579.9, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 2.8632543926661573, |
| "grad_norm": 0.6911077958995703, |
| "learning_rate": 2.9472392032362118e-05, |
| "loss": 0.5005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27718856930732727, |
| "step": 1875, |
| "valid_targets_mean": 3162.6, |
| "valid_targets_min": 1687 |
| }, |
| { |
| "epoch": 2.8708938120702827, |
| "grad_norm": 0.6414965035160827, |
| "learning_rate": 2.9405263603301185e-05, |
| "loss": 0.5001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2760189473628998, |
| "step": 1880, |
| "valid_targets_mean": 4009.4, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 2.878533231474408, |
| "grad_norm": 0.6551981321713435, |
| "learning_rate": 2.93379988566958e-05, |
| "loss": 0.4851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3242207169532776, |
| "step": 1885, |
| "valid_targets_mean": 4115.9, |
| "valid_targets_min": 1409 |
| }, |
| { |
| "epoch": 2.8861726508785335, |
| "grad_norm": 0.679402550463882, |
| "learning_rate": 2.9270598767464422e-05, |
| "loss": 0.4948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25107401609420776, |
| "step": 1890, |
| "valid_targets_mean": 3046.4, |
| "valid_targets_min": 1207 |
| }, |
| { |
| "epoch": 2.8938120702826584, |
| "grad_norm": 0.6390110048027222, |
| "learning_rate": 2.920306431248712e-05, |
| "loss": 0.5069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22953186929225922, |
| "step": 1895, |
| "valid_targets_mean": 3236.5, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 2.901451489686784, |
| "grad_norm": 0.6664644335329467, |
| "learning_rate": 2.9135396470591456e-05, |
| "loss": 0.4846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2379942238330841, |
| "step": 1900, |
| "valid_targets_mean": 2498.2, |
| "valid_targets_min": 1587 |
| }, |
| { |
| "epoch": 2.909090909090909, |
| "grad_norm": 0.7196033199681839, |
| "learning_rate": 2.9067596222538234e-05, |
| "loss": 0.5126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28052574396133423, |
| "step": 1905, |
| "valid_targets_mean": 3221.8, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 2.916730328495034, |
| "grad_norm": 0.7282565137655552, |
| "learning_rate": 2.8999664551007344e-05, |
| "loss": 0.5072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.298537015914917, |
| "step": 1910, |
| "valid_targets_mean": 2929.0, |
| "valid_targets_min": 1486 |
| }, |
| { |
| "epoch": 2.92436974789916, |
| "grad_norm": 0.6119949515081662, |
| "learning_rate": 2.8931602440583488e-05, |
| "loss": 0.505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22523435950279236, |
| "step": 1915, |
| "valid_targets_mean": 3136.1, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 2.932009167303285, |
| "grad_norm": 0.5399954941991891, |
| "learning_rate": 2.8863410877741906e-05, |
| "loss": 0.5075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24924825131893158, |
| "step": 1920, |
| "valid_targets_mean": 4078.1, |
| "valid_targets_min": 1382 |
| }, |
| { |
| "epoch": 2.9396485867074102, |
| "grad_norm": 0.6177014347831229, |
| "learning_rate": 2.8795090850834113e-05, |
| "loss": 0.5141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30639275908470154, |
| "step": 1925, |
| "valid_targets_mean": 4244.5, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 2.9472880061115356, |
| "grad_norm": 0.6346987774339923, |
| "learning_rate": 2.8726643350073528e-05, |
| "loss": 0.4939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30813929438591003, |
| "step": 1930, |
| "valid_targets_mean": 4161.6, |
| "valid_targets_min": 1781 |
| }, |
| { |
| "epoch": 2.9549274255156606, |
| "grad_norm": 0.5630616587425123, |
| "learning_rate": 2.865806936752115e-05, |
| "loss": 0.4925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20618033409118652, |
| "step": 1935, |
| "valid_targets_mean": 3727.6, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 2.962566844919786, |
| "grad_norm": 0.6042368887587112, |
| "learning_rate": 2.8589369897071174e-05, |
| "loss": 0.4893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3170982003211975, |
| "step": 1940, |
| "valid_targets_mean": 4726.5, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 2.9702062643239113, |
| "grad_norm": 0.7568286827833816, |
| "learning_rate": 2.8520545934436602e-05, |
| "loss": 0.5234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21794971823692322, |
| "step": 1945, |
| "valid_targets_mean": 2020.6, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 2.9778456837280367, |
| "grad_norm": 0.6106059417680693, |
| "learning_rate": 2.845159847713477e-05, |
| "loss": 0.4762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24992212653160095, |
| "step": 1950, |
| "valid_targets_mean": 3954.1, |
| "valid_targets_min": 1360 |
| }, |
| { |
| "epoch": 2.985485103132162, |
| "grad_norm": 0.5435572161508933, |
| "learning_rate": 2.8382528524472916e-05, |
| "loss": 0.479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23369833827018738, |
| "step": 1955, |
| "valid_targets_mean": 4845.0, |
| "valid_targets_min": 976 |
| }, |
| { |
| "epoch": 2.993124522536287, |
| "grad_norm": 0.6506312663229364, |
| "learning_rate": 2.831333707753372e-05, |
| "loss": 0.5213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3393819332122803, |
| "step": 1960, |
| "valid_targets_mean": 4771.0, |
| "valid_targets_min": 2823 |
| }, |
| { |
| "epoch": 3.0, |
| "grad_norm": 0.7542635576732258, |
| "learning_rate": 2.8244025139160745e-05, |
| "loss": 0.4668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.45052003860473633, |
| "step": 1965, |
| "valid_targets_mean": 4757.8, |
| "valid_targets_min": 1701 |
| }, |
| { |
| "epoch": 3.0076394194041254, |
| "grad_norm": 0.8520083341535113, |
| "learning_rate": 2.8174593713943933e-05, |
| "loss": 0.4627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.256170392036438, |
| "step": 1970, |
| "valid_targets_mean": 3575.5, |
| "valid_targets_min": 1617 |
| }, |
| { |
| "epoch": 3.0152788388082508, |
| "grad_norm": 0.6927471642692427, |
| "learning_rate": 2.8105043808205042e-05, |
| "loss": 0.4775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13694897294044495, |
| "step": 1975, |
| "valid_targets_mean": 2587.1, |
| "valid_targets_min": 1278 |
| }, |
| { |
| "epoch": 3.0229182582123757, |
| "grad_norm": 0.6552096347277138, |
| "learning_rate": 2.803537642998307e-05, |
| "loss": 0.4444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18564541637897491, |
| "step": 1980, |
| "valid_targets_mean": 2760.9, |
| "valid_targets_min": 1688 |
| }, |
| { |
| "epoch": 3.030557677616501, |
| "grad_norm": 0.7055118318105523, |
| "learning_rate": 2.79655925890196e-05, |
| "loss": 0.462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26022660732269287, |
| "step": 1985, |
| "valid_targets_mean": 3840.8, |
| "valid_targets_min": 1374 |
| }, |
| { |
| "epoch": 3.0381970970206265, |
| "grad_norm": 0.6819692775207933, |
| "learning_rate": 2.789569329674422e-05, |
| "loss": 0.4743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2793933153152466, |
| "step": 1990, |
| "valid_targets_mean": 3820.4, |
| "valid_targets_min": 2194 |
| }, |
| { |
| "epoch": 3.045836516424752, |
| "grad_norm": 0.6759014212454788, |
| "learning_rate": 2.7825679566259834e-05, |
| "loss": 0.4322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31307685375213623, |
| "step": 1995, |
| "valid_targets_mean": 4136.8, |
| "valid_targets_min": 1345 |
| }, |
| { |
| "epoch": 3.053475935828877, |
| "grad_norm": 0.7186371415409949, |
| "learning_rate": 2.7755552412327996e-05, |
| "loss": 0.5, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2766656279563904, |
| "step": 2000, |
| "valid_targets_mean": 3391.2, |
| "valid_targets_min": 976 |
| }, |
| { |
| "epoch": 3.061115355233002, |
| "grad_norm": 0.8200488852788307, |
| "learning_rate": 2.768531285135417e-05, |
| "loss": 0.433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21261753141880035, |
| "step": 2005, |
| "valid_targets_mean": 3123.6, |
| "valid_targets_min": 1113 |
| }, |
| { |
| "epoch": 3.0687547746371275, |
| "grad_norm": 0.7072416391028573, |
| "learning_rate": 2.7614961901373027e-05, |
| "loss": 0.446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2160511314868927, |
| "step": 2010, |
| "valid_targets_mean": 2450.9, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 3.076394194041253, |
| "grad_norm": 0.650830887467269, |
| "learning_rate": 2.7544500582033706e-05, |
| "loss": 0.4686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36730068922042847, |
| "step": 2015, |
| "valid_targets_mean": 4055.4, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 3.0840336134453783, |
| "grad_norm": 0.690349423058777, |
| "learning_rate": 2.7473929914584977e-05, |
| "loss": 0.4463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23585245013237, |
| "step": 2020, |
| "valid_targets_mean": 3368.2, |
| "valid_targets_min": 1710 |
| }, |
| { |
| "epoch": 3.0916730328495032, |
| "grad_norm": 0.650718819701116, |
| "learning_rate": 2.7403250921860497e-05, |
| "loss": 0.453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25358718633651733, |
| "step": 2025, |
| "valid_targets_mean": 4090.8, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 3.0993124522536286, |
| "grad_norm": 0.5963126945918865, |
| "learning_rate": 2.7332464628263945e-05, |
| "loss": 0.4718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22683659195899963, |
| "step": 2030, |
| "valid_targets_mean": 4324.2, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 3.106951871657754, |
| "grad_norm": 0.7170890890169099, |
| "learning_rate": 2.7261572059754217e-05, |
| "loss": 0.4698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21194159984588623, |
| "step": 2035, |
| "valid_targets_mean": 2557.9, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 3.1145912910618794, |
| "grad_norm": 0.6270816527342218, |
| "learning_rate": 2.7190574243830505e-05, |
| "loss": 0.4708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25633394718170166, |
| "step": 2040, |
| "valid_targets_mean": 4321.0, |
| "valid_targets_min": 1909 |
| }, |
| { |
| "epoch": 3.1222307104660048, |
| "grad_norm": 0.6768057541438881, |
| "learning_rate": 2.7119472209517442e-05, |
| "loss": 0.4434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14575080573558807, |
| "step": 2045, |
| "valid_targets_mean": 2207.1, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 3.1298701298701297, |
| "grad_norm": 0.6233377285938715, |
| "learning_rate": 2.7048266987350183e-05, |
| "loss": 0.4766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24185675382614136, |
| "step": 2050, |
| "valid_targets_mean": 3896.8, |
| "valid_targets_min": 1606 |
| }, |
| { |
| "epoch": 3.137509549274255, |
| "grad_norm": 0.8300155530398309, |
| "learning_rate": 2.6976959609359447e-05, |
| "loss": 0.4393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20969784259796143, |
| "step": 2055, |
| "valid_targets_mean": 2864.4, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 3.1451489686783805, |
| "grad_norm": 0.7022719532986335, |
| "learning_rate": 2.6905551109056598e-05, |
| "loss": 0.4505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17745709419250488, |
| "step": 2060, |
| "valid_targets_mean": 2705.0, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 3.152788388082506, |
| "grad_norm": 0.7176816603828999, |
| "learning_rate": 2.6834042521418604e-05, |
| "loss": 0.4618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27983376383781433, |
| "step": 2065, |
| "valid_targets_mean": 3271.4, |
| "valid_targets_min": 1878 |
| }, |
| { |
| "epoch": 3.160427807486631, |
| "grad_norm": 0.5748440814115998, |
| "learning_rate": 2.6762434882873116e-05, |
| "loss": 0.4114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23593346774578094, |
| "step": 2070, |
| "valid_targets_mean": 4988.9, |
| "valid_targets_min": 2159 |
| }, |
| { |
| "epoch": 3.168067226890756, |
| "grad_norm": 0.6550371187304824, |
| "learning_rate": 2.6690729231283374e-05, |
| "loss": 0.4752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21643373370170593, |
| "step": 2075, |
| "valid_targets_mean": 3548.8, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 3.1757066462948815, |
| "grad_norm": 0.7666764522952328, |
| "learning_rate": 2.66189266059332e-05, |
| "loss": 0.4793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32998839020729065, |
| "step": 2080, |
| "valid_targets_mean": 3029.2, |
| "valid_targets_min": 1459 |
| }, |
| { |
| "epoch": 3.183346065699007, |
| "grad_norm": 0.7500681322915863, |
| "learning_rate": 2.6547028047511943e-05, |
| "loss": 0.4558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17174682021141052, |
| "step": 2085, |
| "valid_targets_mean": 2901.1, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 3.1909854851031323, |
| "grad_norm": 0.7097897437767872, |
| "learning_rate": 2.6475034598099372e-05, |
| "loss": 0.4833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2244066298007965, |
| "step": 2090, |
| "valid_targets_mean": 3690.8, |
| "valid_targets_min": 1187 |
| }, |
| { |
| "epoch": 3.1986249045072572, |
| "grad_norm": 0.6152739239508643, |
| "learning_rate": 2.6402947301150583e-05, |
| "loss": 0.4655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2872171998023987, |
| "step": 2095, |
| "valid_targets_mean": 3874.6, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 3.2062643239113826, |
| "grad_norm": 0.6686147346154969, |
| "learning_rate": 2.6330767201480873e-05, |
| "loss": 0.4547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22372795641422272, |
| "step": 2100, |
| "valid_targets_mean": 3518.4, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 3.213903743315508, |
| "grad_norm": 0.6456365193151155, |
| "learning_rate": 2.62584953452506e-05, |
| "loss": 0.4367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21859055757522583, |
| "step": 2105, |
| "valid_targets_mean": 3339.4, |
| "valid_targets_min": 1347 |
| }, |
| { |
| "epoch": 3.2215431627196334, |
| "grad_norm": 0.7593984041165075, |
| "learning_rate": 2.6186132779950022e-05, |
| "loss": 0.4772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26761341094970703, |
| "step": 2110, |
| "valid_targets_mean": 2970.4, |
| "valid_targets_min": 1902 |
| }, |
| { |
| "epoch": 3.2291825821237587, |
| "grad_norm": 0.6501007799307098, |
| "learning_rate": 2.6113680554384107e-05, |
| "loss": 0.4602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2438923865556717, |
| "step": 2115, |
| "valid_targets_mean": 4634.4, |
| "valid_targets_min": 1688 |
| }, |
| { |
| "epoch": 3.2368220015278837, |
| "grad_norm": 0.5797241376930075, |
| "learning_rate": 2.604113971865734e-05, |
| "loss": 0.4383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31843867897987366, |
| "step": 2120, |
| "valid_targets_mean": 6170.1, |
| "valid_targets_min": 2066 |
| }, |
| { |
| "epoch": 3.244461420932009, |
| "grad_norm": 0.6842024873599893, |
| "learning_rate": 2.59685113241585e-05, |
| "loss": 0.463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35103440284729004, |
| "step": 2125, |
| "valid_targets_mean": 4209.1, |
| "valid_targets_min": 1380 |
| }, |
| { |
| "epoch": 3.2521008403361344, |
| "grad_norm": 0.752689560807153, |
| "learning_rate": 2.5895796423545418e-05, |
| "loss": 0.461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20140741765499115, |
| "step": 2130, |
| "valid_targets_mean": 2656.8, |
| "valid_targets_min": 1519 |
| }, |
| { |
| "epoch": 3.25974025974026, |
| "grad_norm": 0.6413068877083942, |
| "learning_rate": 2.5822996070729723e-05, |
| "loss": 0.4546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21095341444015503, |
| "step": 2135, |
| "valid_targets_mean": 3406.9, |
| "valid_targets_min": 1623 |
| }, |
| { |
| "epoch": 3.267379679144385, |
| "grad_norm": 0.6451875065112788, |
| "learning_rate": 2.575011132086157e-05, |
| "loss": 0.4528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25910890102386475, |
| "step": 2140, |
| "valid_targets_mean": 4925.0, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 3.27501909854851, |
| "grad_norm": 0.9084443226542351, |
| "learning_rate": 2.567714323031434e-05, |
| "loss": 0.4391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22554218769073486, |
| "step": 2145, |
| "valid_targets_mean": 1927.1, |
| "valid_targets_min": 1180 |
| }, |
| { |
| "epoch": 3.2826585179526355, |
| "grad_norm": 0.7610395813343054, |
| "learning_rate": 2.560409285666933e-05, |
| "loss": 0.4654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23040610551834106, |
| "step": 2150, |
| "valid_targets_mean": 3317.0, |
| "valid_targets_min": 1487 |
| }, |
| { |
| "epoch": 3.290297937356761, |
| "grad_norm": 0.6121775750148253, |
| "learning_rate": 2.5530961258700444e-05, |
| "loss": 0.4053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1965913474559784, |
| "step": 2155, |
| "valid_targets_mean": 3397.2, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 3.2979373567608863, |
| "grad_norm": 0.5434110974544242, |
| "learning_rate": 2.545774949635881e-05, |
| "loss": 0.4473, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12601837515830994, |
| "step": 2160, |
| "valid_targets_mean": 3408.4, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 3.3055767761650117, |
| "grad_norm": 0.6224547099221401, |
| "learning_rate": 2.5384458630757456e-05, |
| "loss": 0.459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25731584429740906, |
| "step": 2165, |
| "valid_targets_mean": 4671.9, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 3.3132161955691366, |
| "grad_norm": 0.6957316558389659, |
| "learning_rate": 2.5311089724155896e-05, |
| "loss": 0.4592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15687590837478638, |
| "step": 2170, |
| "valid_targets_mean": 2381.5, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 3.320855614973262, |
| "grad_norm": 0.6437378155332701, |
| "learning_rate": 2.5237643839944774e-05, |
| "loss": 0.4614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18906278908252716, |
| "step": 2175, |
| "valid_targets_mean": 3104.6, |
| "valid_targets_min": 1500 |
| }, |
| { |
| "epoch": 3.3284950343773874, |
| "grad_norm": 0.7374192641903924, |
| "learning_rate": 2.5164122042630405e-05, |
| "loss": 0.4579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20864637196063995, |
| "step": 2180, |
| "valid_targets_mean": 2575.0, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 3.3361344537815127, |
| "grad_norm": 0.6409476943750227, |
| "learning_rate": 2.509052539781937e-05, |
| "loss": 0.4325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2770101726055145, |
| "step": 2185, |
| "valid_targets_mean": 4118.1, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 3.343773873185638, |
| "grad_norm": 1.0079250001951137, |
| "learning_rate": 2.5016854972203094e-05, |
| "loss": 0.4945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20084837079048157, |
| "step": 2190, |
| "valid_targets_mean": 1417.4, |
| "valid_targets_min": 813 |
| }, |
| { |
| "epoch": 3.351413292589763, |
| "grad_norm": 0.8895234998263297, |
| "learning_rate": 2.4943111833542333e-05, |
| "loss": 0.4724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28576815128326416, |
| "step": 2195, |
| "valid_targets_mean": 2029.2, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 3.3590527119938884, |
| "grad_norm": 0.681661277197927, |
| "learning_rate": 2.4869297050651765e-05, |
| "loss": 0.4782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21255749464035034, |
| "step": 2200, |
| "valid_targets_mean": 3347.1, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 3.366692131398014, |
| "grad_norm": 0.6721290525161261, |
| "learning_rate": 2.479541169338442e-05, |
| "loss": 0.474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2670324742794037, |
| "step": 2205, |
| "valid_targets_mean": 3668.6, |
| "valid_targets_min": 1138 |
| }, |
| { |
| "epoch": 3.374331550802139, |
| "grad_norm": 0.7347531309138814, |
| "learning_rate": 2.4721456832616247e-05, |
| "loss": 0.5287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2706944942474365, |
| "step": 2210, |
| "valid_targets_mean": 2375.9, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 3.381970970206264, |
| "grad_norm": 0.6102358699138265, |
| "learning_rate": 2.4647433540230547e-05, |
| "loss": 0.4516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22291956841945648, |
| "step": 2215, |
| "valid_targets_mean": 4539.0, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 3.3896103896103895, |
| "grad_norm": 0.6827759823432588, |
| "learning_rate": 2.4573342889102443e-05, |
| "loss": 0.4694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1694415807723999, |
| "step": 2220, |
| "valid_targets_mean": 2403.1, |
| "valid_targets_min": 690 |
| }, |
| { |
| "epoch": 3.397249809014515, |
| "grad_norm": 0.6951348124592946, |
| "learning_rate": 2.4499185953083363e-05, |
| "loss": 0.4493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18465524911880493, |
| "step": 2225, |
| "valid_targets_mean": 2890.0, |
| "valid_targets_min": 1722 |
| }, |
| { |
| "epoch": 3.4048892284186403, |
| "grad_norm": 0.5973099924759062, |
| "learning_rate": 2.4424963806985432e-05, |
| "loss": 0.4948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22179313004016876, |
| "step": 2230, |
| "valid_targets_mean": 3594.6, |
| "valid_targets_min": 1134 |
| }, |
| { |
| "epoch": 3.4125286478227657, |
| "grad_norm": 0.750343525606607, |
| "learning_rate": 2.4350677526565934e-05, |
| "loss": 0.4442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3058930039405823, |
| "step": 2235, |
| "valid_targets_mean": 3820.2, |
| "valid_targets_min": 1639 |
| }, |
| { |
| "epoch": 3.4201680672268906, |
| "grad_norm": 0.8202808105318293, |
| "learning_rate": 2.427632818851166e-05, |
| "loss": 0.4853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28285735845565796, |
| "step": 2240, |
| "valid_targets_mean": 3445.6, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 3.427807486631016, |
| "grad_norm": 0.7045598247602469, |
| "learning_rate": 2.4201916870423393e-05, |
| "loss": 0.4965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17256322503089905, |
| "step": 2245, |
| "valid_targets_mean": 2347.6, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 3.4354469060351414, |
| "grad_norm": 0.7389047344210837, |
| "learning_rate": 2.4127444650800203e-05, |
| "loss": 0.4842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2350621223449707, |
| "step": 2250, |
| "valid_targets_mean": 2283.5, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 3.4430863254392667, |
| "grad_norm": 0.5995621961731215, |
| "learning_rate": 2.405291260902387e-05, |
| "loss": 0.4814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18150877952575684, |
| "step": 2255, |
| "valid_targets_mean": 3665.9, |
| "valid_targets_min": 1568 |
| }, |
| { |
| "epoch": 3.4507257448433917, |
| "grad_norm": 0.6681977273319017, |
| "learning_rate": 2.3978321825343206e-05, |
| "loss": 0.4655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22443902492523193, |
| "step": 2260, |
| "valid_targets_mean": 3334.6, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 3.458365164247517, |
| "grad_norm": 0.7011279817974063, |
| "learning_rate": 2.390367338085843e-05, |
| "loss": 0.4542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15961575508117676, |
| "step": 2265, |
| "valid_targets_mean": 1922.6, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 3.4660045836516424, |
| "grad_norm": 0.6225101653595909, |
| "learning_rate": 2.382896835750547e-05, |
| "loss": 0.4334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17323069274425507, |
| "step": 2270, |
| "valid_targets_mean": 3204.8, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 3.473644003055768, |
| "grad_norm": 0.7095294516028836, |
| "learning_rate": 2.3754207838040296e-05, |
| "loss": 0.4482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1739782691001892, |
| "step": 2275, |
| "valid_targets_mean": 2280.6, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 3.481283422459893, |
| "grad_norm": 0.6968490266068142, |
| "learning_rate": 2.367939290602324e-05, |
| "loss": 0.4817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17820501327514648, |
| "step": 2280, |
| "valid_targets_mean": 2033.0, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 3.488922841864018, |
| "grad_norm": 0.6648554409574585, |
| "learning_rate": 2.360452464580326e-05, |
| "loss": 0.4778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2294338345527649, |
| "step": 2285, |
| "valid_targets_mean": 3581.5, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 3.4965622612681435, |
| "grad_norm": 0.7430674337203963, |
| "learning_rate": 2.352960414250223e-05, |
| "loss": 0.4631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24158762395381927, |
| "step": 2290, |
| "valid_targets_mean": 2921.4, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 3.504201680672269, |
| "grad_norm": 0.7298796222195553, |
| "learning_rate": 2.345463248199925e-05, |
| "loss": 0.4822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23775427043437958, |
| "step": 2295, |
| "valid_targets_mean": 2701.9, |
| "valid_targets_min": 560 |
| }, |
| { |
| "epoch": 3.5118411000763943, |
| "grad_norm": 0.5806557240484798, |
| "learning_rate": 2.337961075091486e-05, |
| "loss": 0.4335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.221890389919281, |
| "step": 2300, |
| "valid_targets_mean": 4218.2, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 3.5194805194805197, |
| "grad_norm": 0.7571866275166863, |
| "learning_rate": 2.3304540036595313e-05, |
| "loss": 0.4776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2549300789833069, |
| "step": 2305, |
| "valid_targets_mean": 2839.0, |
| "valid_targets_min": 1288 |
| }, |
| { |
| "epoch": 3.5271199388846446, |
| "grad_norm": 0.5758410523457546, |
| "learning_rate": 2.322942142709682e-05, |
| "loss": 0.4637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26692140102386475, |
| "step": 2310, |
| "valid_targets_mean": 4998.4, |
| "valid_targets_min": 1708 |
| }, |
| { |
| "epoch": 3.53475935828877, |
| "grad_norm": 0.6878409192331846, |
| "learning_rate": 2.3154256011169758e-05, |
| "loss": 0.4551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17327441275119781, |
| "step": 2315, |
| "valid_targets_mean": 2440.4, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 3.5423987776928954, |
| "grad_norm": 0.6394586452229399, |
| "learning_rate": 2.3079044878242934e-05, |
| "loss": 0.4654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19388046860694885, |
| "step": 2320, |
| "valid_targets_mean": 3832.6, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 3.5500381970970207, |
| "grad_norm": 0.6385412390527023, |
| "learning_rate": 2.300378911840773e-05, |
| "loss": 0.439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21402673423290253, |
| "step": 2325, |
| "valid_targets_mean": 3548.6, |
| "valid_targets_min": 2209 |
| }, |
| { |
| "epoch": 3.557677616501146, |
| "grad_norm": 0.7468771536187816, |
| "learning_rate": 2.2928489822402363e-05, |
| "loss": 0.4712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27554431557655334, |
| "step": 2330, |
| "valid_targets_mean": 3242.6, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 3.565317035905271, |
| "grad_norm": 0.8019666864327368, |
| "learning_rate": 2.285314808159604e-05, |
| "loss": 0.4488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22434744238853455, |
| "step": 2335, |
| "valid_targets_mean": 2466.4, |
| "valid_targets_min": 1480 |
| }, |
| { |
| "epoch": 3.5729564553093964, |
| "grad_norm": 0.6877910040053126, |
| "learning_rate": 2.2777764987973167e-05, |
| "loss": 0.4621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2005833387374878, |
| "step": 2340, |
| "valid_targets_mean": 2540.5, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 3.580595874713522, |
| "grad_norm": 0.6611814458537609, |
| "learning_rate": 2.2702341634117487e-05, |
| "loss": 0.4665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27685844898223877, |
| "step": 2345, |
| "valid_targets_mean": 3624.1, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 3.588235294117647, |
| "grad_norm": 0.7269943364354757, |
| "learning_rate": 2.262687911319628e-05, |
| "loss": 0.4541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2215583324432373, |
| "step": 2350, |
| "valid_targets_mean": 3072.8, |
| "valid_targets_min": 1418 |
| }, |
| { |
| "epoch": 3.5958747135217726, |
| "grad_norm": 0.7803987380189772, |
| "learning_rate": 2.2551378518944505e-05, |
| "loss": 0.4519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18608278036117554, |
| "step": 2355, |
| "valid_targets_mean": 2090.5, |
| "valid_targets_min": 931 |
| }, |
| { |
| "epoch": 3.6035141329258975, |
| "grad_norm": 0.7800039264188372, |
| "learning_rate": 2.247584094564894e-05, |
| "loss": 0.4157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2047506868839264, |
| "step": 2360, |
| "valid_targets_mean": 2571.6, |
| "valid_targets_min": 1560 |
| }, |
| { |
| "epoch": 3.611153552330023, |
| "grad_norm": 0.7134902841112694, |
| "learning_rate": 2.240026748813232e-05, |
| "loss": 0.4754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2151254266500473, |
| "step": 2365, |
| "valid_targets_mean": 2401.8, |
| "valid_targets_min": 1298 |
| }, |
| { |
| "epoch": 3.6187929717341483, |
| "grad_norm": 0.7075951063514955, |
| "learning_rate": 2.2324659241737495e-05, |
| "loss": 0.4702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21446746587753296, |
| "step": 2370, |
| "valid_targets_mean": 2707.9, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 3.6264323911382736, |
| "grad_norm": 0.6949316016720868, |
| "learning_rate": 2.2249017302311527e-05, |
| "loss": 0.4511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18831145763397217, |
| "step": 2375, |
| "valid_targets_mean": 1897.2, |
| "valid_targets_min": 435 |
| }, |
| { |
| "epoch": 3.634071810542399, |
| "grad_norm": 0.629633789269152, |
| "learning_rate": 2.2173342766189803e-05, |
| "loss": 0.4597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25491413474082947, |
| "step": 2380, |
| "valid_targets_mean": 4428.2, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 3.641711229946524, |
| "grad_norm": 0.5838022402143164, |
| "learning_rate": 2.209763673018019e-05, |
| "loss": 0.4803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20996476709842682, |
| "step": 2385, |
| "valid_targets_mean": 3756.1, |
| "valid_targets_min": 1593 |
| }, |
| { |
| "epoch": 3.6493506493506493, |
| "grad_norm": 0.7815834244454084, |
| "learning_rate": 2.202190029154708e-05, |
| "loss": 0.4427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23983490467071533, |
| "step": 2390, |
| "valid_targets_mean": 2568.0, |
| "valid_targets_min": 1599 |
| }, |
| { |
| "epoch": 3.6569900687547747, |
| "grad_norm": 0.7150259118212184, |
| "learning_rate": 2.1946134547995524e-05, |
| "loss": 0.4577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22549794614315033, |
| "step": 2395, |
| "valid_targets_mean": 2506.2, |
| "valid_targets_min": 1096 |
| }, |
| { |
| "epoch": 3.6646294881588997, |
| "grad_norm": 0.6335828466810162, |
| "learning_rate": 2.1870340597655303e-05, |
| "loss": 0.4405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22980603575706482, |
| "step": 2400, |
| "valid_targets_mean": 3558.9, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 3.6722689075630255, |
| "grad_norm": 0.5764257422938297, |
| "learning_rate": 2.1794519539065037e-05, |
| "loss": 0.449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25543129444122314, |
| "step": 2405, |
| "valid_targets_mean": 4303.6, |
| "valid_targets_min": 1453 |
| }, |
| { |
| "epoch": 3.6799083269671504, |
| "grad_norm": 0.6545961859716691, |
| "learning_rate": 2.171867247115622e-05, |
| "loss": 0.4624, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21702466905117035, |
| "step": 2410, |
| "valid_targets_mean": 3388.0, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 3.687547746371276, |
| "grad_norm": 0.644534217804787, |
| "learning_rate": 2.1642800493237343e-05, |
| "loss": 0.4353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2263290137052536, |
| "step": 2415, |
| "valid_targets_mean": 3678.1, |
| "valid_targets_min": 1118 |
| }, |
| { |
| "epoch": 3.695187165775401, |
| "grad_norm": 0.6221388982483342, |
| "learning_rate": 2.1566904704977925e-05, |
| "loss": 0.4741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2882634401321411, |
| "step": 2420, |
| "valid_targets_mean": 4166.2, |
| "valid_targets_min": 1327 |
| }, |
| { |
| "epoch": 3.702826585179526, |
| "grad_norm": 0.6658830128145721, |
| "learning_rate": 2.1490986206392598e-05, |
| "loss": 0.4841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18079718947410583, |
| "step": 2425, |
| "valid_targets_mean": 2733.5, |
| "valid_targets_min": 1694 |
| }, |
| { |
| "epoch": 3.7104660045836515, |
| "grad_norm": 0.7140090226865587, |
| "learning_rate": 2.1415046097825126e-05, |
| "loss": 0.4792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1596052497625351, |
| "step": 2430, |
| "valid_targets_mean": 2203.0, |
| "valid_targets_min": 1246 |
| }, |
| { |
| "epoch": 3.718105423987777, |
| "grad_norm": 0.6683971640083712, |
| "learning_rate": 2.1339085479932503e-05, |
| "loss": 0.5025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2300308346748352, |
| "step": 2435, |
| "valid_targets_mean": 3503.5, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 3.7257448433919023, |
| "grad_norm": 0.7666648806984934, |
| "learning_rate": 2.1263105453668987e-05, |
| "loss": 0.4922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20825770497322083, |
| "step": 2440, |
| "valid_targets_mean": 2057.6, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 3.7333842627960276, |
| "grad_norm": 0.7095697789754806, |
| "learning_rate": 2.1187107120270115e-05, |
| "loss": 0.4759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2333410680294037, |
| "step": 2445, |
| "valid_targets_mean": 2544.0, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 3.7410236822001526, |
| "grad_norm": 0.7848497019198811, |
| "learning_rate": 2.1111091581236764e-05, |
| "loss": 0.453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23937958478927612, |
| "step": 2450, |
| "valid_targets_mean": 2462.8, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.748663101604278, |
| "grad_norm": 0.7309498905361822, |
| "learning_rate": 2.1035059938319212e-05, |
| "loss": 0.4407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18757390975952148, |
| "step": 2455, |
| "valid_targets_mean": 2259.8, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 3.7563025210084033, |
| "grad_norm": 0.6296154351875214, |
| "learning_rate": 2.0959013293501117e-05, |
| "loss": 0.4533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1372356116771698, |
| "step": 2460, |
| "valid_targets_mean": 2102.8, |
| "valid_targets_min": 877 |
| }, |
| { |
| "epoch": 3.7639419404125287, |
| "grad_norm": 0.6363160856990357, |
| "learning_rate": 2.0882952748983586e-05, |
| "loss": 0.4877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2305780053138733, |
| "step": 2465, |
| "valid_targets_mean": 3732.1, |
| "valid_targets_min": 1882 |
| }, |
| { |
| "epoch": 3.771581359816654, |
| "grad_norm": 0.7045522442945755, |
| "learning_rate": 2.080687940716916e-05, |
| "loss": 0.445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1693146526813507, |
| "step": 2470, |
| "valid_targets_mean": 2391.8, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 3.779220779220779, |
| "grad_norm": 0.8102188625701466, |
| "learning_rate": 2.0730794370645895e-05, |
| "loss": 0.4462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3031376004219055, |
| "step": 2475, |
| "valid_targets_mean": 4573.8, |
| "valid_targets_min": 1604 |
| }, |
| { |
| "epoch": 3.7868601986249044, |
| "grad_norm": 0.5563888204797931, |
| "learning_rate": 2.0654698742171324e-05, |
| "loss": 0.4215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1911643147468567, |
| "step": 2480, |
| "valid_targets_mean": 3630.9, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 3.79449961802903, |
| "grad_norm": 0.5959316920949063, |
| "learning_rate": 2.05785936246565e-05, |
| "loss": 0.4614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.191148579120636, |
| "step": 2485, |
| "valid_targets_mean": 3104.6, |
| "valid_targets_min": 581 |
| }, |
| { |
| "epoch": 3.802139037433155, |
| "grad_norm": 0.553521615537144, |
| "learning_rate": 2.050248012115001e-05, |
| "loss": 0.4291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17974773049354553, |
| "step": 2490, |
| "valid_targets_mean": 3192.0, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 3.8097784568372806, |
| "grad_norm": 0.6997963953790906, |
| "learning_rate": 2.0426359334822e-05, |
| "loss": 0.453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2714889943599701, |
| "step": 2495, |
| "valid_targets_mean": 3805.4, |
| "valid_targets_min": 1498 |
| }, |
| { |
| "epoch": 3.8174178762414055, |
| "grad_norm": 0.6771839343218619, |
| "learning_rate": 2.035023236894815e-05, |
| "loss": 0.4673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20033538341522217, |
| "step": 2500, |
| "valid_targets_mean": 3261.2, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 3.825057295645531, |
| "grad_norm": 0.6777326221424306, |
| "learning_rate": 2.0274100326893707e-05, |
| "loss": 0.4696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24825991690158844, |
| "step": 2505, |
| "valid_targets_mean": 3330.6, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 3.8326967150496563, |
| "grad_norm": 0.7787026130733954, |
| "learning_rate": 2.0197964312097506e-05, |
| "loss": 0.4553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1855577826499939, |
| "step": 2510, |
| "valid_targets_mean": 2357.2, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 3.8403361344537816, |
| "grad_norm": 0.6224254712363454, |
| "learning_rate": 2.012182542805595e-05, |
| "loss": 0.4693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21993130445480347, |
| "step": 2515, |
| "valid_targets_mean": 4545.5, |
| "valid_targets_min": 1754 |
| }, |
| { |
| "epoch": 3.847975553857907, |
| "grad_norm": 0.867489528747725, |
| "learning_rate": 2.004568477830703e-05, |
| "loss": 0.4698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23368635773658752, |
| "step": 2520, |
| "valid_targets_mean": 2934.0, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 3.855614973262032, |
| "grad_norm": 0.6239465544977696, |
| "learning_rate": 1.9969543466414322e-05, |
| "loss": 0.4457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2778353691101074, |
| "step": 2525, |
| "valid_targets_mean": 4597.9, |
| "valid_targets_min": 1207 |
| }, |
| { |
| "epoch": 3.8632543926661573, |
| "grad_norm": 0.8117178518330349, |
| "learning_rate": 1.989340259595102e-05, |
| "loss": 0.4726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33868181705474854, |
| "step": 2530, |
| "valid_targets_mean": 2752.0, |
| "valid_targets_min": 410 |
| }, |
| { |
| "epoch": 3.8708938120702827, |
| "grad_norm": 0.6934224395837933, |
| "learning_rate": 1.9817263270483905e-05, |
| "loss": 0.4556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20168477296829224, |
| "step": 2535, |
| "valid_targets_mean": 3182.5, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 3.878533231474408, |
| "grad_norm": 0.8264078961610266, |
| "learning_rate": 1.9741126593557353e-05, |
| "loss": 0.4348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26114290952682495, |
| "step": 2540, |
| "valid_targets_mean": 3085.1, |
| "valid_targets_min": 1204 |
| }, |
| { |
| "epoch": 3.8861726508785335, |
| "grad_norm": 0.5747399845624196, |
| "learning_rate": 1.9664993668677387e-05, |
| "loss": 0.4539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21519362926483154, |
| "step": 2545, |
| "valid_targets_mean": 4435.5, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 3.8938120702826584, |
| "grad_norm": 0.6078829505251382, |
| "learning_rate": 1.958886559929561e-05, |
| "loss": 0.4467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22459211945533752, |
| "step": 2550, |
| "valid_targets_mean": 3909.1, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 3.901451489686784, |
| "grad_norm": 0.6421094318252095, |
| "learning_rate": 1.9512743488793272e-05, |
| "loss": 0.4512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23274767398834229, |
| "step": 2555, |
| "valid_targets_mean": 3336.9, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 3.909090909090909, |
| "grad_norm": 0.6246019102739618, |
| "learning_rate": 1.9436628440465267e-05, |
| "loss": 0.4673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21863816678524017, |
| "step": 2560, |
| "valid_targets_mean": 2936.9, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 3.916730328495034, |
| "grad_norm": 0.6435846868106468, |
| "learning_rate": 1.9360521557504102e-05, |
| "loss": 0.435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21502043306827545, |
| "step": 2565, |
| "valid_targets_mean": 3620.2, |
| "valid_targets_min": 1533 |
| }, |
| { |
| "epoch": 3.92436974789916, |
| "grad_norm": 0.7828764498827379, |
| "learning_rate": 1.928442394298397e-05, |
| "loss": 0.4702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1875026375055313, |
| "step": 2570, |
| "valid_targets_mean": 1726.6, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 3.932009167303285, |
| "grad_norm": 0.5941210989208424, |
| "learning_rate": 1.9208336699844695e-05, |
| "loss": 0.4621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1600552201271057, |
| "step": 2575, |
| "valid_targets_mean": 3049.6, |
| "valid_targets_min": 1331 |
| }, |
| { |
| "epoch": 3.9396485867074102, |
| "grad_norm": 0.6554685877224805, |
| "learning_rate": 1.913226093087581e-05, |
| "loss": 0.5097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22393539547920227, |
| "step": 2580, |
| "valid_targets_mean": 3305.1, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 3.9472880061115356, |
| "grad_norm": 0.7422842219293272, |
| "learning_rate": 1.905619773870052e-05, |
| "loss": 0.4846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29345467686653137, |
| "step": 2585, |
| "valid_targets_mean": 3128.4, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 3.9549274255156606, |
| "grad_norm": 0.6220768386463338, |
| "learning_rate": 1.898014822575977e-05, |
| "loss": 0.4482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17033663392066956, |
| "step": 2590, |
| "valid_targets_mean": 2552.4, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 3.962566844919786, |
| "grad_norm": 0.6903241768662477, |
| "learning_rate": 1.890411349429623e-05, |
| "loss": 0.4633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20769096910953522, |
| "step": 2595, |
| "valid_targets_mean": 2664.8, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 3.9702062643239113, |
| "grad_norm": 0.6154692002970737, |
| "learning_rate": 1.8828094646338323e-05, |
| "loss": 0.4755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22253820300102234, |
| "step": 2600, |
| "valid_targets_mean": 3467.6, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 3.9778456837280367, |
| "grad_norm": 0.5858709827232779, |
| "learning_rate": 1.875209278368428e-05, |
| "loss": 0.4247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25010430812835693, |
| "step": 2605, |
| "valid_targets_mean": 4649.6, |
| "valid_targets_min": 2062 |
| }, |
| { |
| "epoch": 3.985485103132162, |
| "grad_norm": 0.7705722890771514, |
| "learning_rate": 1.867610900788612e-05, |
| "loss": 0.4601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24480944871902466, |
| "step": 2610, |
| "valid_targets_mean": 2811.4, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 3.993124522536287, |
| "grad_norm": 0.7432406655539916, |
| "learning_rate": 1.8600144420233752e-05, |
| "loss": 0.4532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3015478551387787, |
| "step": 2615, |
| "valid_targets_mean": 3291.5, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 4.0, |
| "grad_norm": 1.118384436602522, |
| "learning_rate": 1.8524200121738948e-05, |
| "loss": 0.492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5947331190109253, |
| "step": 2620, |
| "valid_targets_mean": 2656.5, |
| "valid_targets_min": 455 |
| }, |
| { |
| "epoch": 4.007639419404125, |
| "grad_norm": 0.7690026283732248, |
| "learning_rate": 1.844827721311943e-05, |
| "loss": 0.4482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21468114852905273, |
| "step": 2625, |
| "valid_targets_mean": 3231.8, |
| "valid_targets_min": 1540 |
| }, |
| { |
| "epoch": 4.015278838808251, |
| "grad_norm": 0.681129686061914, |
| "learning_rate": 1.83723767947829e-05, |
| "loss": 0.4226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1789844036102295, |
| "step": 2630, |
| "valid_targets_mean": 2767.0, |
| "valid_targets_min": 1733 |
| }, |
| { |
| "epoch": 4.022918258212376, |
| "grad_norm": 0.710910135229329, |
| "learning_rate": 1.829649996681108e-05, |
| "loss": 0.4452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22730287909507751, |
| "step": 2635, |
| "valid_targets_mean": 3989.2, |
| "valid_targets_min": 1211 |
| }, |
| { |
| "epoch": 4.0305576776165015, |
| "grad_norm": 0.7390014967088522, |
| "learning_rate": 1.8220647828943798e-05, |
| "loss": 0.419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1696176379919052, |
| "step": 2640, |
| "valid_targets_mean": 2481.0, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 4.0381970970206265, |
| "grad_norm": 0.7079151818997759, |
| "learning_rate": 1.8144821480563004e-05, |
| "loss": 0.4246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18761557340621948, |
| "step": 2645, |
| "valid_targets_mean": 2711.4, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 4.045836516424751, |
| "grad_norm": 0.7977337206226138, |
| "learning_rate": 1.8069022020676883e-05, |
| "loss": 0.4329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2581322193145752, |
| "step": 2650, |
| "valid_targets_mean": 2545.1, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 4.053475935828877, |
| "grad_norm": 0.706216871603318, |
| "learning_rate": 1.7993250547903898e-05, |
| "loss": 0.4365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16597332060337067, |
| "step": 2655, |
| "valid_targets_mean": 2274.2, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 4.061115355233002, |
| "grad_norm": 0.6452920539721788, |
| "learning_rate": 1.791750816045687e-05, |
| "loss": 0.4409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20056098699569702, |
| "step": 2660, |
| "valid_targets_mean": 4523.8, |
| "valid_targets_min": 464 |
| }, |
| { |
| "epoch": 4.068754774637128, |
| "grad_norm": 0.7588857980340116, |
| "learning_rate": 1.7841795956127076e-05, |
| "loss": 0.4164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2161455899477005, |
| "step": 2665, |
| "valid_targets_mean": 2293.6, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 4.076394194041253, |
| "grad_norm": 0.6876134340921465, |
| "learning_rate": 1.7766115032268313e-05, |
| "loss": 0.4106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.299022912979126, |
| "step": 2670, |
| "valid_targets_mean": 4430.9, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 4.084033613445378, |
| "grad_norm": 0.6926601809186282, |
| "learning_rate": 1.769046648578102e-05, |
| "loss": 0.4538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2319658249616623, |
| "step": 2675, |
| "valid_targets_mean": 3480.9, |
| "valid_targets_min": 1354 |
| }, |
| { |
| "epoch": 4.091673032849504, |
| "grad_norm": 0.6594589767473226, |
| "learning_rate": 1.7614851413096338e-05, |
| "loss": 0.4423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19595220685005188, |
| "step": 2680, |
| "valid_targets_mean": 3187.6, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 4.099312452253629, |
| "grad_norm": 0.790419683409844, |
| "learning_rate": 1.753927091016029e-05, |
| "loss": 0.423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20953130722045898, |
| "step": 2685, |
| "valid_targets_mean": 3638.5, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 4.106951871657754, |
| "grad_norm": 0.7733355338048273, |
| "learning_rate": 1.746372607241782e-05, |
| "loss": 0.4761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20323872566223145, |
| "step": 2690, |
| "valid_targets_mean": 2683.2, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 4.114591291061879, |
| "grad_norm": 0.6552366064915041, |
| "learning_rate": 1.738821799479696e-05, |
| "loss": 0.4312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24009570479393005, |
| "step": 2695, |
| "valid_targets_mean": 3705.1, |
| "valid_targets_min": 1134 |
| }, |
| { |
| "epoch": 4.122230710466004, |
| "grad_norm": 0.7529808173350705, |
| "learning_rate": 1.731274777169296e-05, |
| "loss": 0.4277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14969006180763245, |
| "step": 2700, |
| "valid_targets_mean": 2055.2, |
| "valid_targets_min": 1427 |
| }, |
| { |
| "epoch": 4.12987012987013, |
| "grad_norm": 0.6936218633949953, |
| "learning_rate": 1.72373164969524e-05, |
| "loss": 0.4449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20020580291748047, |
| "step": 2705, |
| "valid_targets_mean": 2911.5, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 4.137509549274255, |
| "grad_norm": 0.6778934162946096, |
| "learning_rate": 1.7161925263857367e-05, |
| "loss": 0.4402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17394796013832092, |
| "step": 2710, |
| "valid_targets_mean": 2909.0, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 4.145148968678381, |
| "grad_norm": 0.7116686368909119, |
| "learning_rate": 1.7086575165109576e-05, |
| "loss": 0.4603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23824220895767212, |
| "step": 2715, |
| "valid_targets_mean": 3688.0, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 4.152788388082506, |
| "grad_norm": 0.7389107606127957, |
| "learning_rate": 1.7011267292814567e-05, |
| "loss": 0.416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2256026566028595, |
| "step": 2720, |
| "valid_targets_mean": 3048.5, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 4.160427807486631, |
| "grad_norm": 0.6209290096899042, |
| "learning_rate": 1.6936002738465852e-05, |
| "loss": 0.4299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2748083174228668, |
| "step": 2725, |
| "valid_targets_mean": 5696.2, |
| "valid_targets_min": 1923 |
| }, |
| { |
| "epoch": 4.168067226890757, |
| "grad_norm": 0.7609911879557028, |
| "learning_rate": 1.686078259292911e-05, |
| "loss": 0.4333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22729676961898804, |
| "step": 2730, |
| "valid_targets_mean": 3419.4, |
| "valid_targets_min": 2046 |
| }, |
| { |
| "epoch": 4.1757066462948815, |
| "grad_norm": 0.7136364581542297, |
| "learning_rate": 1.6785607946426365e-05, |
| "loss": 0.431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2431565523147583, |
| "step": 2735, |
| "valid_targets_mean": 4014.6, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 4.1833460656990065, |
| "grad_norm": 0.653814674078787, |
| "learning_rate": 1.671047988852019e-05, |
| "loss": 0.4323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26763594150543213, |
| "step": 2740, |
| "valid_targets_mean": 4340.1, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 4.190985485103132, |
| "grad_norm": 0.6477365295148055, |
| "learning_rate": 1.663539950809792e-05, |
| "loss": 0.4154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20111311972141266, |
| "step": 2745, |
| "valid_targets_mean": 3306.9, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 4.198624904507257, |
| "grad_norm": 0.6923380432257537, |
| "learning_rate": 1.6560367893355852e-05, |
| "loss": 0.4078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15234971046447754, |
| "step": 2750, |
| "valid_targets_mean": 2417.6, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 4.206264323911383, |
| "grad_norm": 0.7693482875043431, |
| "learning_rate": 1.6485386131783495e-05, |
| "loss": 0.4319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2205432653427124, |
| "step": 2755, |
| "valid_targets_mean": 2677.0, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 4.213903743315508, |
| "grad_norm": 0.615414794511978, |
| "learning_rate": 1.6410455310147797e-05, |
| "loss": 0.4536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2940524220466614, |
| "step": 2760, |
| "valid_targets_mean": 3730.5, |
| "valid_targets_min": 1592 |
| }, |
| { |
| "epoch": 4.221543162719633, |
| "grad_norm": 0.7076306553236521, |
| "learning_rate": 1.63355765144774e-05, |
| "loss": 0.4086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16093017160892487, |
| "step": 2765, |
| "valid_targets_mean": 3209.5, |
| "valid_targets_min": 1221 |
| }, |
| { |
| "epoch": 4.229182582123759, |
| "grad_norm": 0.8056253074864008, |
| "learning_rate": 1.6260750830046876e-05, |
| "loss": 0.4166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.245550736784935, |
| "step": 2770, |
| "valid_targets_mean": 3017.1, |
| "valid_targets_min": 1784 |
| }, |
| { |
| "epoch": 4.236822001527884, |
| "grad_norm": 0.748600942244156, |
| "learning_rate": 1.6185979341361037e-05, |
| "loss": 0.4275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19234326481819153, |
| "step": 2775, |
| "valid_targets_mean": 2891.6, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 4.2444614209320095, |
| "grad_norm": 0.5918768300976833, |
| "learning_rate": 1.6111263132139198e-05, |
| "loss": 0.4173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2575937509536743, |
| "step": 2780, |
| "valid_targets_mean": 5343.8, |
| "valid_targets_min": 2623 |
| }, |
| { |
| "epoch": 4.2521008403361344, |
| "grad_norm": 0.7756708955173703, |
| "learning_rate": 1.6036603285299443e-05, |
| "loss": 0.4585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19431465864181519, |
| "step": 2785, |
| "valid_targets_mean": 2496.0, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 4.259740259740259, |
| "grad_norm": 0.7551317271285645, |
| "learning_rate": 1.596200088294297e-05, |
| "loss": 0.4041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2065984159708023, |
| "step": 2790, |
| "valid_targets_mean": 2938.9, |
| "valid_targets_min": 1360 |
| }, |
| { |
| "epoch": 4.267379679144385, |
| "grad_norm": 0.7576742731600777, |
| "learning_rate": 1.588745700633839e-05, |
| "loss": 0.4341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2416866570711136, |
| "step": 2795, |
| "valid_targets_mean": 2821.4, |
| "valid_targets_min": 1032 |
| }, |
| { |
| "epoch": 4.27501909854851, |
| "grad_norm": 0.7111031081474437, |
| "learning_rate": 1.5812972735906066e-05, |
| "loss": 0.4069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13971193134784698, |
| "step": 2800, |
| "valid_targets_mean": 2554.2, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 4.282658517952636, |
| "grad_norm": 0.6615809212808664, |
| "learning_rate": 1.5738549151202407e-05, |
| "loss": 0.4319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20371738076210022, |
| "step": 2805, |
| "valid_targets_mean": 3638.4, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 4.290297937356761, |
| "grad_norm": 0.8364032589879101, |
| "learning_rate": 1.5664187330904306e-05, |
| "loss": 0.4446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19082514941692352, |
| "step": 2810, |
| "valid_targets_mean": 2542.2, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 4.297937356760886, |
| "grad_norm": 0.7049427991206001, |
| "learning_rate": 1.5589888352793436e-05, |
| "loss": 0.4502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22058123350143433, |
| "step": 2815, |
| "valid_targets_mean": 4915.6, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 4.305576776165012, |
| "grad_norm": 0.7212184176724953, |
| "learning_rate": 1.5515653293740637e-05, |
| "loss": 0.4387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25808072090148926, |
| "step": 2820, |
| "valid_targets_mean": 3785.6, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 4.313216195569137, |
| "grad_norm": 0.6826238022765982, |
| "learning_rate": 1.544148322969035e-05, |
| "loss": 0.4278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22490471601486206, |
| "step": 2825, |
| "valid_targets_mean": 3405.4, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 4.320855614973262, |
| "grad_norm": 0.8261773124931177, |
| "learning_rate": 1.5367379235644973e-05, |
| "loss": 0.4179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19495196640491486, |
| "step": 2830, |
| "valid_targets_mean": 2450.9, |
| "valid_targets_min": 1140 |
| }, |
| { |
| "epoch": 4.328495034377387, |
| "grad_norm": 0.6390880153692574, |
| "learning_rate": 1.529334238564932e-05, |
| "loss": 0.4201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17437967658042908, |
| "step": 2835, |
| "valid_targets_mean": 4055.9, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 4.336134453781512, |
| "grad_norm": 0.7703651186273575, |
| "learning_rate": 1.521937375277501e-05, |
| "loss": 0.4335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18413357436656952, |
| "step": 2840, |
| "valid_targets_mean": 2652.8, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 4.343773873185638, |
| "grad_norm": 0.6368753230093523, |
| "learning_rate": 1.5145474409104962e-05, |
| "loss": 0.4265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2968963384628296, |
| "step": 2845, |
| "valid_targets_mean": 4633.8, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 4.351413292589763, |
| "grad_norm": 0.5903985232599476, |
| "learning_rate": 1.507164542571784e-05, |
| "loss": 0.4196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18544989824295044, |
| "step": 2850, |
| "valid_targets_mean": 3483.8, |
| "valid_targets_min": 407 |
| }, |
| { |
| "epoch": 4.359052711993888, |
| "grad_norm": 0.662217973508679, |
| "learning_rate": 1.49978878726725e-05, |
| "loss": 0.4607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17374002933502197, |
| "step": 2855, |
| "valid_targets_mean": 2742.6, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 4.366692131398014, |
| "grad_norm": 0.6636333553320053, |
| "learning_rate": 1.4924202818992517e-05, |
| "loss": 0.4384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3518938720226288, |
| "step": 2860, |
| "valid_targets_mean": 4384.1, |
| "valid_targets_min": 1059 |
| }, |
| { |
| "epoch": 4.374331550802139, |
| "grad_norm": 0.8000423908088488, |
| "learning_rate": 1.4850591332650679e-05, |
| "loss": 0.4178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17594996094703674, |
| "step": 2865, |
| "valid_targets_mean": 2390.4, |
| "valid_targets_min": 1549 |
| }, |
| { |
| "epoch": 4.381970970206265, |
| "grad_norm": 0.6055308221886132, |
| "learning_rate": 1.4777054480553514e-05, |
| "loss": 0.4552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24170832335948944, |
| "step": 2870, |
| "valid_targets_mean": 4342.2, |
| "valid_targets_min": 975 |
| }, |
| { |
| "epoch": 4.3896103896103895, |
| "grad_norm": 0.6903510024741975, |
| "learning_rate": 1.47035933285258e-05, |
| "loss": 0.4326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21987634897232056, |
| "step": 2875, |
| "valid_targets_mean": 3401.8, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 4.3972498090145145, |
| "grad_norm": 0.6979371022754717, |
| "learning_rate": 1.4630208941295156e-05, |
| "loss": 0.399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1578153818845749, |
| "step": 2880, |
| "valid_targets_mean": 2634.9, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 4.40488922841864, |
| "grad_norm": 0.7514413276024192, |
| "learning_rate": 1.4556902382476579e-05, |
| "loss": 0.4158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23249536752700806, |
| "step": 2885, |
| "valid_targets_mean": 3987.5, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 4.412528647822765, |
| "grad_norm": 0.7198762011769154, |
| "learning_rate": 1.448367471455705e-05, |
| "loss": 0.4487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.207943394780159, |
| "step": 2890, |
| "valid_targets_mean": 2996.8, |
| "valid_targets_min": 1069 |
| }, |
| { |
| "epoch": 4.420168067226891, |
| "grad_norm": 0.6599812130280833, |
| "learning_rate": 1.4410526998880122e-05, |
| "loss": 0.4602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23088182508945465, |
| "step": 2895, |
| "valid_targets_mean": 4051.1, |
| "valid_targets_min": 1394 |
| }, |
| { |
| "epoch": 4.427807486631016, |
| "grad_norm": 0.9040364751596435, |
| "learning_rate": 1.4337460295630531e-05, |
| "loss": 0.4528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2535208463668823, |
| "step": 2900, |
| "valid_targets_mean": 4407.2, |
| "valid_targets_min": 1606 |
| }, |
| { |
| "epoch": 4.435446906035141, |
| "grad_norm": 0.6946233200223303, |
| "learning_rate": 1.4264475663818864e-05, |
| "loss": 0.4225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20772013068199158, |
| "step": 2905, |
| "valid_targets_mean": 3627.0, |
| "valid_targets_min": 1727 |
| }, |
| { |
| "epoch": 4.443086325439267, |
| "grad_norm": 0.6996399854509193, |
| "learning_rate": 1.419157416126615e-05, |
| "loss": 0.4594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23996701836585999, |
| "step": 2910, |
| "valid_targets_mean": 3127.0, |
| "valid_targets_min": 751 |
| }, |
| { |
| "epoch": 4.450725744843392, |
| "grad_norm": 0.6603193020020982, |
| "learning_rate": 1.4118756844588585e-05, |
| "loss": 0.4441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22003193199634552, |
| "step": 2915, |
| "valid_targets_mean": 4034.8, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 4.4583651642475175, |
| "grad_norm": 0.667399183048132, |
| "learning_rate": 1.4046024769182194e-05, |
| "loss": 0.4148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23613163828849792, |
| "step": 2920, |
| "valid_targets_mean": 4173.1, |
| "valid_targets_min": 1640 |
| }, |
| { |
| "epoch": 4.466004583651642, |
| "grad_norm": 0.8259826448808988, |
| "learning_rate": 1.3973378989207535e-05, |
| "loss": 0.4363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2937498092651367, |
| "step": 2925, |
| "valid_targets_mean": 3235.8, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 4.473644003055767, |
| "grad_norm": 0.7033941655509587, |
| "learning_rate": 1.3900820557574425e-05, |
| "loss": 0.4472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23923955857753754, |
| "step": 2930, |
| "valid_targets_mean": 4048.2, |
| "valid_targets_min": 1459 |
| }, |
| { |
| "epoch": 4.481283422459893, |
| "grad_norm": 0.7454285606687833, |
| "learning_rate": 1.3828350525926663e-05, |
| "loss": 0.4237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21835088729858398, |
| "step": 2935, |
| "valid_targets_mean": 2663.1, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 4.488922841864018, |
| "grad_norm": 0.7110475251004348, |
| "learning_rate": 1.3755969944626823e-05, |
| "loss": 0.4194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2952437996864319, |
| "step": 2940, |
| "valid_targets_mean": 4387.2, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 4.496562261268144, |
| "grad_norm": 0.8828237294270216, |
| "learning_rate": 1.368367986274098e-05, |
| "loss": 0.4394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2030916064977646, |
| "step": 2945, |
| "valid_targets_mean": 1706.4, |
| "valid_targets_min": 813 |
| }, |
| { |
| "epoch": 4.504201680672269, |
| "grad_norm": 0.6954473223855169, |
| "learning_rate": 1.3611481328023554e-05, |
| "loss": 0.4564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25050777196884155, |
| "step": 2950, |
| "valid_targets_mean": 3577.8, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 4.511841100076394, |
| "grad_norm": 0.6422040953597707, |
| "learning_rate": 1.3539375386902092e-05, |
| "loss": 0.4139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19034726917743683, |
| "step": 2955, |
| "valid_targets_mean": 3637.6, |
| "valid_targets_min": 784 |
| }, |
| { |
| "epoch": 4.51948051948052, |
| "grad_norm": 0.813407071704735, |
| "learning_rate": 1.3467363084462122e-05, |
| "loss": 0.4588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22248804569244385, |
| "step": 2960, |
| "valid_targets_mean": 2901.4, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 4.527119938884645, |
| "grad_norm": 0.598255408018068, |
| "learning_rate": 1.3395445464431997e-05, |
| "loss": 0.4403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2788901925086975, |
| "step": 2965, |
| "valid_targets_mean": 5120.8, |
| "valid_targets_min": 1669 |
| }, |
| { |
| "epoch": 4.53475935828877, |
| "grad_norm": 0.7320702572816888, |
| "learning_rate": 1.3323623569167748e-05, |
| "loss": 0.4426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2455928921699524, |
| "step": 2970, |
| "valid_targets_mean": 3704.1, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 4.542398777692895, |
| "grad_norm": 0.8656712332196725, |
| "learning_rate": 1.3251898439638025e-05, |
| "loss": 0.4323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28234678506851196, |
| "step": 2975, |
| "valid_targets_mean": 2744.9, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 4.55003819709702, |
| "grad_norm": 0.6145036757635849, |
| "learning_rate": 1.3180271115408944e-05, |
| "loss": 0.4606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20645278692245483, |
| "step": 2980, |
| "valid_targets_mean": 4847.0, |
| "valid_targets_min": 1823 |
| }, |
| { |
| "epoch": 4.557677616501146, |
| "grad_norm": 0.7084910960235971, |
| "learning_rate": 1.310874263462909e-05, |
| "loss": 0.409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17451977729797363, |
| "step": 2985, |
| "valid_targets_mean": 2182.5, |
| "valid_targets_min": 831 |
| }, |
| { |
| "epoch": 4.565317035905271, |
| "grad_norm": 0.6562259432752094, |
| "learning_rate": 1.303731403401441e-05, |
| "loss": 0.4415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2443830817937851, |
| "step": 2990, |
| "valid_targets_mean": 4561.2, |
| "valid_targets_min": 2325 |
| }, |
| { |
| "epoch": 4.572956455309397, |
| "grad_norm": 0.696214858440501, |
| "learning_rate": 1.2965986348833229e-05, |
| "loss": 0.4487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27823278307914734, |
| "step": 2995, |
| "valid_targets_mean": 4183.0, |
| "valid_targets_min": 1061 |
| }, |
| { |
| "epoch": 4.580595874713522, |
| "grad_norm": 0.7307211959598596, |
| "learning_rate": 1.2894760612891219e-05, |
| "loss": 0.4133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17543989419937134, |
| "step": 3000, |
| "valid_targets_mean": 3196.6, |
| "valid_targets_min": 915 |
| }, |
| { |
| "epoch": 4.588235294117647, |
| "grad_norm": 0.7005195593755522, |
| "learning_rate": 1.2823637858516432e-05, |
| "loss": 0.4569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24170951545238495, |
| "step": 3005, |
| "valid_targets_mean": 3459.9, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 4.595874713521773, |
| "grad_norm": 0.7209567127788638, |
| "learning_rate": 1.2752619116544333e-05, |
| "loss": 0.4303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22956225275993347, |
| "step": 3010, |
| "valid_targets_mean": 3502.8, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 4.6035141329258975, |
| "grad_norm": 0.6653489435920646, |
| "learning_rate": 1.2681705416302839e-05, |
| "loss": 0.4554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18298763036727905, |
| "step": 3015, |
| "valid_targets_mean": 3679.9, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 4.611153552330023, |
| "grad_norm": 0.7852042606455901, |
| "learning_rate": 1.2610897785597441e-05, |
| "loss": 0.458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2998313307762146, |
| "step": 3020, |
| "valid_targets_mean": 3142.8, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 4.618792971734148, |
| "grad_norm": 0.7486001259075058, |
| "learning_rate": 1.2540197250696266e-05, |
| "loss": 0.4231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27724653482437134, |
| "step": 3025, |
| "valid_targets_mean": 3724.6, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 4.626432391138273, |
| "grad_norm": 0.6340367863972102, |
| "learning_rate": 1.2469604836315237e-05, |
| "loss": 0.4362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3218015730381012, |
| "step": 3030, |
| "valid_targets_mean": 5287.8, |
| "valid_targets_min": 1415 |
| }, |
| { |
| "epoch": 4.634071810542399, |
| "grad_norm": 0.8297601491978646, |
| "learning_rate": 1.2399121565603203e-05, |
| "loss": 0.4173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27993282675743103, |
| "step": 3035, |
| "valid_targets_mean": 3140.9, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 4.641711229946524, |
| "grad_norm": 0.8392576086594048, |
| "learning_rate": 1.2328748460127095e-05, |
| "loss": 0.4372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24703417718410492, |
| "step": 3040, |
| "valid_targets_mean": 2254.0, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 4.64935064935065, |
| "grad_norm": 0.76403301632943, |
| "learning_rate": 1.2258486539857163e-05, |
| "loss": 0.4339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.214448019862175, |
| "step": 3045, |
| "valid_targets_mean": 2798.6, |
| "valid_targets_min": 1137 |
| }, |
| { |
| "epoch": 4.656990068754775, |
| "grad_norm": 0.7607712205600897, |
| "learning_rate": 1.2188336823152137e-05, |
| "loss": 0.456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2419661283493042, |
| "step": 3050, |
| "valid_targets_mean": 3125.0, |
| "valid_targets_min": 1810 |
| }, |
| { |
| "epoch": 4.6646294881589, |
| "grad_norm": 0.6780774718582251, |
| "learning_rate": 1.2118300326744525e-05, |
| "loss": 0.4407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2228745073080063, |
| "step": 3055, |
| "valid_targets_mean": 3821.5, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 4.6722689075630255, |
| "grad_norm": 0.7415756571172493, |
| "learning_rate": 1.2048378065725821e-05, |
| "loss": 0.4282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21102388203144073, |
| "step": 3060, |
| "valid_targets_mean": 2965.5, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 4.67990832696715, |
| "grad_norm": 0.826558813326542, |
| "learning_rate": 1.1978571053531848e-05, |
| "loss": 0.4675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27071088552474976, |
| "step": 3065, |
| "valid_targets_mean": 3043.9, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 4.687547746371276, |
| "grad_norm": 0.8463261732397126, |
| "learning_rate": 1.1908880301928012e-05, |
| "loss": 0.4489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25644421577453613, |
| "step": 3070, |
| "valid_targets_mean": 2437.5, |
| "valid_targets_min": 1480 |
| }, |
| { |
| "epoch": 4.695187165775401, |
| "grad_norm": 0.7807727309561482, |
| "learning_rate": 1.1839306820994692e-05, |
| "loss": 0.4537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23279087245464325, |
| "step": 3075, |
| "valid_targets_mean": 3059.1, |
| "valid_targets_min": 1494 |
| }, |
| { |
| "epoch": 4.702826585179526, |
| "grad_norm": 0.664795453987691, |
| "learning_rate": 1.1769851619112571e-05, |
| "loss": 0.4268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1653788685798645, |
| "step": 3080, |
| "valid_targets_mean": 2827.6, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 4.710466004583652, |
| "grad_norm": 0.7404044663755746, |
| "learning_rate": 1.1700515702948003e-05, |
| "loss": 0.4363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18012934923171997, |
| "step": 3085, |
| "valid_targets_mean": 2408.6, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 4.718105423987777, |
| "grad_norm": 0.6959670506262801, |
| "learning_rate": 1.1631300077438474e-05, |
| "loss": 0.4032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1842706799507141, |
| "step": 3090, |
| "valid_targets_mean": 2286.6, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 4.725744843391903, |
| "grad_norm": 0.6789388370499856, |
| "learning_rate": 1.1562205745777976e-05, |
| "loss": 0.4147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16564428806304932, |
| "step": 3095, |
| "valid_targets_mean": 3138.4, |
| "valid_targets_min": 1894 |
| }, |
| { |
| "epoch": 4.733384262796028, |
| "grad_norm": 0.6829775331974125, |
| "learning_rate": 1.149323370940254e-05, |
| "loss": 0.4374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20033124089241028, |
| "step": 3100, |
| "valid_targets_mean": 2759.4, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 4.741023682200153, |
| "grad_norm": 0.6955835942094102, |
| "learning_rate": 1.1424384967975638e-05, |
| "loss": 0.4386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19949236512184143, |
| "step": 3105, |
| "valid_targets_mean": 2783.8, |
| "valid_targets_min": 1222 |
| }, |
| { |
| "epoch": 4.748663101604278, |
| "grad_norm": 0.8058435461758185, |
| "learning_rate": 1.1355660519373757e-05, |
| "loss": 0.4324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2256844937801361, |
| "step": 3110, |
| "valid_targets_mean": 3453.5, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 4.756302521008403, |
| "grad_norm": 0.543464576904595, |
| "learning_rate": 1.1287061359671918e-05, |
| "loss": 0.4511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1765793263912201, |
| "step": 3115, |
| "valid_targets_mean": 4341.4, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 4.763941940412528, |
| "grad_norm": 0.6367461792370757, |
| "learning_rate": 1.1218588483129226e-05, |
| "loss": 0.4428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.232584148645401, |
| "step": 3120, |
| "valid_targets_mean": 3673.0, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 4.771581359816654, |
| "grad_norm": 0.635073599945755, |
| "learning_rate": 1.115024288217447e-05, |
| "loss": 0.4254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18331608176231384, |
| "step": 3125, |
| "valid_targets_mean": 3576.4, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 4.779220779220779, |
| "grad_norm": 0.7428588724353016, |
| "learning_rate": 1.1082025547391742e-05, |
| "loss": 0.4409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22744230926036835, |
| "step": 3130, |
| "valid_targets_mean": 2550.1, |
| "valid_targets_min": 951 |
| }, |
| { |
| "epoch": 4.786860198624905, |
| "grad_norm": 0.831972596497422, |
| "learning_rate": 1.1013937467506075e-05, |
| "loss": 0.4348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24062250554561615, |
| "step": 3135, |
| "valid_targets_mean": 2996.0, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 4.79449961802903, |
| "grad_norm": 0.7072316785824789, |
| "learning_rate": 1.0945979629369103e-05, |
| "loss": 0.4284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20350953936576843, |
| "step": 3140, |
| "valid_targets_mean": 3159.4, |
| "valid_targets_min": 1559 |
| }, |
| { |
| "epoch": 4.802139037433155, |
| "grad_norm": 0.7422268731369834, |
| "learning_rate": 1.0878153017944801e-05, |
| "loss": 0.4664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37612760066986084, |
| "step": 3145, |
| "valid_targets_mean": 4292.4, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 4.809778456837281, |
| "grad_norm": 0.7624693176548212, |
| "learning_rate": 1.0810458616295146e-05, |
| "loss": 0.4421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21782265603542328, |
| "step": 3150, |
| "valid_targets_mean": 2382.0, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 4.8174178762414055, |
| "grad_norm": 0.7281106937968902, |
| "learning_rate": 1.0742897405565892e-05, |
| "loss": 0.4394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2107025533914566, |
| "step": 3155, |
| "valid_targets_mean": 3610.5, |
| "valid_targets_min": 1363 |
| }, |
| { |
| "epoch": 4.825057295645531, |
| "grad_norm": 0.6543758653177835, |
| "learning_rate": 1.0675470364972412e-05, |
| "loss": 0.4434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2604054808616638, |
| "step": 3160, |
| "valid_targets_mean": 4376.6, |
| "valid_targets_min": 1138 |
| }, |
| { |
| "epoch": 4.832696715049656, |
| "grad_norm": 0.7376066895580519, |
| "learning_rate": 1.0608178471785369e-05, |
| "loss": 0.4605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2066906839609146, |
| "step": 3165, |
| "valid_targets_mean": 2716.8, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 4.840336134453781, |
| "grad_norm": 0.867558948336844, |
| "learning_rate": 1.0541022701316704e-05, |
| "loss": 0.415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22561189532279968, |
| "step": 3170, |
| "valid_targets_mean": 2282.2, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 4.847975553857907, |
| "grad_norm": 0.753345607833048, |
| "learning_rate": 1.0474004026905393e-05, |
| "loss": 0.4214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17792923748493195, |
| "step": 3175, |
| "valid_targets_mean": 2575.5, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 4.855614973262032, |
| "grad_norm": 0.6965195935418431, |
| "learning_rate": 1.040712341990338e-05, |
| "loss": 0.4427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21977144479751587, |
| "step": 3180, |
| "valid_targets_mean": 3192.2, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 4.863254392666157, |
| "grad_norm": 0.7244562227938083, |
| "learning_rate": 1.0340381849661512e-05, |
| "loss": 0.4209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20825041830539703, |
| "step": 3185, |
| "valid_targets_mean": 2705.8, |
| "valid_targets_min": 1218 |
| }, |
| { |
| "epoch": 4.870893812070283, |
| "grad_norm": 1.1658836220367665, |
| "learning_rate": 1.027378028351545e-05, |
| "loss": 0.4843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23123201727867126, |
| "step": 3190, |
| "valid_targets_mean": 2676.0, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 4.878533231474408, |
| "grad_norm": 0.6428607046807531, |
| "learning_rate": 1.020731968677168e-05, |
| "loss": 0.4559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2840641140937805, |
| "step": 3195, |
| "valid_targets_mean": 4760.5, |
| "valid_targets_min": 1489 |
| }, |
| { |
| "epoch": 4.8861726508785335, |
| "grad_norm": 0.6424493789075727, |
| "learning_rate": 1.0141001022693513e-05, |
| "loss": 0.4392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19804728031158447, |
| "step": 3200, |
| "valid_targets_mean": 4134.6, |
| "valid_targets_min": 1719 |
| }, |
| { |
| "epoch": 4.893812070282658, |
| "grad_norm": 0.6689835440970003, |
| "learning_rate": 1.0074825252487124e-05, |
| "loss": 0.4411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25073152780532837, |
| "step": 3205, |
| "valid_targets_mean": 4041.5, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 4.901451489686783, |
| "grad_norm": 0.6395385434248182, |
| "learning_rate": 1.0008793335287605e-05, |
| "loss": 0.4115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18766605854034424, |
| "step": 3210, |
| "valid_targets_mean": 3877.2, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 4.909090909090909, |
| "grad_norm": 0.5500861300454841, |
| "learning_rate": 9.942906228145123e-06, |
| "loss": 0.4486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19914793968200684, |
| "step": 3215, |
| "valid_targets_mean": 5092.1, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 4.916730328495034, |
| "grad_norm": 0.7386027211516123, |
| "learning_rate": 9.877164886010938e-06, |
| "loss": 0.4429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2817431688308716, |
| "step": 3220, |
| "valid_targets_mean": 4743.6, |
| "valid_targets_min": 1186 |
| }, |
| { |
| "epoch": 4.92436974789916, |
| "grad_norm": 0.7019719562878625, |
| "learning_rate": 9.811570261723676e-06, |
| "loss": 0.4377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19408079981803894, |
| "step": 3225, |
| "valid_targets_mean": 3703.9, |
| "valid_targets_min": 2009 |
| }, |
| { |
| "epoch": 4.932009167303285, |
| "grad_norm": 0.5384230165710143, |
| "learning_rate": 9.746123305995476e-06, |
| "loss": 0.4166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2503221035003662, |
| "step": 3230, |
| "valid_targets_mean": 5923.2, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 4.93964858670741, |
| "grad_norm": 0.5960933611824211, |
| "learning_rate": 9.68082496739816e-06, |
| "loss": 0.4418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16890287399291992, |
| "step": 3235, |
| "valid_targets_mean": 3072.4, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 4.947288006111536, |
| "grad_norm": 0.6770220213062155, |
| "learning_rate": 9.615676192349577e-06, |
| "loss": 0.4071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2525444030761719, |
| "step": 3240, |
| "valid_targets_mean": 4509.0, |
| "valid_targets_min": 1865 |
| }, |
| { |
| "epoch": 4.954927425515661, |
| "grad_norm": 0.6485055817592701, |
| "learning_rate": 9.550677925099815e-06, |
| "loss": 0.4239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1657400280237198, |
| "step": 3245, |
| "valid_targets_mean": 3076.2, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 4.962566844919786, |
| "grad_norm": 0.6337463064952114, |
| "learning_rate": 9.485831107717547e-06, |
| "loss": 0.4375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18350504338741302, |
| "step": 3250, |
| "valid_targets_mean": 3156.8, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 4.970206264323911, |
| "grad_norm": 0.7324159499991673, |
| "learning_rate": 9.421136680076365e-06, |
| "loss": 0.4194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22422681748867035, |
| "step": 3255, |
| "valid_targets_mean": 3919.8, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 4.977845683728036, |
| "grad_norm": 0.7105972910190749, |
| "learning_rate": 9.356595579841158e-06, |
| "loss": 0.4544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23887526988983154, |
| "step": 3260, |
| "valid_targets_mean": 3753.4, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 4.985485103132162, |
| "grad_norm": 0.7336493987221758, |
| "learning_rate": 9.292208742454549e-06, |
| "loss": 0.4498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2927570641040802, |
| "step": 3265, |
| "valid_targets_mean": 4896.9, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 4.993124522536287, |
| "grad_norm": 0.6727667356515784, |
| "learning_rate": 9.227977101123287e-06, |
| "loss": 0.4317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1748276650905609, |
| "step": 3270, |
| "valid_targets_mean": 2757.0, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.9434978159648666, |
| "learning_rate": 9.16390158680476e-06, |
| "loss": 0.4491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4982553720474243, |
| "step": 3275, |
| "valid_targets_mean": 3907.4, |
| "valid_targets_min": 2144 |
| }, |
| { |
| "epoch": 5.007639419404125, |
| "grad_norm": 0.6507985228704842, |
| "learning_rate": 9.099983128193481e-06, |
| "loss": 0.411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18580271303653717, |
| "step": 3280, |
| "valid_targets_mean": 2795.2, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 5.015278838808251, |
| "grad_norm": 0.7057074937993735, |
| "learning_rate": 9.036222651707666e-06, |
| "loss": 0.4068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2280879020690918, |
| "step": 3285, |
| "valid_targets_mean": 4809.2, |
| "valid_targets_min": 1883 |
| }, |
| { |
| "epoch": 5.022918258212376, |
| "grad_norm": 0.5656641524682343, |
| "learning_rate": 8.972621081475727e-06, |
| "loss": 0.4542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10994422435760498, |
| "step": 3290, |
| "valid_targets_mean": 2460.4, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 5.0305576776165015, |
| "grad_norm": 0.8761421207054235, |
| "learning_rate": 8.909179339322971e-06, |
| "loss": 0.4142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22071196138858795, |
| "step": 3295, |
| "valid_targets_mean": 2460.5, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 5.0381970970206265, |
| "grad_norm": 0.7295305809963956, |
| "learning_rate": 8.845898344758199e-06, |
| "loss": 0.4163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19741207361221313, |
| "step": 3300, |
| "valid_targets_mean": 2860.1, |
| "valid_targets_min": 1663 |
| }, |
| { |
| "epoch": 5.045836516424751, |
| "grad_norm": 0.7112452731180018, |
| "learning_rate": 8.782779014960327e-06, |
| "loss": 0.4009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17603464424610138, |
| "step": 3305, |
| "valid_targets_mean": 2539.2, |
| "valid_targets_min": 1289 |
| }, |
| { |
| "epoch": 5.053475935828877, |
| "grad_norm": 0.7839524218700084, |
| "learning_rate": 8.719822264765204e-06, |
| "loss": 0.418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24770452082157135, |
| "step": 3310, |
| "valid_targets_mean": 3061.1, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 5.061115355233002, |
| "grad_norm": 0.6200210304675198, |
| "learning_rate": 8.657029006652247e-06, |
| "loss": 0.3937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1898297518491745, |
| "step": 3315, |
| "valid_targets_mean": 4409.4, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 5.068754774637128, |
| "grad_norm": 0.7448282508495098, |
| "learning_rate": 8.594400150731278e-06, |
| "loss": 0.4165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20044977962970734, |
| "step": 3320, |
| "valid_targets_mean": 3152.1, |
| "valid_targets_min": 1468 |
| }, |
| { |
| "epoch": 5.076394194041253, |
| "grad_norm": 0.7330563381797555, |
| "learning_rate": 8.531936604729315e-06, |
| "loss": 0.4048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2015673816204071, |
| "step": 3325, |
| "valid_targets_mean": 3392.9, |
| "valid_targets_min": 1959 |
| }, |
| { |
| "epoch": 5.084033613445378, |
| "grad_norm": 0.6574570667834281, |
| "learning_rate": 8.469639273977404e-06, |
| "loss": 0.4092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2060699760913849, |
| "step": 3330, |
| "valid_targets_mean": 3534.9, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 5.091673032849504, |
| "grad_norm": 0.7192898176205931, |
| "learning_rate": 8.407509061397525e-06, |
| "loss": 0.4242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19831335544586182, |
| "step": 3335, |
| "valid_targets_mean": 3844.0, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 5.099312452253629, |
| "grad_norm": 0.6989885300271562, |
| "learning_rate": 8.345546867489478e-06, |
| "loss": 0.431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22625543177127838, |
| "step": 3340, |
| "valid_targets_mean": 3683.0, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 5.106951871657754, |
| "grad_norm": 0.6891661447879618, |
| "learning_rate": 8.283753590317844e-06, |
| "loss": 0.4167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1683456003665924, |
| "step": 3345, |
| "valid_targets_mean": 2819.9, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 5.114591291061879, |
| "grad_norm": 0.6744309100184774, |
| "learning_rate": 8.222130125498959e-06, |
| "loss": 0.4175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2619309425354004, |
| "step": 3350, |
| "valid_targets_mean": 4709.9, |
| "valid_targets_min": 1766 |
| }, |
| { |
| "epoch": 5.122230710466004, |
| "grad_norm": 0.7643882359784762, |
| "learning_rate": 8.160677366187973e-06, |
| "loss": 0.4037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24490387737751007, |
| "step": 3355, |
| "valid_targets_mean": 4076.8, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 5.12987012987013, |
| "grad_norm": 0.765032206390207, |
| "learning_rate": 8.099396203065818e-06, |
| "loss": 0.4049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15527962148189545, |
| "step": 3360, |
| "valid_targets_mean": 2164.2, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 5.137509549274255, |
| "grad_norm": 0.672539908906615, |
| "learning_rate": 8.038287524326412e-06, |
| "loss": 0.4215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17782077193260193, |
| "step": 3365, |
| "valid_targets_mean": 3591.0, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 5.145148968678381, |
| "grad_norm": 0.7211933101160407, |
| "learning_rate": 7.977352215663687e-06, |
| "loss": 0.4217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15421822667121887, |
| "step": 3370, |
| "valid_targets_mean": 2195.5, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 5.152788388082506, |
| "grad_norm": 0.8298079760424127, |
| "learning_rate": 7.916591160258801e-06, |
| "loss": 0.4492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18245047330856323, |
| "step": 3375, |
| "valid_targets_mean": 2769.5, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 5.160427807486631, |
| "grad_norm": 0.7848489488943335, |
| "learning_rate": 7.856005238767352e-06, |
| "loss": 0.4031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1802041083574295, |
| "step": 3380, |
| "valid_targets_mean": 2449.5, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 5.168067226890757, |
| "grad_norm": 0.828689552301754, |
| "learning_rate": 7.79559532930656e-06, |
| "loss": 0.4003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17640046775341034, |
| "step": 3385, |
| "valid_targets_mean": 2253.6, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 5.1757066462948815, |
| "grad_norm": 0.8939948317428271, |
| "learning_rate": 7.735362307442587e-06, |
| "loss": 0.4254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20057544112205505, |
| "step": 3390, |
| "valid_targets_mean": 2309.8, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 5.1833460656990065, |
| "grad_norm": 0.7064878087869875, |
| "learning_rate": 7.675307046177824e-06, |
| "loss": 0.444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1704927682876587, |
| "step": 3395, |
| "valid_targets_mean": 3034.6, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 5.190985485103132, |
| "grad_norm": 0.8392581300544377, |
| "learning_rate": 7.615430415938247e-06, |
| "loss": 0.4146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26886194944381714, |
| "step": 3400, |
| "valid_targets_mean": 3126.4, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 5.198624904507257, |
| "grad_norm": 0.5899801518379102, |
| "learning_rate": 7.555733284560791e-06, |
| "loss": 0.4166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19343039393424988, |
| "step": 3405, |
| "valid_targets_mean": 4824.8, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 5.206264323911383, |
| "grad_norm": 0.6828929324395993, |
| "learning_rate": 7.496216517280801e-06, |
| "loss": 0.4104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21579919755458832, |
| "step": 3410, |
| "valid_targets_mean": 3761.9, |
| "valid_targets_min": 2207 |
| }, |
| { |
| "epoch": 5.213903743315508, |
| "grad_norm": 0.7563428889342848, |
| "learning_rate": 7.436880976719447e-06, |
| "loss": 0.4272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22617709636688232, |
| "step": 3415, |
| "valid_targets_mean": 3657.2, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 5.221543162719633, |
| "grad_norm": 0.9220246281743919, |
| "learning_rate": 7.377727522871246e-06, |
| "loss": 0.4128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20721417665481567, |
| "step": 3420, |
| "valid_targets_mean": 2134.1, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 5.229182582123759, |
| "grad_norm": 0.7834904193038889, |
| "learning_rate": 7.318757013091622e-06, |
| "loss": 0.3837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1851697862148285, |
| "step": 3425, |
| "valid_targets_mean": 2451.8, |
| "valid_targets_min": 951 |
| }, |
| { |
| "epoch": 5.236822001527884, |
| "grad_norm": 0.648240952651534, |
| "learning_rate": 7.259970302084405e-06, |
| "loss": 0.3728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18699084222316742, |
| "step": 3430, |
| "valid_targets_mean": 3529.8, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 5.2444614209320095, |
| "grad_norm": 0.8208594769460752, |
| "learning_rate": 7.2013682418895435e-06, |
| "loss": 0.4363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20773524045944214, |
| "step": 3435, |
| "valid_targets_mean": 2560.2, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 5.2521008403361344, |
| "grad_norm": 0.8545535257360884, |
| "learning_rate": 7.142951681870669e-06, |
| "loss": 0.4256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21555760502815247, |
| "step": 3440, |
| "valid_targets_mean": 2220.1, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 5.259740259740259, |
| "grad_norm": 0.7813176036108497, |
| "learning_rate": 7.084721468702822e-06, |
| "loss": 0.3894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22744975984096527, |
| "step": 3445, |
| "valid_targets_mean": 2960.5, |
| "valid_targets_min": 1632 |
| }, |
| { |
| "epoch": 5.267379679144385, |
| "grad_norm": 0.7830401754519163, |
| "learning_rate": 7.026678446360204e-06, |
| "loss": 0.3987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18200945854187012, |
| "step": 3450, |
| "valid_targets_mean": 2975.2, |
| "valid_targets_min": 1274 |
| }, |
| { |
| "epoch": 5.27501909854851, |
| "grad_norm": 0.7338311439811203, |
| "learning_rate": 6.9688234561038925e-06, |
| "loss": 0.4252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16019290685653687, |
| "step": 3455, |
| "valid_targets_mean": 2500.2, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 5.282658517952636, |
| "grad_norm": 0.7882790373444832, |
| "learning_rate": 6.911157336469685e-06, |
| "loss": 0.4159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18955618143081665, |
| "step": 3460, |
| "valid_targets_mean": 3472.8, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 5.290297937356761, |
| "grad_norm": 0.8243210594375885, |
| "learning_rate": 6.853680923255932e-06, |
| "loss": 0.4084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24365636706352234, |
| "step": 3465, |
| "valid_targets_mean": 3001.8, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 5.297937356760886, |
| "grad_norm": 0.7590409540259425, |
| "learning_rate": 6.796395049511431e-06, |
| "loss": 0.4149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21231132745742798, |
| "step": 3470, |
| "valid_targets_mean": 3273.2, |
| "valid_targets_min": 931 |
| }, |
| { |
| "epoch": 5.305576776165012, |
| "grad_norm": 1.0632303615019383, |
| "learning_rate": 6.739300545523335e-06, |
| "loss": 0.4052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2338356226682663, |
| "step": 3475, |
| "valid_targets_mean": 3178.6, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 5.313216195569137, |
| "grad_norm": 0.756230519495017, |
| "learning_rate": 6.682398238805161e-06, |
| "loss": 0.4145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24491998553276062, |
| "step": 3480, |
| "valid_targets_mean": 2977.2, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 5.320855614973262, |
| "grad_norm": 0.845343670274438, |
| "learning_rate": 6.625688954084739e-06, |
| "loss": 0.3901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1987672746181488, |
| "step": 3485, |
| "valid_targets_mean": 2708.9, |
| "valid_targets_min": 871 |
| }, |
| { |
| "epoch": 5.328495034377387, |
| "grad_norm": 0.7592874195569738, |
| "learning_rate": 6.569173513292289e-06, |
| "loss": 0.4121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2058597207069397, |
| "step": 3490, |
| "valid_targets_mean": 2993.6, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 5.336134453781512, |
| "grad_norm": 0.7987958580833625, |
| "learning_rate": 6.512852735548529e-06, |
| "loss": 0.4422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18779411911964417, |
| "step": 3495, |
| "valid_targets_mean": 2571.9, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 5.343773873185638, |
| "grad_norm": 0.6740552418391473, |
| "learning_rate": 6.456727437152737e-06, |
| "loss": 0.4181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21062324941158295, |
| "step": 3500, |
| "valid_targets_mean": 3471.2, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 5.351413292589763, |
| "grad_norm": 0.7949901183059733, |
| "learning_rate": 6.400798431571009e-06, |
| "loss": 0.4309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19252058863639832, |
| "step": 3505, |
| "valid_targets_mean": 2609.5, |
| "valid_targets_min": 1768 |
| }, |
| { |
| "epoch": 5.359052711993888, |
| "grad_norm": 0.9011653868394018, |
| "learning_rate": 6.345066529424391e-06, |
| "loss": 0.4146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19950778782367706, |
| "step": 3510, |
| "valid_targets_mean": 2509.4, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 5.366692131398014, |
| "grad_norm": 0.8226863591976814, |
| "learning_rate": 6.289532538477163e-06, |
| "loss": 0.4199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16507697105407715, |
| "step": 3515, |
| "valid_targets_mean": 2465.1, |
| "valid_targets_min": 1014 |
| }, |
| { |
| "epoch": 5.374331550802139, |
| "grad_norm": 0.7702667277518003, |
| "learning_rate": 6.234197263625157e-06, |
| "loss": 0.4154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18763992190361023, |
| "step": 3520, |
| "valid_targets_mean": 2658.5, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 5.381970970206265, |
| "grad_norm": 0.7546441510309715, |
| "learning_rate": 6.179061506884018e-06, |
| "loss": 0.4036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20631533861160278, |
| "step": 3525, |
| "valid_targets_mean": 3253.8, |
| "valid_targets_min": 1863 |
| }, |
| { |
| "epoch": 5.3896103896103895, |
| "grad_norm": 1.0332493720632743, |
| "learning_rate": 6.124126067377669e-06, |
| "loss": 0.4486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18635576963424683, |
| "step": 3530, |
| "valid_targets_mean": 2523.4, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 5.3972498090145145, |
| "grad_norm": 0.8600167635311569, |
| "learning_rate": 6.069391741326658e-06, |
| "loss": 0.4272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23452191054821014, |
| "step": 3535, |
| "valid_targets_mean": 3307.4, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 5.40488922841864, |
| "grad_norm": 0.7472968803751108, |
| "learning_rate": 6.014859322036655e-06, |
| "loss": 0.475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25068214535713196, |
| "step": 3540, |
| "valid_targets_mean": 3746.0, |
| "valid_targets_min": 1742 |
| }, |
| { |
| "epoch": 5.412528647822765, |
| "grad_norm": 0.7724354110335331, |
| "learning_rate": 5.960529599886933e-06, |
| "loss": 0.4249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2862878441810608, |
| "step": 3545, |
| "valid_targets_mean": 3475.9, |
| "valid_targets_min": 871 |
| }, |
| { |
| "epoch": 5.420168067226891, |
| "grad_norm": 0.5927597795747025, |
| "learning_rate": 5.906403362318953e-06, |
| "loss": 0.4233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13544148206710815, |
| "step": 3550, |
| "valid_targets_mean": 3212.5, |
| "valid_targets_min": 1620 |
| }, |
| { |
| "epoch": 5.427807486631016, |
| "grad_norm": 0.8215858475471198, |
| "learning_rate": 5.852481393824876e-06, |
| "loss": 0.4273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1856689155101776, |
| "step": 3555, |
| "valid_targets_mean": 2500.4, |
| "valid_targets_min": 436 |
| }, |
| { |
| "epoch": 5.435446906035141, |
| "grad_norm": 0.7534978382823645, |
| "learning_rate": 5.7987644759362715e-06, |
| "loss": 0.4056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2625764310359955, |
| "step": 3560, |
| "valid_targets_mean": 3408.6, |
| "valid_targets_min": 1712 |
| }, |
| { |
| "epoch": 5.443086325439267, |
| "grad_norm": 0.7365666325994856, |
| "learning_rate": 5.745253387212759e-06, |
| "loss": 0.4148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22502942383289337, |
| "step": 3565, |
| "valid_targets_mean": 3521.4, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 5.450725744843392, |
| "grad_norm": 0.7997567097717743, |
| "learning_rate": 5.691948903230691e-06, |
| "loss": 0.3924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2259596586227417, |
| "step": 3570, |
| "valid_targets_mean": 3082.4, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 5.4583651642475175, |
| "grad_norm": 0.8822731379082949, |
| "learning_rate": 5.638851796571974e-06, |
| "loss": 0.4349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22405478358268738, |
| "step": 3575, |
| "valid_targets_mean": 2302.9, |
| "valid_targets_min": 962 |
| }, |
| { |
| "epoch": 5.466004583651642, |
| "grad_norm": 0.7443175145614003, |
| "learning_rate": 5.585962836812822e-06, |
| "loss": 0.4053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3522719144821167, |
| "step": 3580, |
| "valid_targets_mean": 4707.1, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 5.473644003055767, |
| "grad_norm": 0.7684422668048446, |
| "learning_rate": 5.533282790512624e-06, |
| "loss": 0.3872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18864914774894714, |
| "step": 3585, |
| "valid_targets_mean": 2916.6, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 5.481283422459893, |
| "grad_norm": 0.6752647565568806, |
| "learning_rate": 5.480812421202828e-06, |
| "loss": 0.4047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17078009247779846, |
| "step": 3590, |
| "valid_targets_mean": 3693.9, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 5.488922841864018, |
| "grad_norm": 0.815831254632104, |
| "learning_rate": 5.428552489375876e-06, |
| "loss": 0.4002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18773040175437927, |
| "step": 3595, |
| "valid_targets_mean": 2936.0, |
| "valid_targets_min": 1065 |
| }, |
| { |
| "epoch": 5.496562261268144, |
| "grad_norm": 0.6615077791531486, |
| "learning_rate": 5.376503752474191e-06, |
| "loss": 0.3985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13504765927791595, |
| "step": 3600, |
| "valid_targets_mean": 3119.9, |
| "valid_targets_min": 606 |
| }, |
| { |
| "epoch": 5.504201680672269, |
| "grad_norm": 0.6605364243810754, |
| "learning_rate": 5.32466696487918e-06, |
| "loss": 0.417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17553292214870453, |
| "step": 3605, |
| "valid_targets_mean": 3754.2, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 5.511841100076394, |
| "grad_norm": 0.6762092368293349, |
| "learning_rate": 5.273042877900308e-06, |
| "loss": 0.4103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14567619562149048, |
| "step": 3610, |
| "valid_targets_mean": 2932.9, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 5.51948051948052, |
| "grad_norm": 0.6178381332291257, |
| "learning_rate": 5.221632239764207e-06, |
| "loss": 0.4082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16620564460754395, |
| "step": 3615, |
| "valid_targets_mean": 4656.1, |
| "valid_targets_min": 2486 |
| }, |
| { |
| "epoch": 5.527119938884645, |
| "grad_norm": 0.7235563732760826, |
| "learning_rate": 5.170435795603863e-06, |
| "loss": 0.4218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1886502504348755, |
| "step": 3620, |
| "valid_targets_mean": 3256.5, |
| "valid_targets_min": 1766 |
| }, |
| { |
| "epoch": 5.53475935828877, |
| "grad_norm": 0.8302130888371341, |
| "learning_rate": 5.119454287447738e-06, |
| "loss": 0.4508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29996421933174133, |
| "step": 3625, |
| "valid_targets_mean": 3539.0, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 5.542398777692895, |
| "grad_norm": 0.6664804259859938, |
| "learning_rate": 5.068688454209114e-06, |
| "loss": 0.4187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20061370730400085, |
| "step": 3630, |
| "valid_targets_mean": 4539.8, |
| "valid_targets_min": 2136 |
| }, |
| { |
| "epoch": 5.55003819709702, |
| "grad_norm": 0.8158756541380983, |
| "learning_rate": 5.018139031675309e-06, |
| "loss": 0.3994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.287477046251297, |
| "step": 3635, |
| "valid_targets_mean": 3718.4, |
| "valid_targets_min": 1199 |
| }, |
| { |
| "epoch": 5.557677616501146, |
| "grad_norm": 0.7383633611419538, |
| "learning_rate": 4.967806752497036e-06, |
| "loss": 0.4128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20177043974399567, |
| "step": 3640, |
| "valid_targets_mean": 3811.8, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 5.565317035905271, |
| "grad_norm": 0.6984282055877477, |
| "learning_rate": 4.917692346177804e-06, |
| "loss": 0.4224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18860375881195068, |
| "step": 3645, |
| "valid_targets_mean": 2725.0, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 5.572956455309397, |
| "grad_norm": 0.7157370657179769, |
| "learning_rate": 4.8677965390633145e-06, |
| "loss": 0.4094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1753612458705902, |
| "step": 3650, |
| "valid_targets_mean": 3218.1, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 5.580595874713522, |
| "grad_norm": 0.8658457792874761, |
| "learning_rate": 4.818120054330946e-06, |
| "loss": 0.4224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23552726209163666, |
| "step": 3655, |
| "valid_targets_mean": 2594.4, |
| "valid_targets_min": 1090 |
| }, |
| { |
| "epoch": 5.588235294117647, |
| "grad_norm": 0.6971295570889691, |
| "learning_rate": 4.768663611979276e-06, |
| "loss": 0.4246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18920549750328064, |
| "step": 3660, |
| "valid_targets_mean": 2897.9, |
| "valid_targets_min": 1045 |
| }, |
| { |
| "epoch": 5.595874713521773, |
| "grad_norm": 0.7536367310381494, |
| "learning_rate": 4.719427928817637e-06, |
| "loss": 0.3903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23616181313991547, |
| "step": 3665, |
| "valid_targets_mean": 3631.9, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 5.6035141329258975, |
| "grad_norm": 0.7259568515171714, |
| "learning_rate": 4.670413718455753e-06, |
| "loss": 0.4041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16838884353637695, |
| "step": 3670, |
| "valid_targets_mean": 3266.1, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 5.611153552330023, |
| "grad_norm": 0.6880333970118933, |
| "learning_rate": 4.6216216912933546e-06, |
| "loss": 0.4116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17340365052223206, |
| "step": 3675, |
| "valid_targets_mean": 4112.2, |
| "valid_targets_min": 983 |
| }, |
| { |
| "epoch": 5.618792971734148, |
| "grad_norm": 0.6469773412047066, |
| "learning_rate": 4.5730525545099095e-06, |
| "loss": 0.4107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17914192378520966, |
| "step": 3680, |
| "valid_targets_mean": 4227.9, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 5.626432391138273, |
| "grad_norm": 0.7773716945089362, |
| "learning_rate": 4.524707012054368e-06, |
| "loss": 0.4294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15195128321647644, |
| "step": 3685, |
| "valid_targets_mean": 2487.1, |
| "valid_targets_min": 1543 |
| }, |
| { |
| "epoch": 5.634071810542399, |
| "grad_norm": 0.7776984018425589, |
| "learning_rate": 4.476585764634975e-06, |
| "loss": 0.4114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1720089614391327, |
| "step": 3690, |
| "valid_targets_mean": 2077.1, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 5.641711229946524, |
| "grad_norm": 0.7688079872450757, |
| "learning_rate": 4.4286895097090695e-06, |
| "loss": 0.4307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16758956015110016, |
| "step": 3695, |
| "valid_targets_mean": 2742.0, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 5.64935064935065, |
| "grad_norm": 0.8486912659015311, |
| "learning_rate": 4.381018941473037e-06, |
| "loss": 0.4381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19494405388832092, |
| "step": 3700, |
| "valid_targets_mean": 2297.6, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 5.656990068754775, |
| "grad_norm": 0.6372751365054492, |
| "learning_rate": 4.333574750852194e-06, |
| "loss": 0.4181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16869252920150757, |
| "step": 3705, |
| "valid_targets_mean": 3551.4, |
| "valid_targets_min": 1137 |
| }, |
| { |
| "epoch": 5.6646294881589, |
| "grad_norm": 0.7390356711726472, |
| "learning_rate": 4.2863576254908e-06, |
| "loss": 0.4226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2157163769006729, |
| "step": 3710, |
| "valid_targets_mean": 3476.8, |
| "valid_targets_min": 1540 |
| }, |
| { |
| "epoch": 5.6722689075630255, |
| "grad_norm": 0.6872901624459158, |
| "learning_rate": 4.239368249742102e-06, |
| "loss": 0.4236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13273492455482483, |
| "step": 3715, |
| "valid_targets_mean": 3911.5, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 5.67990832696715, |
| "grad_norm": 0.6586970729788763, |
| "learning_rate": 4.192607304658387e-06, |
| "loss": 0.4125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2191186547279358, |
| "step": 3720, |
| "valid_targets_mean": 4228.1, |
| "valid_targets_min": 2073 |
| }, |
| { |
| "epoch": 5.687547746371276, |
| "grad_norm": 0.749146299694098, |
| "learning_rate": 4.146075467981125e-06, |
| "loss": 0.4663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23675943911075592, |
| "step": 3725, |
| "valid_targets_mean": 3733.4, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 5.695187165775401, |
| "grad_norm": 0.7237635954729931, |
| "learning_rate": 4.09977341413115e-06, |
| "loss": 0.4271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2258036732673645, |
| "step": 3730, |
| "valid_targets_mean": 3386.2, |
| "valid_targets_min": 1131 |
| }, |
| { |
| "epoch": 5.702826585179526, |
| "grad_norm": 0.8123035113980734, |
| "learning_rate": 4.053701814198882e-06, |
| "loss": 0.4025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21003013849258423, |
| "step": 3735, |
| "valid_targets_mean": 2482.4, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 5.710466004583652, |
| "grad_norm": 0.8015439623306877, |
| "learning_rate": 4.0078613359345884e-06, |
| "loss": 0.4187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21075120568275452, |
| "step": 3740, |
| "valid_targets_mean": 2767.1, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 5.718105423987777, |
| "grad_norm": 1.0739970964489634, |
| "learning_rate": 3.962252643738742e-06, |
| "loss": 0.4154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23278754949569702, |
| "step": 3745, |
| "valid_targets_mean": 4178.6, |
| "valid_targets_min": 2456 |
| }, |
| { |
| "epoch": 5.725744843391903, |
| "grad_norm": 0.8237327127175776, |
| "learning_rate": 3.916876398652338e-06, |
| "loss": 0.4236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19142091274261475, |
| "step": 3750, |
| "valid_targets_mean": 2622.1, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 5.733384262796028, |
| "grad_norm": 0.7601068750941172, |
| "learning_rate": 3.8717332583473545e-06, |
| "loss": 0.4194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21591442823410034, |
| "step": 3755, |
| "valid_targets_mean": 2982.9, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 5.741023682200153, |
| "grad_norm": 0.6831402579456276, |
| "learning_rate": 3.826823877117218e-06, |
| "loss": 0.402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23567482829093933, |
| "step": 3760, |
| "valid_targets_mean": 4372.5, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 5.748663101604278, |
| "grad_norm": 0.7518305106243018, |
| "learning_rate": 3.7821489058672754e-06, |
| "loss": 0.3925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19822347164154053, |
| "step": 3765, |
| "valid_targets_mean": 2959.9, |
| "valid_targets_min": 1891 |
| }, |
| { |
| "epoch": 5.756302521008403, |
| "grad_norm": 0.7856806336487985, |
| "learning_rate": 3.7377089921054355e-06, |
| "loss": 0.4083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1958726942539215, |
| "step": 3770, |
| "valid_targets_mean": 2575.6, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 5.763941940412528, |
| "grad_norm": 0.820934440949876, |
| "learning_rate": 3.6935047799327107e-06, |
| "loss": 0.4336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23241233825683594, |
| "step": 3775, |
| "valid_targets_mean": 2996.4, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 5.771581359816654, |
| "grad_norm": 0.7654930925671581, |
| "learning_rate": 3.649536910033926e-06, |
| "loss": 0.4282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29833102226257324, |
| "step": 3780, |
| "valid_targets_mean": 3378.2, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 5.779220779220779, |
| "grad_norm": 0.6768166172539385, |
| "learning_rate": 3.605806019668432e-06, |
| "loss": 0.4232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1405220776796341, |
| "step": 3785, |
| "valid_targets_mean": 2789.8, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 5.786860198624905, |
| "grad_norm": 0.772007067318885, |
| "learning_rate": 3.562312742660825e-06, |
| "loss": 0.4247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20937494933605194, |
| "step": 3790, |
| "valid_targets_mean": 3826.2, |
| "valid_targets_min": 1032 |
| }, |
| { |
| "epoch": 5.79449961802903, |
| "grad_norm": 0.9119664688683919, |
| "learning_rate": 3.5190577093918266e-06, |
| "loss": 0.4449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2521716356277466, |
| "step": 3795, |
| "valid_targets_mean": 2620.5, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 5.802139037433155, |
| "grad_norm": 0.7883929824332396, |
| "learning_rate": 3.476041546789095e-06, |
| "loss": 0.4243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16708248853683472, |
| "step": 3800, |
| "valid_targets_mean": 2520.9, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 5.809778456837281, |
| "grad_norm": 0.7676063261588877, |
| "learning_rate": 3.433264878318159e-06, |
| "loss": 0.4288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1724417507648468, |
| "step": 3805, |
| "valid_targets_mean": 2547.8, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 5.8174178762414055, |
| "grad_norm": 0.6236657792139778, |
| "learning_rate": 3.390728323973376e-06, |
| "loss": 0.4071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21887004375457764, |
| "step": 3810, |
| "valid_targets_mean": 3950.0, |
| "valid_targets_min": 1549 |
| }, |
| { |
| "epoch": 5.825057295645531, |
| "grad_norm": 0.6774652652821819, |
| "learning_rate": 3.3484325002689653e-06, |
| "loss": 0.4448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1620153933763504, |
| "step": 3815, |
| "valid_targets_mean": 2540.0, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 5.832696715049656, |
| "grad_norm": 0.7869552702440537, |
| "learning_rate": 3.3063780202300365e-06, |
| "loss": 0.4425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21578902006149292, |
| "step": 3820, |
| "valid_targets_mean": 3193.5, |
| "valid_targets_min": 1207 |
| }, |
| { |
| "epoch": 5.840336134453781, |
| "grad_norm": 0.7777560326400809, |
| "learning_rate": 3.264565493383729e-06, |
| "loss": 0.4271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19921430945396423, |
| "step": 3825, |
| "valid_targets_mean": 2760.4, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 5.847975553857907, |
| "grad_norm": 0.7448361766226455, |
| "learning_rate": 3.222995525750392e-06, |
| "loss": 0.3845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18640117347240448, |
| "step": 3830, |
| "valid_targets_mean": 2556.9, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 5.855614973262032, |
| "grad_norm": 0.7582221040698467, |
| "learning_rate": 3.181668719834745e-06, |
| "loss": 0.4, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2028721570968628, |
| "step": 3835, |
| "valid_targets_mean": 2988.4, |
| "valid_targets_min": 1683 |
| }, |
| { |
| "epoch": 5.863254392666157, |
| "grad_norm": 0.8320638276938915, |
| "learning_rate": 3.14058567461722e-06, |
| "loss": 0.415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22501055896282196, |
| "step": 3840, |
| "valid_targets_mean": 3268.4, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 5.870893812070283, |
| "grad_norm": 0.8161565674228954, |
| "learning_rate": 3.0997469855452222e-06, |
| "loss": 0.4349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24944055080413818, |
| "step": 3845, |
| "valid_targets_mean": 2357.2, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 5.878533231474408, |
| "grad_norm": 0.7146833623918105, |
| "learning_rate": 3.0591532445245155e-06, |
| "loss": 0.4424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2273748219013214, |
| "step": 3850, |
| "valid_targets_mean": 3512.4, |
| "valid_targets_min": 425 |
| }, |
| { |
| "epoch": 5.8861726508785335, |
| "grad_norm": 0.7530428991334562, |
| "learning_rate": 3.0188050399106726e-06, |
| "loss": 0.414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22839196026325226, |
| "step": 3855, |
| "valid_targets_mean": 3654.9, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 5.893812070282658, |
| "grad_norm": 0.7187394717038206, |
| "learning_rate": 2.9787029565004856e-06, |
| "loss": 0.4129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16635143756866455, |
| "step": 3860, |
| "valid_targets_mean": 2724.4, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 5.901451489686783, |
| "grad_norm": 0.8174325937619282, |
| "learning_rate": 2.93884757552356e-06, |
| "loss": 0.3855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2066618800163269, |
| "step": 3865, |
| "valid_targets_mean": 2795.5, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 5.909090909090909, |
| "grad_norm": 0.809517014176693, |
| "learning_rate": 2.8992394746338457e-06, |
| "loss": 0.4305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21883273124694824, |
| "step": 3870, |
| "valid_targets_mean": 3162.0, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 5.916730328495034, |
| "grad_norm": 0.7913869749669057, |
| "learning_rate": 2.8598792279012745e-06, |
| "loss": 0.4229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2036246955394745, |
| "step": 3875, |
| "valid_targets_mean": 3123.5, |
| "valid_targets_min": 1275 |
| }, |
| { |
| "epoch": 5.92436974789916, |
| "grad_norm": 0.7449934448241319, |
| "learning_rate": 2.8207674058034374e-06, |
| "loss": 0.4367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19343721866607666, |
| "step": 3880, |
| "valid_targets_mean": 3974.1, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 5.932009167303285, |
| "grad_norm": 0.702412074741444, |
| "learning_rate": 2.7819045752173425e-06, |
| "loss": 0.3896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15918338298797607, |
| "step": 3885, |
| "valid_targets_mean": 3438.9, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 5.93964858670741, |
| "grad_norm": 0.7471411887353139, |
| "learning_rate": 2.7432912994111417e-06, |
| "loss": 0.4329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.206735759973526, |
| "step": 3890, |
| "valid_targets_mean": 3419.1, |
| "valid_targets_min": 1536 |
| }, |
| { |
| "epoch": 5.947288006111536, |
| "grad_norm": 0.78771027659784, |
| "learning_rate": 2.7049281380360382e-06, |
| "loss": 0.443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3115561008453369, |
| "step": 3895, |
| "valid_targets_mean": 3303.0, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 5.954927425515661, |
| "grad_norm": 0.7524415873142796, |
| "learning_rate": 2.666815647118117e-06, |
| "loss": 0.4348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23538583517074585, |
| "step": 3900, |
| "valid_targets_mean": 3236.2, |
| "valid_targets_min": 1325 |
| }, |
| { |
| "epoch": 5.962566844919786, |
| "grad_norm": 0.6883297919046488, |
| "learning_rate": 2.6289543790503103e-06, |
| "loss": 0.4034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2727777659893036, |
| "step": 3905, |
| "valid_targets_mean": 4847.6, |
| "valid_targets_min": 1004 |
| }, |
| { |
| "epoch": 5.970206264323911, |
| "grad_norm": 0.7745226944687247, |
| "learning_rate": 2.591344882584401e-06, |
| "loss": 0.4449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19000530242919922, |
| "step": 3910, |
| "valid_targets_mean": 2781.6, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 5.977845683728036, |
| "grad_norm": 0.6578254545339572, |
| "learning_rate": 2.5539877028230442e-06, |
| "loss": 0.4289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13370674848556519, |
| "step": 3915, |
| "valid_targets_mean": 2355.8, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 5.985485103132162, |
| "grad_norm": 0.8718248131787556, |
| "learning_rate": 2.5168833812118855e-06, |
| "loss": 0.4427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21779406070709229, |
| "step": 3920, |
| "valid_targets_mean": 2524.6, |
| "valid_targets_min": 359 |
| }, |
| { |
| "epoch": 5.993124522536287, |
| "grad_norm": 0.6650728699135563, |
| "learning_rate": 2.480032455531707e-06, |
| "loss": 0.4061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17643976211547852, |
| "step": 3925, |
| "valid_targets_mean": 2614.1, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 6.0, |
| "grad_norm": 1.031459537664997, |
| "learning_rate": 2.443435459890626e-06, |
| "loss": 0.4544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44087493419647217, |
| "step": 3930, |
| "valid_targets_mean": 3814.1, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 6.007639419404125, |
| "grad_norm": 0.6863931120269993, |
| "learning_rate": 2.4070929247163764e-06, |
| "loss": 0.4425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.252174437046051, |
| "step": 3935, |
| "valid_targets_mean": 3363.9, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 6.015278838808251, |
| "grad_norm": 0.8065060516729766, |
| "learning_rate": 2.371005376748596e-06, |
| "loss": 0.381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19682547450065613, |
| "step": 3940, |
| "valid_targets_mean": 2635.6, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 6.022918258212376, |
| "grad_norm": 0.6875190773960217, |
| "learning_rate": 2.3351733390312005e-06, |
| "loss": 0.4147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1877930611371994, |
| "step": 3945, |
| "valid_targets_mean": 3125.6, |
| "valid_targets_min": 1002 |
| }, |
| { |
| "epoch": 6.0305576776165015, |
| "grad_norm": 0.7113750000743607, |
| "learning_rate": 2.2995973309048013e-06, |
| "loss": 0.3916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18945392966270447, |
| "step": 3950, |
| "valid_targets_mean": 3022.5, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 6.0381970970206265, |
| "grad_norm": 0.7668863834844798, |
| "learning_rate": 2.2642778679992007e-06, |
| "loss": 0.441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18376567959785461, |
| "step": 3955, |
| "valid_targets_mean": 2929.2, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 6.045836516424751, |
| "grad_norm": 0.6400997176841478, |
| "learning_rate": 2.2292154622258623e-06, |
| "loss": 0.4039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10822135210037231, |
| "step": 3960, |
| "valid_targets_mean": 2783.8, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 6.053475935828877, |
| "grad_norm": 0.6827622640359982, |
| "learning_rate": 2.194410621770566e-06, |
| "loss": 0.395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2305392324924469, |
| "step": 3965, |
| "valid_targets_mean": 4637.6, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 6.061115355233002, |
| "grad_norm": 0.6742130374126593, |
| "learning_rate": 2.1598638510859795e-06, |
| "loss": 0.3969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17292946577072144, |
| "step": 3970, |
| "valid_targets_mean": 3895.4, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 6.068754774637128, |
| "grad_norm": 0.7224201918662315, |
| "learning_rate": 2.1255756508843774e-06, |
| "loss": 0.4092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2280636876821518, |
| "step": 3975, |
| "valid_targets_mean": 3655.5, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 6.076394194041253, |
| "grad_norm": 0.696693155288902, |
| "learning_rate": 2.0915465181303874e-06, |
| "loss": 0.4309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18954971432685852, |
| "step": 3980, |
| "valid_targets_mean": 3254.5, |
| "valid_targets_min": 1125 |
| }, |
| { |
| "epoch": 6.084033613445378, |
| "grad_norm": 0.7159544890081604, |
| "learning_rate": 2.057776946033765e-06, |
| "loss": 0.396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17513585090637207, |
| "step": 3985, |
| "valid_targets_mean": 3132.8, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 6.091673032849504, |
| "grad_norm": 0.7488349752843247, |
| "learning_rate": 2.0242674240422655e-06, |
| "loss": 0.404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14049875736236572, |
| "step": 3990, |
| "valid_targets_mean": 2235.8, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 6.099312452253629, |
| "grad_norm": 0.7563615274137214, |
| "learning_rate": 1.991018437834542e-06, |
| "loss": 0.4378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19269230961799622, |
| "step": 3995, |
| "valid_targets_mean": 3002.5, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 6.106951871657754, |
| "grad_norm": 0.7581872453513444, |
| "learning_rate": 1.9580304693131015e-06, |
| "loss": 0.4248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2181900590658188, |
| "step": 4000, |
| "valid_targets_mean": 3014.9, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 6.114591291061879, |
| "grad_norm": 0.7927614418513154, |
| "learning_rate": 1.925303996597341e-06, |
| "loss": 0.3909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17333531379699707, |
| "step": 4005, |
| "valid_targets_mean": 2303.4, |
| "valid_targets_min": 1163 |
| }, |
| { |
| "epoch": 6.122230710466004, |
| "grad_norm": 0.6627386326218554, |
| "learning_rate": 1.8928394940165828e-06, |
| "loss": 0.422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21585026383399963, |
| "step": 4010, |
| "valid_targets_mean": 4336.9, |
| "valid_targets_min": 962 |
| }, |
| { |
| "epoch": 6.12987012987013, |
| "grad_norm": 0.6910708074716676, |
| "learning_rate": 1.860637432103234e-06, |
| "loss": 0.4067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18705642223358154, |
| "step": 4015, |
| "valid_targets_mean": 3601.0, |
| "valid_targets_min": 1149 |
| }, |
| { |
| "epoch": 6.137509549274255, |
| "grad_norm": 0.654947784139743, |
| "learning_rate": 1.8286982775859407e-06, |
| "loss": 0.3906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21154358983039856, |
| "step": 4020, |
| "valid_targets_mean": 4067.4, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 6.145148968678381, |
| "grad_norm": 0.786026884990914, |
| "learning_rate": 1.7970224933828539e-06, |
| "loss": 0.4181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17581038177013397, |
| "step": 4025, |
| "valid_targets_mean": 2357.8, |
| "valid_targets_min": 1129 |
| }, |
| { |
| "epoch": 6.152788388082506, |
| "grad_norm": 0.6201923882409753, |
| "learning_rate": 1.7656105385948708e-06, |
| "loss": 0.3878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32060492038726807, |
| "step": 4030, |
| "valid_targets_mean": 6241.4, |
| "valid_targets_min": 531 |
| }, |
| { |
| "epoch": 6.160427807486631, |
| "grad_norm": 0.821742202354764, |
| "learning_rate": 1.7344628684990405e-06, |
| "loss": 0.4066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22368258237838745, |
| "step": 4035, |
| "valid_targets_mean": 2545.4, |
| "valid_targets_min": 871 |
| }, |
| { |
| "epoch": 6.168067226890757, |
| "grad_norm": 0.787669642326113, |
| "learning_rate": 1.7035799345419212e-06, |
| "loss": 0.4129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22682487964630127, |
| "step": 4040, |
| "valid_targets_mean": 3353.8, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 6.1757066462948815, |
| "grad_norm": 0.647719500085238, |
| "learning_rate": 1.672962184333049e-06, |
| "loss": 0.4063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25017115473747253, |
| "step": 4045, |
| "valid_targets_mean": 4126.0, |
| "valid_targets_min": 1178 |
| }, |
| { |
| "epoch": 6.1833460656990065, |
| "grad_norm": 0.7747670126199028, |
| "learning_rate": 1.6426100616384654e-06, |
| "loss": 0.4065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16823174059391022, |
| "step": 4050, |
| "valid_targets_mean": 2440.1, |
| "valid_targets_min": 1561 |
| }, |
| { |
| "epoch": 6.190985485103132, |
| "grad_norm": 0.7476785216452516, |
| "learning_rate": 1.6125240063742565e-06, |
| "loss": 0.3991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19015461206436157, |
| "step": 4055, |
| "valid_targets_mean": 3180.9, |
| "valid_targets_min": 903 |
| }, |
| { |
| "epoch": 6.198624904507257, |
| "grad_norm": 0.7815290028556419, |
| "learning_rate": 1.582704454600208e-06, |
| "loss": 0.3961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18614669144153595, |
| "step": 4060, |
| "valid_targets_mean": 2710.0, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 6.206264323911383, |
| "grad_norm": 0.727274439614293, |
| "learning_rate": 1.5531518385134625e-06, |
| "loss": 0.3997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15869663655757904, |
| "step": 4065, |
| "valid_targets_mean": 2874.2, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 6.213903743315508, |
| "grad_norm": 0.7405238943348815, |
| "learning_rate": 1.5238665864422665e-06, |
| "loss": 0.4392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18218465149402618, |
| "step": 4070, |
| "valid_targets_mean": 2788.8, |
| "valid_targets_min": 1449 |
| }, |
| { |
| "epoch": 6.221543162719633, |
| "grad_norm": 0.6971040390142008, |
| "learning_rate": 1.4948491228397544e-06, |
| "loss": 0.3981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15370672941207886, |
| "step": 4075, |
| "valid_targets_mean": 2588.0, |
| "valid_targets_min": 1384 |
| }, |
| { |
| "epoch": 6.229182582123759, |
| "grad_norm": 0.6481267442709662, |
| "learning_rate": 1.4660998682778105e-06, |
| "loss": 0.3941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17396646738052368, |
| "step": 4080, |
| "valid_targets_mean": 3749.6, |
| "valid_targets_min": 1736 |
| }, |
| { |
| "epoch": 6.236822001527884, |
| "grad_norm": 0.7595999593253812, |
| "learning_rate": 1.4376192394409571e-06, |
| "loss": 0.3894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15226925909519196, |
| "step": 4085, |
| "valid_targets_mean": 1917.9, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 6.2444614209320095, |
| "grad_norm": 0.7375012589840757, |
| "learning_rate": 1.409407649120318e-06, |
| "loss": 0.4365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2002945989370346, |
| "step": 4090, |
| "valid_targets_mean": 3363.8, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 6.2521008403361344, |
| "grad_norm": 0.6737898597954428, |
| "learning_rate": 1.38146550620766e-06, |
| "loss": 0.4201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18218186497688293, |
| "step": 4095, |
| "valid_targets_mean": 3539.6, |
| "valid_targets_min": 1262 |
| }, |
| { |
| "epoch": 6.259740259740259, |
| "grad_norm": 0.7675540823076344, |
| "learning_rate": 1.353793215689414e-06, |
| "loss": 0.4405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2069307118654251, |
| "step": 4100, |
| "valid_targets_mean": 2938.4, |
| "valid_targets_min": 1579 |
| }, |
| { |
| "epoch": 6.267379679144385, |
| "grad_norm": 0.8436198032007797, |
| "learning_rate": 1.326391178640869e-06, |
| "loss": 0.4023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20973223447799683, |
| "step": 4105, |
| "valid_targets_mean": 2793.8, |
| "valid_targets_min": 1364 |
| }, |
| { |
| "epoch": 6.27501909854851, |
| "grad_norm": 0.8653534524601917, |
| "learning_rate": 1.2992597922203087e-06, |
| "loss": 0.4166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17687362432479858, |
| "step": 4110, |
| "valid_targets_mean": 2699.1, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 6.282658517952636, |
| "grad_norm": 0.7695788197633405, |
| "learning_rate": 1.2723994496632775e-06, |
| "loss": 0.389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24052169919013977, |
| "step": 4115, |
| "valid_targets_mean": 3462.8, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 6.290297937356761, |
| "grad_norm": 0.9251655508633336, |
| "learning_rate": 1.2458105402768905e-06, |
| "loss": 0.4135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18550032377243042, |
| "step": 4120, |
| "valid_targets_mean": 1907.9, |
| "valid_targets_min": 1138 |
| }, |
| { |
| "epoch": 6.297937356760886, |
| "grad_norm": 0.9075744467608439, |
| "learning_rate": 1.2194934494341548e-06, |
| "loss": 0.4354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1659584939479828, |
| "step": 4125, |
| "valid_targets_mean": 1987.1, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 6.305576776165012, |
| "grad_norm": 0.8343949143994032, |
| "learning_rate": 1.1934485585684286e-06, |
| "loss": 0.4045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18994081020355225, |
| "step": 4130, |
| "valid_targets_mean": 2424.1, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 6.313216195569137, |
| "grad_norm": 0.7719958475586056, |
| "learning_rate": 1.1676762451678592e-06, |
| "loss": 0.4074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15388676524162292, |
| "step": 4135, |
| "valid_targets_mean": 1865.9, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 6.320855614973262, |
| "grad_norm": 0.6607601792071848, |
| "learning_rate": 1.1421768827699297e-06, |
| "loss": 0.3883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21211379766464233, |
| "step": 4140, |
| "valid_targets_mean": 3929.9, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 6.328495034377387, |
| "grad_norm": 0.6647948062348348, |
| "learning_rate": 1.1169508409560326e-06, |
| "loss": 0.3842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14956669509410858, |
| "step": 4145, |
| "valid_targets_mean": 3332.8, |
| "valid_targets_min": 1628 |
| }, |
| { |
| "epoch": 6.336134453781512, |
| "grad_norm": 0.8833312270676275, |
| "learning_rate": 1.091998485346133e-06, |
| "loss": 0.4035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2864078879356384, |
| "step": 4150, |
| "valid_targets_mean": 3066.8, |
| "valid_targets_min": 560 |
| }, |
| { |
| "epoch": 6.343773873185638, |
| "grad_norm": 0.5784561383842487, |
| "learning_rate": 1.067320177593445e-06, |
| "loss": 0.4323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2022693157196045, |
| "step": 4155, |
| "valid_targets_mean": 5883.6, |
| "valid_targets_min": 1397 |
| }, |
| { |
| "epoch": 6.351413292589763, |
| "grad_norm": 0.7000964975069451, |
| "learning_rate": 1.0429162753792044e-06, |
| "loss": 0.3926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17252172529697418, |
| "step": 4160, |
| "valid_targets_mean": 3317.1, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 6.359052711993888, |
| "grad_norm": 0.8238761195026589, |
| "learning_rate": 1.0187871324074817e-06, |
| "loss": 0.3856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1751250922679901, |
| "step": 4165, |
| "valid_targets_mean": 2360.1, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 6.366692131398014, |
| "grad_norm": 0.6494877601984028, |
| "learning_rate": 9.94933098400055e-07, |
| "loss": 0.4099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22490882873535156, |
| "step": 4170, |
| "valid_targets_mean": 4196.5, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 6.374331550802139, |
| "grad_norm": 0.8728852143884642, |
| "learning_rate": 9.713545190913476e-07, |
| "loss": 0.4277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.201102614402771, |
| "step": 4175, |
| "valid_targets_mean": 2424.6, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 6.381970970206265, |
| "grad_norm": 0.749192164055093, |
| "learning_rate": 9.480517362234032e-07, |
| "loss": 0.3976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2019495815038681, |
| "step": 4180, |
| "valid_targets_mean": 3497.0, |
| "valid_targets_min": 1721 |
| }, |
| { |
| "epoch": 6.3896103896103895, |
| "grad_norm": 0.638180410821364, |
| "learning_rate": 9.250250875409383e-07, |
| "loss": 0.393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14714564383029938, |
| "step": 4185, |
| "valid_targets_mean": 3203.1, |
| "valid_targets_min": 1783 |
| }, |
| { |
| "epoch": 6.3972498090145145, |
| "grad_norm": 0.8607560920587862, |
| "learning_rate": 9.022749067864689e-07, |
| "loss": 0.3939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2053133249282837, |
| "step": 4190, |
| "valid_targets_mean": 2401.1, |
| "valid_targets_min": 320 |
| }, |
| { |
| "epoch": 6.40488922841864, |
| "grad_norm": 0.7670657586929429, |
| "learning_rate": 8.798015236954227e-07, |
| "loss": 0.3922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17581060528755188, |
| "step": 4195, |
| "valid_targets_mean": 2269.9, |
| "valid_targets_min": 359 |
| }, |
| { |
| "epoch": 6.412528647822765, |
| "grad_norm": 0.7059107747645008, |
| "learning_rate": 8.57605263991419e-07, |
| "loss": 0.3943, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19902944564819336, |
| "step": 4200, |
| "valid_targets_mean": 3872.6, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 6.420168067226891, |
| "grad_norm": 0.7986131923796598, |
| "learning_rate": 8.356864493815075e-07, |
| "loss": 0.3897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16714152693748474, |
| "step": 4205, |
| "valid_targets_mean": 2283.8, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 6.427807486631016, |
| "grad_norm": 0.7984289049100618, |
| "learning_rate": 8.14045397551515e-07, |
| "loss": 0.4303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19162634015083313, |
| "step": 4210, |
| "valid_targets_mean": 2795.0, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 6.435446906035141, |
| "grad_norm": 1.951568058224522, |
| "learning_rate": 7.926824221614504e-07, |
| "loss": 0.394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23274573683738708, |
| "step": 4215, |
| "valid_targets_mean": 2335.2, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 6.443086325439267, |
| "grad_norm": 0.7101960443226988, |
| "learning_rate": 7.715978328409557e-07, |
| "loss": 0.438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1813594102859497, |
| "step": 4220, |
| "valid_targets_mean": 3580.1, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 6.450725744843392, |
| "grad_norm": 0.6571344450932545, |
| "learning_rate": 7.507919351847981e-07, |
| "loss": 0.4103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18891257047653198, |
| "step": 4225, |
| "valid_targets_mean": 4464.8, |
| "valid_targets_min": 2225 |
| }, |
| { |
| "epoch": 6.4583651642475175, |
| "grad_norm": 0.7851602265875163, |
| "learning_rate": 7.30265030748476e-07, |
| "loss": 0.423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21480068564414978, |
| "step": 4230, |
| "valid_targets_mean": 2892.2, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 6.466004583651642, |
| "grad_norm": 0.8880996159628666, |
| "learning_rate": 7.100174170438201e-07, |
| "loss": 0.4379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25237733125686646, |
| "step": 4235, |
| "valid_targets_mean": 2963.4, |
| "valid_targets_min": 1664 |
| }, |
| { |
| "epoch": 6.473644003055767, |
| "grad_norm": 0.7559016985627138, |
| "learning_rate": 6.900493875346881e-07, |
| "loss": 0.4064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1809263825416565, |
| "step": 4240, |
| "valid_targets_mean": 2675.2, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 6.481283422459893, |
| "grad_norm": 0.8329205888133813, |
| "learning_rate": 6.703612316327235e-07, |
| "loss": 0.3957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18009233474731445, |
| "step": 4245, |
| "valid_targets_mean": 2314.6, |
| "valid_targets_min": 336 |
| }, |
| { |
| "epoch": 6.488922841864018, |
| "grad_norm": 0.7520955113985317, |
| "learning_rate": 6.509532346931458e-07, |
| "loss": 0.427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29548799991607666, |
| "step": 4250, |
| "valid_targets_mean": 4104.2, |
| "valid_targets_min": 1550 |
| }, |
| { |
| "epoch": 6.496562261268144, |
| "grad_norm": 0.6690947855209332, |
| "learning_rate": 6.318256780106202e-07, |
| "loss": 0.3992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18764840066432953, |
| "step": 4255, |
| "valid_targets_mean": 3462.2, |
| "valid_targets_min": 1657 |
| }, |
| { |
| "epoch": 6.504201680672269, |
| "grad_norm": 0.7368821627461865, |
| "learning_rate": 6.129788388151837e-07, |
| "loss": 0.4374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1427152156829834, |
| "step": 4260, |
| "valid_targets_mean": 2727.9, |
| "valid_targets_min": 1300 |
| }, |
| { |
| "epoch": 6.511841100076394, |
| "grad_norm": 0.71263809616908, |
| "learning_rate": 5.94412990268216e-07, |
| "loss": 0.4113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2381899654865265, |
| "step": 4265, |
| "valid_targets_mean": 3497.4, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 6.51948051948052, |
| "grad_norm": 0.6447965631661843, |
| "learning_rate": 5.761284014585044e-07, |
| "loss": 0.4191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14833205938339233, |
| "step": 4270, |
| "valid_targets_mean": 4181.8, |
| "valid_targets_min": 1642 |
| }, |
| { |
| "epoch": 6.527119938884645, |
| "grad_norm": 0.9278788809414662, |
| "learning_rate": 5.581253373983097e-07, |
| "loss": 0.4025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31120574474334717, |
| "step": 4275, |
| "valid_targets_mean": 2991.6, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 6.53475935828877, |
| "grad_norm": 0.8206199783968727, |
| "learning_rate": 5.404040590195548e-07, |
| "loss": 0.4055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21243171393871307, |
| "step": 4280, |
| "valid_targets_mean": 3095.6, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 6.542398777692895, |
| "grad_norm": 0.7123021318130813, |
| "learning_rate": 5.229648231700246e-07, |
| "loss": 0.4031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1695111095905304, |
| "step": 4285, |
| "valid_targets_mean": 3057.0, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 6.55003819709702, |
| "grad_norm": 0.7367430336219517, |
| "learning_rate": 5.058078826096613e-07, |
| "loss": 0.4204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15544866025447845, |
| "step": 4290, |
| "valid_targets_mean": 2747.5, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 6.557677616501146, |
| "grad_norm": 0.8256976164624099, |
| "learning_rate": 4.889334860068706e-07, |
| "loss": 0.4115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25187405943870544, |
| "step": 4295, |
| "valid_targets_mean": 3789.0, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 6.565317035905271, |
| "grad_norm": 0.7000989539122991, |
| "learning_rate": 4.723418779349542e-07, |
| "loss": 0.3866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18330548703670502, |
| "step": 4300, |
| "valid_targets_mean": 3228.8, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 6.572956455309397, |
| "grad_norm": 0.7769235104940684, |
| "learning_rate": 4.560332988685412e-07, |
| "loss": 0.426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16183039546012878, |
| "step": 4305, |
| "valid_targets_mean": 2477.9, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 6.580595874713522, |
| "grad_norm": 0.8338757429293011, |
| "learning_rate": 4.40007985180102e-07, |
| "loss": 0.3835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1706201136112213, |
| "step": 4310, |
| "valid_targets_mean": 2273.8, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 6.588235294117647, |
| "grad_norm": 0.9735838755677048, |
| "learning_rate": 4.242661691365446e-07, |
| "loss": 0.4255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2386619746685028, |
| "step": 4315, |
| "valid_targets_mean": 2037.2, |
| "valid_targets_min": 690 |
| }, |
| { |
| "epoch": 6.595874713521773, |
| "grad_norm": 0.8316266447924147, |
| "learning_rate": 4.088080788958171e-07, |
| "loss": 0.3911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20971032977104187, |
| "step": 4320, |
| "valid_targets_mean": 2690.0, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 6.6035141329258975, |
| "grad_norm": 0.944056483188538, |
| "learning_rate": 3.936339385036236e-07, |
| "loss": 0.41, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18069300055503845, |
| "step": 4325, |
| "valid_targets_mean": 1738.2, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 6.611153552330023, |
| "grad_norm": 0.7536331411489621, |
| "learning_rate": 3.787439678901739e-07, |
| "loss": 0.395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14931751787662506, |
| "step": 4330, |
| "valid_targets_mean": 2758.6, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 6.618792971734148, |
| "grad_norm": 0.7552466450639199, |
| "learning_rate": 3.641383828669831e-07, |
| "loss": 0.4145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22667306661605835, |
| "step": 4335, |
| "valid_targets_mean": 4108.0, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 6.626432391138273, |
| "grad_norm": 0.7452294813232219, |
| "learning_rate": 3.498173951237593e-07, |
| "loss": 0.4177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18081125617027283, |
| "step": 4340, |
| "valid_targets_mean": 2849.5, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 6.634071810542399, |
| "grad_norm": 0.7645301896963309, |
| "learning_rate": 3.3578121222532565e-07, |
| "loss": 0.4204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17134138941764832, |
| "step": 4345, |
| "valid_targets_mean": 2639.2, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 6.641711229946524, |
| "grad_norm": 0.6464171031333205, |
| "learning_rate": 3.2203003760861827e-07, |
| "loss": 0.4402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2736469507217407, |
| "step": 4350, |
| "valid_targets_mean": 4797.0, |
| "valid_targets_min": 1765 |
| }, |
| { |
| "epoch": 6.64935064935065, |
| "grad_norm": 0.9127196120836408, |
| "learning_rate": 3.085640705797266e-07, |
| "loss": 0.4008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24204598367214203, |
| "step": 4355, |
| "valid_targets_mean": 3617.4, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 6.656990068754775, |
| "grad_norm": 0.685182853452726, |
| "learning_rate": 2.953835063110222e-07, |
| "loss": 0.3911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20241063833236694, |
| "step": 4360, |
| "valid_targets_mean": 3864.1, |
| "valid_targets_min": 1061 |
| }, |
| { |
| "epoch": 6.6646294881589, |
| "grad_norm": 0.6833217903769809, |
| "learning_rate": 2.824885358383123e-07, |
| "loss": 0.4095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13412925601005554, |
| "step": 4365, |
| "valid_targets_mean": 2417.9, |
| "valid_targets_min": 1237 |
| }, |
| { |
| "epoch": 6.6722689075630255, |
| "grad_norm": 0.785494709686734, |
| "learning_rate": 2.6987934605808617e-07, |
| "loss": 0.454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19218818843364716, |
| "step": 4370, |
| "valid_targets_mean": 2367.4, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 6.67990832696715, |
| "grad_norm": 0.7628862307702344, |
| "learning_rate": 2.575561197247911e-07, |
| "loss": 0.4354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21473418176174164, |
| "step": 4375, |
| "valid_targets_mean": 3552.5, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 6.687547746371276, |
| "grad_norm": 0.7289251185774825, |
| "learning_rate": 2.4551903544819625e-07, |
| "loss": 0.3982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19578754901885986, |
| "step": 4380, |
| "valid_targets_mean": 4277.5, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 6.695187165775401, |
| "grad_norm": 0.7546985683585661, |
| "learning_rate": 2.3376826769080153e-07, |
| "loss": 0.3993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24338172376155853, |
| "step": 4385, |
| "valid_targets_mean": 3920.4, |
| "valid_targets_min": 425 |
| }, |
| { |
| "epoch": 6.702826585179526, |
| "grad_norm": 0.7218443448066771, |
| "learning_rate": 2.2230398676529763e-07, |
| "loss": 0.3856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2012680470943451, |
| "step": 4390, |
| "valid_targets_mean": 3084.5, |
| "valid_targets_min": 1056 |
| }, |
| { |
| "epoch": 6.710466004583652, |
| "grad_norm": 0.7629253125535567, |
| "learning_rate": 2.1112635883211663e-07, |
| "loss": 0.4006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18300996720790863, |
| "step": 4395, |
| "valid_targets_mean": 2941.1, |
| "valid_targets_min": 1379 |
| }, |
| { |
| "epoch": 6.718105423987777, |
| "grad_norm": 0.8426812792697609, |
| "learning_rate": 2.0023554589701177e-07, |
| "loss": 0.4371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2638070583343506, |
| "step": 4400, |
| "valid_targets_mean": 3378.0, |
| "valid_targets_min": 1189 |
| }, |
| { |
| "epoch": 6.725744843391903, |
| "grad_norm": 0.9125345695540272, |
| "learning_rate": 1.8963170580870384e-07, |
| "loss": 0.3804, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2333306074142456, |
| "step": 4405, |
| "valid_targets_mean": 3033.8, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 6.733384262796028, |
| "grad_norm": 0.7491072210513785, |
| "learning_rate": 1.793149922566051e-07, |
| "loss": 0.389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18493598699569702, |
| "step": 4410, |
| "valid_targets_mean": 2844.1, |
| "valid_targets_min": 1499 |
| }, |
| { |
| "epoch": 6.741023682200153, |
| "grad_norm": 0.7075668630390985, |
| "learning_rate": 1.6928555476859454e-07, |
| "loss": 0.3947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26151540875434875, |
| "step": 4415, |
| "valid_targets_mean": 3931.2, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 6.748663101604278, |
| "grad_norm": 0.6953662547298742, |
| "learning_rate": 1.5954353870883289e-07, |
| "loss": 0.3938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18146592378616333, |
| "step": 4420, |
| "valid_targets_mean": 3214.6, |
| "valid_targets_min": 1157 |
| }, |
| { |
| "epoch": 6.756302521008403, |
| "grad_norm": 0.8442580153908322, |
| "learning_rate": 1.500890852756709e-07, |
| "loss": 0.424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2436636984348297, |
| "step": 4425, |
| "valid_targets_mean": 3346.9, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 6.763941940412528, |
| "grad_norm": 0.7756874677183939, |
| "learning_rate": 1.409223314996e-07, |
| "loss": 0.4071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21483536064624786, |
| "step": 4430, |
| "valid_targets_mean": 2961.0, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 6.771581359816654, |
| "grad_norm": 0.7526769191170677, |
| "learning_rate": 1.3204341024125822e-07, |
| "loss": 0.4216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28000983595848083, |
| "step": 4435, |
| "valid_targets_mean": 3804.1, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 6.779220779220779, |
| "grad_norm": 0.7084850932543485, |
| "learning_rate": 1.234524501895207e-07, |
| "loss": 0.4104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1803816705942154, |
| "step": 4440, |
| "valid_targets_mean": 3388.8, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 6.786860198624905, |
| "grad_norm": 0.6995301576820601, |
| "learning_rate": 1.1514957585961884e-07, |
| "loss": 0.4265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2403801530599594, |
| "step": 4445, |
| "valid_targets_mean": 3688.4, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 6.79449961802903, |
| "grad_norm": 0.7980224363102327, |
| "learning_rate": 1.0713490759133749e-07, |
| "loss": 0.4298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24173349142074585, |
| "step": 4450, |
| "valid_targets_mean": 3873.1, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 6.802139037433155, |
| "grad_norm": 0.938657736390237, |
| "learning_rate": 9.940856154728285e-08, |
| "loss": 0.4038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2338993102312088, |
| "step": 4455, |
| "valid_targets_mean": 2365.4, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 6.809778456837281, |
| "grad_norm": 0.7970620171037146, |
| "learning_rate": 9.197064971118608e-08, |
| "loss": 0.4128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1684938669204712, |
| "step": 4460, |
| "valid_targets_mean": 2387.1, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 6.8174178762414055, |
| "grad_norm": 0.7990434021559547, |
| "learning_rate": 8.482127988628686e-08, |
| "loss": 0.3957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20925235748291016, |
| "step": 4465, |
| "valid_targets_mean": 3208.0, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 6.825057295645531, |
| "grad_norm": 0.711948338122833, |
| "learning_rate": 7.79605556937657e-08, |
| "loss": 0.3905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22843460738658905, |
| "step": 4470, |
| "valid_targets_mean": 3919.1, |
| "valid_targets_min": 1615 |
| }, |
| { |
| "epoch": 6.832696715049656, |
| "grad_norm": 0.7448708465075117, |
| "learning_rate": 7.138857657125187e-08, |
| "loss": 0.3832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16185849905014038, |
| "step": 4475, |
| "valid_targets_mean": 2761.2, |
| "valid_targets_min": 1180 |
| }, |
| { |
| "epoch": 6.840336134453781, |
| "grad_norm": 0.7579937641972179, |
| "learning_rate": 6.510543777136446e-08, |
| "loss": 0.4065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20061391592025757, |
| "step": 4480, |
| "valid_targets_mean": 3314.9, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 6.847975553857907, |
| "grad_norm": 0.7907444070235546, |
| "learning_rate": 5.9111230360358044e-08, |
| "loss": 0.4075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.186139315366745, |
| "step": 4485, |
| "valid_targets_mean": 2889.6, |
| "valid_targets_min": 1288 |
| }, |
| { |
| "epoch": 6.855614973262032, |
| "grad_norm": 0.6975648733688181, |
| "learning_rate": 5.340604121677251e-08, |
| "loss": 0.4429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2715853750705719, |
| "step": 4490, |
| "valid_targets_mean": 5079.4, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 6.863254392666157, |
| "grad_norm": 0.7829068945896205, |
| "learning_rate": 4.798995303020082e-08, |
| "loss": 0.4006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18688000738620758, |
| "step": 4495, |
| "valid_targets_mean": 3115.0, |
| "valid_targets_min": 1063 |
| }, |
| { |
| "epoch": 6.870893812070283, |
| "grad_norm": 0.810646499172978, |
| "learning_rate": 4.286304430006993e-08, |
| "loss": 0.4184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2315147966146469, |
| "step": 4500, |
| "valid_targets_mean": 3839.6, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 6.878533231474408, |
| "grad_norm": 0.7619179750430908, |
| "learning_rate": 3.802538933451949e-08, |
| "loss": 0.3843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1792149543762207, |
| "step": 4505, |
| "valid_targets_mean": 3125.1, |
| "valid_targets_min": 503 |
| }, |
| { |
| "epoch": 6.8861726508785335, |
| "grad_norm": 0.7682971319843082, |
| "learning_rate": 3.34770582493138e-08, |
| "loss": 0.3997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17539235949516296, |
| "step": 4510, |
| "valid_targets_mean": 2813.1, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 6.893812070282658, |
| "grad_norm": 0.845749955999027, |
| "learning_rate": 2.921811696682708e-08, |
| "loss": 0.4075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2827659845352173, |
| "step": 4515, |
| "valid_targets_mean": 3597.2, |
| "valid_targets_min": 517 |
| }, |
| { |
| "epoch": 6.901451489686783, |
| "grad_norm": 0.690837425334579, |
| "learning_rate": 2.5248627215093135e-08, |
| "loss": 0.415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1957932710647583, |
| "step": 4520, |
| "valid_targets_mean": 3684.2, |
| "valid_targets_min": 1370 |
| }, |
| { |
| "epoch": 6.909090909090909, |
| "grad_norm": 0.6881716196186753, |
| "learning_rate": 2.1568646526906045e-08, |
| "loss": 0.4057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14163070917129517, |
| "step": 4525, |
| "valid_targets_mean": 2711.8, |
| "valid_targets_min": 1141 |
| }, |
| { |
| "epoch": 6.916730328495034, |
| "grad_norm": 0.7723694993387338, |
| "learning_rate": 1.8178228238985296e-08, |
| "loss": 0.4415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16728349030017853, |
| "step": 4530, |
| "valid_targets_mean": 2791.1, |
| "valid_targets_min": 2107 |
| }, |
| { |
| "epoch": 6.92436974789916, |
| "grad_norm": 0.7098507533235618, |
| "learning_rate": 1.507742149121194e-08, |
| "loss": 0.438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1468479186296463, |
| "step": 4535, |
| "valid_targets_mean": 2866.5, |
| "valid_targets_min": 813 |
| }, |
| { |
| "epoch": 6.932009167303285, |
| "grad_norm": 0.7742964005350101, |
| "learning_rate": 1.2266271225902515e-08, |
| "loss": 0.406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18890097737312317, |
| "step": 4540, |
| "valid_targets_mean": 3014.0, |
| "valid_targets_min": 1478 |
| }, |
| { |
| "epoch": 6.93964858670741, |
| "grad_norm": 0.7371062150413249, |
| "learning_rate": 9.744818187169547e-09, |
| "loss": 0.4244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25650227069854736, |
| "step": 4545, |
| "valid_targets_mean": 4534.8, |
| "valid_targets_min": 1061 |
| }, |
| { |
| "epoch": 6.947288006111536, |
| "grad_norm": 0.7581755468751333, |
| "learning_rate": 7.513098920324257e-09, |
| "loss": 0.4061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18233633041381836, |
| "step": 4550, |
| "valid_targets_mean": 3266.2, |
| "valid_targets_min": 1629 |
| }, |
| { |
| "epoch": 6.954927425515661, |
| "grad_norm": 0.8049076099781532, |
| "learning_rate": 5.571145771345876e-09, |
| "loss": 0.4024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2446897178888321, |
| "step": 4555, |
| "valid_targets_mean": 3738.0, |
| "valid_targets_min": 1564 |
| }, |
| { |
| "epoch": 6.962566844919786, |
| "grad_norm": 0.8164662192077489, |
| "learning_rate": 3.918986886424225e-09, |
| "loss": 0.3819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18588244915008545, |
| "step": 4560, |
| "valid_targets_mean": 3562.0, |
| "valid_targets_min": 1451 |
| }, |
| { |
| "epoch": 6.970206264323911, |
| "grad_norm": 0.8168583040167611, |
| "learning_rate": 2.5566462115333978e-09, |
| "loss": 0.4236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27808865904808044, |
| "step": 4565, |
| "valid_targets_mean": 2969.0, |
| "valid_targets_min": 948 |
| }, |
| { |
| "epoch": 6.977845683728036, |
| "grad_norm": 0.7599055862581678, |
| "learning_rate": 1.484143492100909e-09, |
| "loss": 0.3961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16413216292858124, |
| "step": 4570, |
| "valid_targets_mean": 2781.8, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 6.985485103132162, |
| "grad_norm": 0.855562431244123, |
| "learning_rate": 7.014942727145979e-10, |
| "loss": 0.4307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20022156834602356, |
| "step": 4575, |
| "valid_targets_mean": 2384.5, |
| "valid_targets_min": 438 |
| }, |
| { |
| "epoch": 6.993124522536287, |
| "grad_norm": 0.6722570494176869, |
| "learning_rate": 2.0870989689614208e-10, |
| "loss": 0.408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2858823537826538, |
| "step": 4580, |
| "valid_targets_mean": 4627.0, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 7.0, |
| "grad_norm": 1.1970404627629374, |
| "learning_rate": 5.797506938964859e-12, |
| "loss": 0.3911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35643327236175537, |
| "step": 4585, |
| "valid_targets_mean": 2517.8, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35643327236175537, |
| "step": 4585, |
| "total_flos": 1.0328415967578685e+18, |
| "train_loss": 0.4849937954541771, |
| "train_runtime": 33081.3008, |
| "train_samples_per_second": 2.216, |
| "train_steps_per_second": 0.139, |
| "valid_targets_mean": 2517.8, |
| "valid_targets_min": 562 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4585, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1.0328415967578685e+18, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|