| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4410, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.007936507936507936, |
| "grad_norm": 13.936445999727159, |
| "learning_rate": 3.6281179138322e-07, |
| "loss": 0.5831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5446114540100098, |
| "step": 5, |
| "valid_targets_mean": 5181.8, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 0.015873015873015872, |
| "grad_norm": 14.14405406674101, |
| "learning_rate": 8.163265306122449e-07, |
| "loss": 0.6026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6077768802642822, |
| "step": 10, |
| "valid_targets_mean": 5303.6, |
| "valid_targets_min": 948 |
| }, |
| { |
| "epoch": 0.023809523809523808, |
| "grad_norm": 13.385853949153486, |
| "learning_rate": 1.26984126984127e-06, |
| "loss": 0.5824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5799890160560608, |
| "step": 15, |
| "valid_targets_mean": 5301.1, |
| "valid_targets_min": 1000 |
| }, |
| { |
| "epoch": 0.031746031746031744, |
| "grad_norm": 10.791756912090966, |
| "learning_rate": 1.723356009070295e-06, |
| "loss": 0.5901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5597653985023499, |
| "step": 20, |
| "valid_targets_mean": 4823.9, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 0.03968253968253968, |
| "grad_norm": 6.581205621105729, |
| "learning_rate": 2.17687074829932e-06, |
| "loss": 0.5323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4685205817222595, |
| "step": 25, |
| "valid_targets_mean": 4813.8, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 0.047619047619047616, |
| "grad_norm": 3.7853786833152236, |
| "learning_rate": 2.6303854875283447e-06, |
| "loss": 0.4573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4164578914642334, |
| "step": 30, |
| "valid_targets_mean": 5283.2, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 0.05555555555555555, |
| "grad_norm": 2.602330607184181, |
| "learning_rate": 3.08390022675737e-06, |
| "loss": 0.423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39225059747695923, |
| "step": 35, |
| "valid_targets_mean": 4700.6, |
| "valid_targets_min": 2390 |
| }, |
| { |
| "epoch": 0.06349206349206349, |
| "grad_norm": 1.4233023861991225, |
| "learning_rate": 3.537414965986395e-06, |
| "loss": 0.3809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35967135429382324, |
| "step": 40, |
| "valid_targets_mean": 5445.3, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 0.07142857142857142, |
| "grad_norm": 1.0170115963512993, |
| "learning_rate": 3.99092970521542e-06, |
| "loss": 0.402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3903147876262665, |
| "step": 45, |
| "valid_targets_mean": 6464.0, |
| "valid_targets_min": 3085 |
| }, |
| { |
| "epoch": 0.07936507936507936, |
| "grad_norm": 0.8370897006461435, |
| "learning_rate": 4.444444444444444e-06, |
| "loss": 0.3794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33025485277175903, |
| "step": 50, |
| "valid_targets_mean": 5718.5, |
| "valid_targets_min": 975 |
| }, |
| { |
| "epoch": 0.0873015873015873, |
| "grad_norm": 0.7252658896074926, |
| "learning_rate": 4.897959183673469e-06, |
| "loss": 0.3611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34258341789245605, |
| "step": 55, |
| "valid_targets_mean": 5999.1, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 0.09523809523809523, |
| "grad_norm": 0.756722250222215, |
| "learning_rate": 5.3514739229024945e-06, |
| "loss": 0.3478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3988223075866699, |
| "step": 60, |
| "valid_targets_mean": 4506.9, |
| "valid_targets_min": 290 |
| }, |
| { |
| "epoch": 0.10317460317460317, |
| "grad_norm": 0.568685223882473, |
| "learning_rate": 5.80498866213152e-06, |
| "loss": 0.3448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3268760144710541, |
| "step": 65, |
| "valid_targets_mean": 6105.9, |
| "valid_targets_min": 2717 |
| }, |
| { |
| "epoch": 0.1111111111111111, |
| "grad_norm": 0.5731290626935265, |
| "learning_rate": 6.258503401360545e-06, |
| "loss": 0.3215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3184238374233246, |
| "step": 70, |
| "valid_targets_mean": 5088.2, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 0.11904761904761904, |
| "grad_norm": 0.5739988755146004, |
| "learning_rate": 6.71201814058957e-06, |
| "loss": 0.3124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34080153703689575, |
| "step": 75, |
| "valid_targets_mean": 5674.6, |
| "valid_targets_min": 1923 |
| }, |
| { |
| "epoch": 0.12698412698412698, |
| "grad_norm": 0.5021784940463249, |
| "learning_rate": 7.165532879818595e-06, |
| "loss": 0.3008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3233030438423157, |
| "step": 80, |
| "valid_targets_mean": 5277.2, |
| "valid_targets_min": 291 |
| }, |
| { |
| "epoch": 0.1349206349206349, |
| "grad_norm": 0.5521401363464609, |
| "learning_rate": 7.61904761904762e-06, |
| "loss": 0.3086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2872031331062317, |
| "step": 85, |
| "valid_targets_mean": 5470.0, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 0.14285714285714285, |
| "grad_norm": 0.4751497127812398, |
| "learning_rate": 8.072562358276645e-06, |
| "loss": 0.3222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3212955594062805, |
| "step": 90, |
| "valid_targets_mean": 6301.1, |
| "valid_targets_min": 2854 |
| }, |
| { |
| "epoch": 0.15079365079365079, |
| "grad_norm": 0.43696107468178264, |
| "learning_rate": 8.52607709750567e-06, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2621079683303833, |
| "step": 95, |
| "valid_targets_mean": 5617.8, |
| "valid_targets_min": 266 |
| }, |
| { |
| "epoch": 0.15873015873015872, |
| "grad_norm": 0.5242468737414164, |
| "learning_rate": 8.979591836734695e-06, |
| "loss": 0.3018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3428232669830322, |
| "step": 100, |
| "valid_targets_mean": 5715.6, |
| "valid_targets_min": 2266 |
| }, |
| { |
| "epoch": 0.16666666666666666, |
| "grad_norm": 0.4723266645052996, |
| "learning_rate": 9.43310657596372e-06, |
| "loss": 0.2767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27712035179138184, |
| "step": 105, |
| "valid_targets_mean": 5371.8, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 0.1746031746031746, |
| "grad_norm": 0.49793096409078624, |
| "learning_rate": 9.886621315192746e-06, |
| "loss": 0.2986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2675686478614807, |
| "step": 110, |
| "valid_targets_mean": 4750.8, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 0.18253968253968253, |
| "grad_norm": 0.4902776042402625, |
| "learning_rate": 1.034013605442177e-05, |
| "loss": 0.2876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30433300137519836, |
| "step": 115, |
| "valid_targets_mean": 5146.1, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 0.19047619047619047, |
| "grad_norm": 0.465412157163947, |
| "learning_rate": 1.0793650793650794e-05, |
| "loss": 0.2969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2920241057872772, |
| "step": 120, |
| "valid_targets_mean": 5453.2, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 0.1984126984126984, |
| "grad_norm": 0.4355039639514751, |
| "learning_rate": 1.124716553287982e-05, |
| "loss": 0.2503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2529776692390442, |
| "step": 125, |
| "valid_targets_mean": 5727.6, |
| "valid_targets_min": 2696 |
| }, |
| { |
| "epoch": 0.20634920634920634, |
| "grad_norm": 0.4996682572655225, |
| "learning_rate": 1.1700680272108845e-05, |
| "loss": 0.2826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2821199297904968, |
| "step": 130, |
| "valid_targets_mean": 5396.6, |
| "valid_targets_min": 2020 |
| }, |
| { |
| "epoch": 0.21428571428571427, |
| "grad_norm": 0.43094951290178424, |
| "learning_rate": 1.215419501133787e-05, |
| "loss": 0.2583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24614138901233673, |
| "step": 135, |
| "valid_targets_mean": 5842.7, |
| "valid_targets_min": 286 |
| }, |
| { |
| "epoch": 0.2222222222222222, |
| "grad_norm": 0.47723431745558176, |
| "learning_rate": 1.2607709750566895e-05, |
| "loss": 0.2845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2890702486038208, |
| "step": 140, |
| "valid_targets_mean": 5354.1, |
| "valid_targets_min": 2307 |
| }, |
| { |
| "epoch": 0.23015873015873015, |
| "grad_norm": 0.4617350150011481, |
| "learning_rate": 1.3061224489795918e-05, |
| "loss": 0.2586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2510530948638916, |
| "step": 145, |
| "valid_targets_mean": 5552.1, |
| "valid_targets_min": 608 |
| }, |
| { |
| "epoch": 0.23809523809523808, |
| "grad_norm": 0.45824070397194494, |
| "learning_rate": 1.3514739229024945e-05, |
| "loss": 0.2652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26986801624298096, |
| "step": 150, |
| "valid_targets_mean": 5441.2, |
| "valid_targets_min": 1175 |
| }, |
| { |
| "epoch": 0.24603174603174602, |
| "grad_norm": 0.4392573652714541, |
| "learning_rate": 1.3968253968253968e-05, |
| "loss": 0.2548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2496776133775711, |
| "step": 155, |
| "valid_targets_mean": 5731.4, |
| "valid_targets_min": 1393 |
| }, |
| { |
| "epoch": 0.25396825396825395, |
| "grad_norm": 0.4536964041682826, |
| "learning_rate": 1.4421768707482994e-05, |
| "loss": 0.2374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21673960983753204, |
| "step": 160, |
| "valid_targets_mean": 6079.4, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 0.2619047619047619, |
| "grad_norm": 0.5619742860376928, |
| "learning_rate": 1.4875283446712018e-05, |
| "loss": 0.2578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2804248631000519, |
| "step": 165, |
| "valid_targets_mean": 5392.2, |
| "valid_targets_min": 2214 |
| }, |
| { |
| "epoch": 0.2698412698412698, |
| "grad_norm": 0.4588222248723898, |
| "learning_rate": 1.5328798185941044e-05, |
| "loss": 0.2643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24595819413661957, |
| "step": 170, |
| "valid_targets_mean": 5367.2, |
| "valid_targets_min": 1806 |
| }, |
| { |
| "epoch": 0.2777777777777778, |
| "grad_norm": 0.4837210875448078, |
| "learning_rate": 1.578231292517007e-05, |
| "loss": 0.2465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26808232069015503, |
| "step": 175, |
| "valid_targets_mean": 4694.2, |
| "valid_targets_min": 1970 |
| }, |
| { |
| "epoch": 0.2857142857142857, |
| "grad_norm": 0.4642135470304616, |
| "learning_rate": 1.6235827664399097e-05, |
| "loss": 0.2568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25557032227516174, |
| "step": 180, |
| "valid_targets_mean": 5724.9, |
| "valid_targets_min": 1981 |
| }, |
| { |
| "epoch": 0.29365079365079366, |
| "grad_norm": 0.4404678599566564, |
| "learning_rate": 1.668934240362812e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2403090000152588, |
| "step": 185, |
| "valid_targets_mean": 5580.2, |
| "valid_targets_min": 1807 |
| }, |
| { |
| "epoch": 0.30158730158730157, |
| "grad_norm": 0.461513428421082, |
| "learning_rate": 1.7142857142857142e-05, |
| "loss": 0.2717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2342744767665863, |
| "step": 190, |
| "valid_targets_mean": 5209.1, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 0.30952380952380953, |
| "grad_norm": 0.4616028237565255, |
| "learning_rate": 1.759637188208617e-05, |
| "loss": 0.2573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2381066232919693, |
| "step": 195, |
| "valid_targets_mean": 4881.2, |
| "valid_targets_min": 1007 |
| }, |
| { |
| "epoch": 0.31746031746031744, |
| "grad_norm": 0.5048131717477712, |
| "learning_rate": 1.8049886621315194e-05, |
| "loss": 0.2497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24961230158805847, |
| "step": 200, |
| "valid_targets_mean": 4766.8, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 0.3253968253968254, |
| "grad_norm": 0.4608218526938904, |
| "learning_rate": 1.8503401360544218e-05, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22085292637348175, |
| "step": 205, |
| "valid_targets_mean": 5626.6, |
| "valid_targets_min": 311 |
| }, |
| { |
| "epoch": 0.3333333333333333, |
| "grad_norm": 0.5276409706041367, |
| "learning_rate": 1.8956916099773243e-05, |
| "loss": 0.2558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2512398362159729, |
| "step": 210, |
| "valid_targets_mean": 5207.8, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 0.3412698412698413, |
| "grad_norm": 0.44125944724862465, |
| "learning_rate": 1.941043083900227e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23039595782756805, |
| "step": 215, |
| "valid_targets_mean": 6150.5, |
| "valid_targets_min": 2819 |
| }, |
| { |
| "epoch": 0.3492063492063492, |
| "grad_norm": 0.8225576873165226, |
| "learning_rate": 1.9863945578231295e-05, |
| "loss": 0.2654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2745077311992645, |
| "step": 220, |
| "valid_targets_mean": 4586.4, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 0.35714285714285715, |
| "grad_norm": 0.44559302418983976, |
| "learning_rate": 2.031746031746032e-05, |
| "loss": 0.2447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27263548970222473, |
| "step": 225, |
| "valid_targets_mean": 5901.4, |
| "valid_targets_min": 1813 |
| }, |
| { |
| "epoch": 0.36507936507936506, |
| "grad_norm": 0.4702793229346846, |
| "learning_rate": 2.0770975056689343e-05, |
| "loss": 0.2457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2387492060661316, |
| "step": 230, |
| "valid_targets_mean": 5740.0, |
| "valid_targets_min": 1593 |
| }, |
| { |
| "epoch": 0.373015873015873, |
| "grad_norm": 0.5771251589812603, |
| "learning_rate": 2.122448979591837e-05, |
| "loss": 0.2577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27772706747055054, |
| "step": 235, |
| "valid_targets_mean": 5892.1, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 0.38095238095238093, |
| "grad_norm": 0.4716600277551803, |
| "learning_rate": 2.1678004535147395e-05, |
| "loss": 0.2366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24430419504642487, |
| "step": 240, |
| "valid_targets_mean": 5370.8, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 0.3888888888888889, |
| "grad_norm": 0.4834321959641482, |
| "learning_rate": 2.213151927437642e-05, |
| "loss": 0.2335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2554604709148407, |
| "step": 245, |
| "valid_targets_mean": 5334.6, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 0.3968253968253968, |
| "grad_norm": 0.4468651198346908, |
| "learning_rate": 2.2585034013605444e-05, |
| "loss": 0.2326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22178535163402557, |
| "step": 250, |
| "valid_targets_mean": 5966.1, |
| "valid_targets_min": 1724 |
| }, |
| { |
| "epoch": 0.40476190476190477, |
| "grad_norm": 0.4750302614876995, |
| "learning_rate": 2.3038548752834472e-05, |
| "loss": 0.2402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26613864302635193, |
| "step": 255, |
| "valid_targets_mean": 5677.9, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 0.4126984126984127, |
| "grad_norm": 0.4468674852795431, |
| "learning_rate": 2.3492063492063496e-05, |
| "loss": 0.2425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2535470724105835, |
| "step": 260, |
| "valid_targets_mean": 5571.2, |
| "valid_targets_min": 3116 |
| }, |
| { |
| "epoch": 0.42063492063492064, |
| "grad_norm": 0.4435957536640986, |
| "learning_rate": 2.394557823129252e-05, |
| "loss": 0.2403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24253222346305847, |
| "step": 265, |
| "valid_targets_mean": 5520.6, |
| "valid_targets_min": 2481 |
| }, |
| { |
| "epoch": 0.42857142857142855, |
| "grad_norm": 0.48192905697263166, |
| "learning_rate": 2.439909297052154e-05, |
| "loss": 0.2405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22654183208942413, |
| "step": 270, |
| "valid_targets_mean": 5040.6, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 0.4365079365079365, |
| "grad_norm": 0.4654909902022295, |
| "learning_rate": 2.4852607709750566e-05, |
| "loss": 0.2397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22321158647537231, |
| "step": 275, |
| "valid_targets_mean": 4938.6, |
| "valid_targets_min": 554 |
| }, |
| { |
| "epoch": 0.4444444444444444, |
| "grad_norm": 0.47136311558318184, |
| "learning_rate": 2.5306122448979597e-05, |
| "loss": 0.256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25398164987564087, |
| "step": 280, |
| "valid_targets_mean": 5719.1, |
| "valid_targets_min": 1427 |
| }, |
| { |
| "epoch": 0.4523809523809524, |
| "grad_norm": 0.5143544056685512, |
| "learning_rate": 2.5759637188208618e-05, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28001242876052856, |
| "step": 285, |
| "valid_targets_mean": 4379.2, |
| "valid_targets_min": 275 |
| }, |
| { |
| "epoch": 0.4603174603174603, |
| "grad_norm": 0.40992433170257936, |
| "learning_rate": 2.6213151927437642e-05, |
| "loss": 0.2107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19944259524345398, |
| "step": 290, |
| "valid_targets_mean": 6113.2, |
| "valid_targets_min": 1496 |
| }, |
| { |
| "epoch": 0.46825396825396826, |
| "grad_norm": 0.7108778765163672, |
| "learning_rate": 2.6666666666666667e-05, |
| "loss": 0.2316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2676636576652527, |
| "step": 295, |
| "valid_targets_mean": 4878.0, |
| "valid_targets_min": 1397 |
| }, |
| { |
| "epoch": 0.47619047619047616, |
| "grad_norm": 0.7424501325702221, |
| "learning_rate": 2.7120181405895694e-05, |
| "loss": 0.2345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27534204721450806, |
| "step": 300, |
| "valid_targets_mean": 4737.1, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 0.48412698412698413, |
| "grad_norm": 0.4554032952042926, |
| "learning_rate": 2.757369614512472e-05, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23061871528625488, |
| "step": 305, |
| "valid_targets_mean": 5816.9, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 0.49206349206349204, |
| "grad_norm": 0.43918142641279273, |
| "learning_rate": 2.8027210884353743e-05, |
| "loss": 0.246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2266923487186432, |
| "step": 310, |
| "valid_targets_mean": 5512.4, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 0.5, |
| "grad_norm": 0.46398515425879433, |
| "learning_rate": 2.8480725623582767e-05, |
| "loss": 0.2234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21582689881324768, |
| "step": 315, |
| "valid_targets_mean": 5874.5, |
| "valid_targets_min": 1816 |
| }, |
| { |
| "epoch": 0.5079365079365079, |
| "grad_norm": 0.4043326688329922, |
| "learning_rate": 2.893424036281179e-05, |
| "loss": 0.2239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21339790523052216, |
| "step": 320, |
| "valid_targets_mean": 5820.1, |
| "valid_targets_min": 282 |
| }, |
| { |
| "epoch": 0.5158730158730159, |
| "grad_norm": 0.502316882086023, |
| "learning_rate": 2.938775510204082e-05, |
| "loss": 0.2237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20219871401786804, |
| "step": 325, |
| "valid_targets_mean": 5578.6, |
| "valid_targets_min": 1540 |
| }, |
| { |
| "epoch": 0.5238095238095238, |
| "grad_norm": 0.9835515697061404, |
| "learning_rate": 2.9841269841269844e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2298191487789154, |
| "step": 330, |
| "valid_targets_mean": 4911.0, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 0.5317460317460317, |
| "grad_norm": 0.4647735663644707, |
| "learning_rate": 3.0294784580498868e-05, |
| "loss": 0.2339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22781239449977875, |
| "step": 335, |
| "valid_targets_mean": 5532.8, |
| "valid_targets_min": 1535 |
| }, |
| { |
| "epoch": 0.5396825396825397, |
| "grad_norm": 0.5438389697935898, |
| "learning_rate": 3.074829931972789e-05, |
| "loss": 0.2375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22640562057495117, |
| "step": 340, |
| "valid_targets_mean": 4285.8, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 0.5476190476190477, |
| "grad_norm": 0.4334285919558895, |
| "learning_rate": 3.1201814058956924e-05, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21913409233093262, |
| "step": 345, |
| "valid_targets_mean": 5222.7, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 0.5555555555555556, |
| "grad_norm": 0.4738405937337707, |
| "learning_rate": 3.1655328798185945e-05, |
| "loss": 0.2378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25035279989242554, |
| "step": 350, |
| "valid_targets_mean": 5209.8, |
| "valid_targets_min": 833 |
| }, |
| { |
| "epoch": 0.5634920634920635, |
| "grad_norm": 0.4555272170875938, |
| "learning_rate": 3.2108843537414965e-05, |
| "loss": 0.2223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21295906603336334, |
| "step": 355, |
| "valid_targets_mean": 4887.6, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 0.5714285714285714, |
| "grad_norm": 0.4607956603180466, |
| "learning_rate": 3.256235827664399e-05, |
| "loss": 0.2242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23422232270240784, |
| "step": 360, |
| "valid_targets_mean": 5982.9, |
| "valid_targets_min": 3791 |
| }, |
| { |
| "epoch": 0.5793650793650794, |
| "grad_norm": 0.46019446827222377, |
| "learning_rate": 3.3015873015873014e-05, |
| "loss": 0.234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21903209388256073, |
| "step": 365, |
| "valid_targets_mean": 5330.9, |
| "valid_targets_min": 2257 |
| }, |
| { |
| "epoch": 0.5873015873015873, |
| "grad_norm": 0.6042052076393369, |
| "learning_rate": 3.346938775510204e-05, |
| "loss": 0.2358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2550661861896515, |
| "step": 370, |
| "valid_targets_mean": 4556.8, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 0.5952380952380952, |
| "grad_norm": 0.44853135001478606, |
| "learning_rate": 3.392290249433107e-05, |
| "loss": 0.2178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.202229842543602, |
| "step": 375, |
| "valid_targets_mean": 5618.4, |
| "valid_targets_min": 287 |
| }, |
| { |
| "epoch": 0.6031746031746031, |
| "grad_norm": 0.4114084841092905, |
| "learning_rate": 3.437641723356009e-05, |
| "loss": 0.2336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.208021879196167, |
| "step": 380, |
| "valid_targets_mean": 6323.6, |
| "valid_targets_min": 3070 |
| }, |
| { |
| "epoch": 0.6111111111111112, |
| "grad_norm": 0.4907016504547875, |
| "learning_rate": 3.482993197278912e-05, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2262699007987976, |
| "step": 385, |
| "valid_targets_mean": 5458.8, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 0.6190476190476191, |
| "grad_norm": 0.4470894371245897, |
| "learning_rate": 3.5283446712018146e-05, |
| "loss": 0.2147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2284412682056427, |
| "step": 390, |
| "valid_targets_mean": 5275.5, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 0.626984126984127, |
| "grad_norm": 0.8292394623205982, |
| "learning_rate": 3.573696145124717e-05, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23321247100830078, |
| "step": 395, |
| "valid_targets_mean": 4546.7, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 0.6349206349206349, |
| "grad_norm": 0.5101519952218712, |
| "learning_rate": 3.6190476190476195e-05, |
| "loss": 0.2029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22552572190761566, |
| "step": 400, |
| "valid_targets_mean": 4713.0, |
| "valid_targets_min": 403 |
| }, |
| { |
| "epoch": 0.6428571428571429, |
| "grad_norm": 0.4782175383328679, |
| "learning_rate": 3.6643990929705216e-05, |
| "loss": 0.2336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22066287696361542, |
| "step": 405, |
| "valid_targets_mean": 5557.4, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 0.6507936507936508, |
| "grad_norm": 0.6813010668498629, |
| "learning_rate": 3.7097505668934243e-05, |
| "loss": 0.2304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23460529744625092, |
| "step": 410, |
| "valid_targets_mean": 4301.2, |
| "valid_targets_min": 290 |
| }, |
| { |
| "epoch": 0.6587301587301587, |
| "grad_norm": 0.42762135214795316, |
| "learning_rate": 3.755102040816327e-05, |
| "loss": 0.2218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22290262579917908, |
| "step": 415, |
| "valid_targets_mean": 5696.5, |
| "valid_targets_min": 1242 |
| }, |
| { |
| "epoch": 0.6666666666666666, |
| "grad_norm": 0.7113003892096883, |
| "learning_rate": 3.800453514739229e-05, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24848781526088715, |
| "step": 420, |
| "valid_targets_mean": 5861.1, |
| "valid_targets_min": 1829 |
| }, |
| { |
| "epoch": 0.6746031746031746, |
| "grad_norm": 0.4223786613285171, |
| "learning_rate": 3.845804988662132e-05, |
| "loss": 0.2361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23021358251571655, |
| "step": 425, |
| "valid_targets_mean": 5603.6, |
| "valid_targets_min": 2005 |
| }, |
| { |
| "epoch": 0.6825396825396826, |
| "grad_norm": 0.46482319003042916, |
| "learning_rate": 3.891156462585034e-05, |
| "loss": 0.2369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2257668375968933, |
| "step": 430, |
| "valid_targets_mean": 5665.9, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 0.6904761904761905, |
| "grad_norm": 0.49517195170111594, |
| "learning_rate": 3.936507936507937e-05, |
| "loss": 0.2219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24368128180503845, |
| "step": 435, |
| "valid_targets_mean": 5276.9, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 0.6984126984126984, |
| "grad_norm": 0.4533449896226927, |
| "learning_rate": 3.9818594104308396e-05, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2182699739933014, |
| "step": 440, |
| "valid_targets_mean": 5190.2, |
| "valid_targets_min": 609 |
| }, |
| { |
| "epoch": 0.7063492063492064, |
| "grad_norm": 0.47604972418524916, |
| "learning_rate": 3.999994361288785e-05, |
| "loss": 0.2316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27464592456817627, |
| "step": 445, |
| "valid_targets_mean": 5377.2, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 0.7142857142857143, |
| "grad_norm": 0.4843309348827549, |
| "learning_rate": 3.9999599026131644e-05, |
| "loss": 0.2078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21664546430110931, |
| "step": 450, |
| "valid_targets_mean": 5402.9, |
| "valid_targets_min": 1359 |
| }, |
| { |
| "epoch": 0.7222222222222222, |
| "grad_norm": 0.4382635205661119, |
| "learning_rate": 3.999894118418342e-05, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22355255484580994, |
| "step": 455, |
| "valid_targets_mean": 5052.1, |
| "valid_targets_min": 2069 |
| }, |
| { |
| "epoch": 0.7301587301587301, |
| "grad_norm": 0.472980100407786, |
| "learning_rate": 3.999797009734697e-05, |
| "loss": 0.2286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22827665507793427, |
| "step": 460, |
| "valid_targets_mean": 5404.2, |
| "valid_targets_min": 1744 |
| }, |
| { |
| "epoch": 0.7380952380952381, |
| "grad_norm": 0.43558241143554155, |
| "learning_rate": 3.999668578083253e-05, |
| "loss": 0.2344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22950908541679382, |
| "step": 465, |
| "valid_targets_mean": 5786.8, |
| "valid_targets_min": 688 |
| }, |
| { |
| "epoch": 0.746031746031746, |
| "grad_norm": 0.39301407866116134, |
| "learning_rate": 3.9995088254756434e-05, |
| "loss": 0.2171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20144161581993103, |
| "step": 470, |
| "valid_targets_mean": 6067.9, |
| "valid_targets_min": 3477 |
| }, |
| { |
| "epoch": 0.753968253968254, |
| "grad_norm": 0.4335866805247727, |
| "learning_rate": 3.999317754414084e-05, |
| "loss": 0.2162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24468550086021423, |
| "step": 475, |
| "valid_targets_mean": 5383.6, |
| "valid_targets_min": 297 |
| }, |
| { |
| "epoch": 0.7619047619047619, |
| "grad_norm": 0.43530076929025974, |
| "learning_rate": 3.999095367891337e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2087598741054535, |
| "step": 480, |
| "valid_targets_mean": 5412.7, |
| "valid_targets_min": 241 |
| }, |
| { |
| "epoch": 0.7698412698412699, |
| "grad_norm": 0.42581385510950404, |
| "learning_rate": 3.9988416693906563e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20418357849121094, |
| "step": 485, |
| "valid_targets_mean": 5400.4, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 0.7777777777777778, |
| "grad_norm": 0.6201401443531581, |
| "learning_rate": 3.9985566628857425e-05, |
| "loss": 0.2286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22904717922210693, |
| "step": 490, |
| "valid_targets_mean": 5283.9, |
| "valid_targets_min": 1641 |
| }, |
| { |
| "epoch": 0.7857142857142857, |
| "grad_norm": 0.40573600003328514, |
| "learning_rate": 3.998240352840672e-05, |
| "loss": 0.2369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19750481843948364, |
| "step": 495, |
| "valid_targets_mean": 5820.5, |
| "valid_targets_min": 2527 |
| }, |
| { |
| "epoch": 0.7936507936507936, |
| "grad_norm": 0.6282176812699868, |
| "learning_rate": 3.997892744209833e-05, |
| "loss": 0.2157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21052823960781097, |
| "step": 500, |
| "valid_targets_mean": 3286.4, |
| "valid_targets_min": 284 |
| }, |
| { |
| "epoch": 0.8015873015873016, |
| "grad_norm": 0.4150664416041001, |
| "learning_rate": 3.997513842437845e-05, |
| "loss": 0.2168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20114190876483917, |
| "step": 505, |
| "valid_targets_mean": 6746.6, |
| "valid_targets_min": 3503 |
| }, |
| { |
| "epoch": 0.8095238095238095, |
| "grad_norm": 0.5580131451084269, |
| "learning_rate": 3.997103653459475e-05, |
| "loss": 0.2255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21351292729377747, |
| "step": 510, |
| "valid_targets_mean": 5427.2, |
| "valid_targets_min": 1310 |
| }, |
| { |
| "epoch": 0.8174603174603174, |
| "grad_norm": 0.4539249289508295, |
| "learning_rate": 3.996662183699541e-05, |
| "loss": 0.2029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22894957661628723, |
| "step": 515, |
| "valid_targets_mean": 6587.3, |
| "valid_targets_min": 2987 |
| }, |
| { |
| "epoch": 0.8253968253968254, |
| "grad_norm": 0.4606135797915741, |
| "learning_rate": 3.996189440072818e-05, |
| "loss": 0.2235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23994050920009613, |
| "step": 520, |
| "valid_targets_mean": 5603.4, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 0.8333333333333334, |
| "grad_norm": 0.46485471964434133, |
| "learning_rate": 3.9956854299839246e-05, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24385607242584229, |
| "step": 525, |
| "valid_targets_mean": 5554.9, |
| "valid_targets_min": 1998 |
| }, |
| { |
| "epoch": 0.8412698412698413, |
| "grad_norm": 0.5070540327503203, |
| "learning_rate": 3.9951501613272076e-05, |
| "loss": 0.2238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2311379760503769, |
| "step": 530, |
| "valid_targets_mean": 5792.5, |
| "valid_targets_min": 2950 |
| }, |
| { |
| "epoch": 0.8492063492063492, |
| "grad_norm": 0.4509301237412979, |
| "learning_rate": 3.994583642486618e-05, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22014960646629333, |
| "step": 535, |
| "valid_targets_mean": 5551.4, |
| "valid_targets_min": 2454 |
| }, |
| { |
| "epoch": 0.8571428571428571, |
| "grad_norm": 0.37450581843880576, |
| "learning_rate": 3.993985882335584e-05, |
| "loss": 0.2102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17562690377235413, |
| "step": 540, |
| "valid_targets_mean": 6399.9, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 0.8650793650793651, |
| "grad_norm": 0.4181520509392521, |
| "learning_rate": 3.993356890236866e-05, |
| "loss": 0.2178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1997915804386139, |
| "step": 545, |
| "valid_targets_mean": 5282.3, |
| "valid_targets_min": 307 |
| }, |
| { |
| "epoch": 0.873015873015873, |
| "grad_norm": 0.40651126602493426, |
| "learning_rate": 3.992696676042414e-05, |
| "loss": 0.2135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20215590298175812, |
| "step": 550, |
| "valid_targets_mean": 6478.2, |
| "valid_targets_min": 1253 |
| }, |
| { |
| "epoch": 0.8809523809523809, |
| "grad_norm": 0.42510576646915893, |
| "learning_rate": 3.992005250093211e-05, |
| "loss": 0.2162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20907750725746155, |
| "step": 555, |
| "valid_targets_mean": 5629.7, |
| "valid_targets_min": 1539 |
| }, |
| { |
| "epoch": 0.8888888888888888, |
| "grad_norm": 0.4812454511222598, |
| "learning_rate": 3.991282623219113e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22547686100006104, |
| "step": 560, |
| "valid_targets_mean": 4727.8, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 0.8968253968253969, |
| "grad_norm": 0.4203217407948123, |
| "learning_rate": 3.9905288067386776e-05, |
| "loss": 0.2062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21304470300674438, |
| "step": 565, |
| "valid_targets_mean": 5743.1, |
| "valid_targets_min": 2659 |
| }, |
| { |
| "epoch": 0.9047619047619048, |
| "grad_norm": 0.5536262458911827, |
| "learning_rate": 3.989743812458987e-05, |
| "loss": 0.2175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22015127539634705, |
| "step": 570, |
| "valid_targets_mean": 5742.7, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 0.9126984126984127, |
| "grad_norm": 0.44923723778131375, |
| "learning_rate": 3.9889276526754664e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2490832507610321, |
| "step": 575, |
| "valid_targets_mean": 5566.1, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 0.9206349206349206, |
| "grad_norm": 0.4833832932237736, |
| "learning_rate": 3.988080340171685e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2266359031200409, |
| "step": 580, |
| "valid_targets_mean": 4794.4, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 0.9285714285714286, |
| "grad_norm": 0.5314150951022422, |
| "learning_rate": 3.987201888219161e-05, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23443414270877838, |
| "step": 585, |
| "valid_targets_mean": 3981.2, |
| "valid_targets_min": 577 |
| }, |
| { |
| "epoch": 0.9365079365079365, |
| "grad_norm": 0.44573566583926183, |
| "learning_rate": 3.986292310577153e-05, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1997448205947876, |
| "step": 590, |
| "valid_targets_mean": 5087.9, |
| "valid_targets_min": 256 |
| }, |
| { |
| "epoch": 0.9444444444444444, |
| "grad_norm": 0.4823118351901083, |
| "learning_rate": 3.9853516214924416e-05, |
| "loss": 0.2362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21190452575683594, |
| "step": 595, |
| "valid_targets_mean": 4769.4, |
| "valid_targets_min": 1789 |
| }, |
| { |
| "epoch": 0.9523809523809523, |
| "grad_norm": 0.9701252803781317, |
| "learning_rate": 3.9843798356991096e-05, |
| "loss": 0.2033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21730470657348633, |
| "step": 600, |
| "valid_targets_mean": 5590.2, |
| "valid_targets_min": 871 |
| }, |
| { |
| "epoch": 0.9603174603174603, |
| "grad_norm": 0.8528374645310175, |
| "learning_rate": 3.9833769684183104e-05, |
| "loss": 0.2378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25169217586517334, |
| "step": 605, |
| "valid_targets_mean": 5481.6, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 0.9682539682539683, |
| "grad_norm": 0.5719512687258413, |
| "learning_rate": 3.982343035358026e-05, |
| "loss": 0.2426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25562554597854614, |
| "step": 610, |
| "valid_targets_mean": 4258.5, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 0.9761904761904762, |
| "grad_norm": 0.42417870906303506, |
| "learning_rate": 3.981278052712827e-05, |
| "loss": 0.2186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19715425372123718, |
| "step": 615, |
| "valid_targets_mean": 6383.4, |
| "valid_targets_min": 2557 |
| }, |
| { |
| "epoch": 0.9841269841269841, |
| "grad_norm": 0.5592731470756656, |
| "learning_rate": 3.9801820371636157e-05, |
| "loss": 0.2205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21826912462711334, |
| "step": 620, |
| "valid_targets_mean": 5242.9, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 0.9920634920634921, |
| "grad_norm": 0.45536035098972394, |
| "learning_rate": 3.979055005877364e-05, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23044517636299133, |
| "step": 625, |
| "valid_targets_mean": 6434.3, |
| "valid_targets_min": 1909 |
| }, |
| { |
| "epoch": 1.0, |
| "grad_norm": 0.45688834618759994, |
| "learning_rate": 3.977896976506845e-05, |
| "loss": 0.2262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20650140941143036, |
| "step": 630, |
| "valid_targets_mean": 4983.3, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 1.007936507936508, |
| "grad_norm": 0.45783302985716545, |
| "learning_rate": 3.976707967190358e-05, |
| "loss": 0.2009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1878741830587387, |
| "step": 635, |
| "valid_targets_mean": 6036.8, |
| "valid_targets_min": 1419 |
| }, |
| { |
| "epoch": 1.0158730158730158, |
| "grad_norm": 0.3696615133926402, |
| "learning_rate": 3.9754879965514456e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17767128348350525, |
| "step": 640, |
| "valid_targets_mean": 6949.4, |
| "valid_targets_min": 1382 |
| }, |
| { |
| "epoch": 1.0238095238095237, |
| "grad_norm": 0.5301335563601449, |
| "learning_rate": 3.9742370836985956e-05, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18509696424007416, |
| "step": 645, |
| "valid_targets_mean": 5665.9, |
| "valid_targets_min": 3373 |
| }, |
| { |
| "epoch": 1.0317460317460316, |
| "grad_norm": 0.45339150425457114, |
| "learning_rate": 3.972955248224949e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19851231575012207, |
| "step": 650, |
| "valid_targets_mean": 5496.2, |
| "valid_targets_min": 1700 |
| }, |
| { |
| "epoch": 1.0396825396825398, |
| "grad_norm": 0.4563819518280238, |
| "learning_rate": 3.971642510207989e-05, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20360763370990753, |
| "step": 655, |
| "valid_targets_mean": 5350.4, |
| "valid_targets_min": 333 |
| }, |
| { |
| "epoch": 1.0476190476190477, |
| "grad_norm": 0.5625847542647227, |
| "learning_rate": 3.9702988902092274e-05, |
| "loss": 0.2, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1898064911365509, |
| "step": 660, |
| "valid_targets_mean": 5748.2, |
| "valid_targets_min": 1540 |
| }, |
| { |
| "epoch": 1.0555555555555556, |
| "grad_norm": 0.425299703122137, |
| "learning_rate": 3.968924409273884e-05, |
| "loss": 0.2059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19356761872768402, |
| "step": 665, |
| "valid_targets_mean": 5209.3, |
| "valid_targets_min": 1985 |
| }, |
| { |
| "epoch": 1.0634920634920635, |
| "grad_norm": 0.47286769247229504, |
| "learning_rate": 3.9675190889305545e-05, |
| "loss": 0.2005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1817602813243866, |
| "step": 670, |
| "valid_targets_mean": 5672.6, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 1.0714285714285714, |
| "grad_norm": 0.432773210737844, |
| "learning_rate": 3.966082951190874e-05, |
| "loss": 0.1861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2104063630104065, |
| "step": 675, |
| "valid_targets_mean": 6248.0, |
| "valid_targets_min": 1230 |
| }, |
| { |
| "epoch": 1.0793650793650793, |
| "grad_norm": 0.4706439453673335, |
| "learning_rate": 3.9646160185491756e-05, |
| "loss": 0.201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18827101588249207, |
| "step": 680, |
| "valid_targets_mean": 4876.6, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 1.0873015873015872, |
| "grad_norm": 0.5338851223858002, |
| "learning_rate": 3.963118313982131e-05, |
| "loss": 0.1941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18436592817306519, |
| "step": 685, |
| "valid_targets_mean": 4361.0, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 1.0952380952380953, |
| "grad_norm": 0.41520798715060503, |
| "learning_rate": 3.961589860948399e-05, |
| "loss": 0.1961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21202310919761658, |
| "step": 690, |
| "valid_targets_mean": 5486.4, |
| "valid_targets_min": 1888 |
| }, |
| { |
| "epoch": 1.1031746031746033, |
| "grad_norm": 0.42676794941537016, |
| "learning_rate": 3.960030683388251e-05, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17921066284179688, |
| "step": 695, |
| "valid_targets_mean": 5590.2, |
| "valid_targets_min": 217 |
| }, |
| { |
| "epoch": 1.1111111111111112, |
| "grad_norm": 0.40164984647020757, |
| "learning_rate": 3.9584408057232e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17369890213012695, |
| "step": 700, |
| "valid_targets_mean": 5022.5, |
| "valid_targets_min": 268 |
| }, |
| { |
| "epoch": 1.119047619047619, |
| "grad_norm": 0.4557865055131249, |
| "learning_rate": 3.956820252855618e-05, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21178218722343445, |
| "step": 705, |
| "valid_targets_mean": 5212.6, |
| "valid_targets_min": 1650 |
| }, |
| { |
| "epoch": 1.126984126984127, |
| "grad_norm": 0.4737440529809228, |
| "learning_rate": 3.955169050168343e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18235670030117035, |
| "step": 710, |
| "valid_targets_mean": 4897.6, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 1.1349206349206349, |
| "grad_norm": 0.36301667189206566, |
| "learning_rate": 3.953487223524283e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15816360712051392, |
| "step": 715, |
| "valid_targets_mean": 6158.5, |
| "valid_targets_min": 2000 |
| }, |
| { |
| "epoch": 1.1428571428571428, |
| "grad_norm": 0.4512962324237001, |
| "learning_rate": 3.951774799266014e-05, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1824280321598053, |
| "step": 720, |
| "valid_targets_mean": 5561.8, |
| "valid_targets_min": 2560 |
| }, |
| { |
| "epoch": 1.1507936507936507, |
| "grad_norm": 0.4511979075727613, |
| "learning_rate": 3.950031804215364e-05, |
| "loss": 0.1984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2006044089794159, |
| "step": 725, |
| "valid_targets_mean": 5573.5, |
| "valid_targets_min": 1633 |
| }, |
| { |
| "epoch": 1.1587301587301586, |
| "grad_norm": 0.42676374430180725, |
| "learning_rate": 3.948258265672991e-05, |
| "loss": 0.2072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21262499690055847, |
| "step": 730, |
| "valid_targets_mean": 5894.2, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 1.1666666666666667, |
| "grad_norm": 0.669542399200941, |
| "learning_rate": 3.946454211417961e-05, |
| "loss": 0.1946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20334014296531677, |
| "step": 735, |
| "valid_targets_mean": 5074.4, |
| "valid_targets_min": 690 |
| }, |
| { |
| "epoch": 1.1746031746031746, |
| "grad_norm": 0.45162646285557456, |
| "learning_rate": 3.944619669707309e-05, |
| "loss": 0.2193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.215205579996109, |
| "step": 740, |
| "valid_targets_mean": 5439.4, |
| "valid_targets_min": 1907 |
| }, |
| { |
| "epoch": 1.1825396825396826, |
| "grad_norm": 0.4710256071640483, |
| "learning_rate": 3.9427546692755946e-05, |
| "loss": 0.2082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21397551894187927, |
| "step": 745, |
| "valid_targets_mean": 5276.3, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 1.1904761904761905, |
| "grad_norm": 0.4625751950531012, |
| "learning_rate": 3.9408592393344596e-05, |
| "loss": 0.2041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19521868228912354, |
| "step": 750, |
| "valid_targets_mean": 5905.4, |
| "valid_targets_min": 2861 |
| }, |
| { |
| "epoch": 1.1984126984126984, |
| "grad_norm": 0.4677554812825755, |
| "learning_rate": 3.9389334095721606e-05, |
| "loss": 0.2025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21653307974338531, |
| "step": 755, |
| "valid_targets_mean": 4797.6, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 1.2063492063492063, |
| "grad_norm": 0.546242046347798, |
| "learning_rate": 3.936977210153113e-05, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20400574803352356, |
| "step": 760, |
| "valid_targets_mean": 5519.1, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 1.2142857142857142, |
| "grad_norm": 0.4204392123363325, |
| "learning_rate": 3.93499067171741e-05, |
| "loss": 0.2077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22943107783794403, |
| "step": 765, |
| "valid_targets_mean": 6420.3, |
| "valid_targets_min": 1329 |
| }, |
| { |
| "epoch": 1.2222222222222223, |
| "grad_norm": 0.4682155865822684, |
| "learning_rate": 3.932973825380351e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22972063720226288, |
| "step": 770, |
| "valid_targets_mean": 4946.4, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 1.2301587301587302, |
| "grad_norm": 0.5301139897940557, |
| "learning_rate": 3.9309267027319485e-05, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23306161165237427, |
| "step": 775, |
| "valid_targets_mean": 3961.6, |
| "valid_targets_min": 222 |
| }, |
| { |
| "epoch": 1.2380952380952381, |
| "grad_norm": 0.40365821128282314, |
| "learning_rate": 3.928849335836435e-05, |
| "loss": 0.1902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18574738502502441, |
| "step": 780, |
| "valid_targets_mean": 5806.0, |
| "valid_targets_min": 2320 |
| }, |
| { |
| "epoch": 1.246031746031746, |
| "grad_norm": 0.47813886067964756, |
| "learning_rate": 3.926741757231761e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21044926345348358, |
| "step": 785, |
| "valid_targets_mean": 5299.6, |
| "valid_targets_min": 1723 |
| }, |
| { |
| "epoch": 1.253968253968254, |
| "grad_norm": 0.40253903041192324, |
| "learning_rate": 3.924603999929086e-05, |
| "loss": 0.2169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2096974402666092, |
| "step": 790, |
| "valid_targets_mean": 5558.8, |
| "valid_targets_min": 543 |
| }, |
| { |
| "epoch": 1.2619047619047619, |
| "grad_norm": 0.4549298029596003, |
| "learning_rate": 3.9224360974122584e-05, |
| "loss": 0.2109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23242492973804474, |
| "step": 795, |
| "valid_targets_mean": 5270.6, |
| "valid_targets_min": 2212 |
| }, |
| { |
| "epoch": 1.2698412698412698, |
| "grad_norm": 0.4695471820608219, |
| "learning_rate": 3.920238083637297e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20831601321697235, |
| "step": 800, |
| "valid_targets_mean": 5308.8, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 1.2777777777777777, |
| "grad_norm": 0.7642610362979803, |
| "learning_rate": 3.9180099930318524e-05, |
| "loss": 0.2037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1991654336452484, |
| "step": 805, |
| "valid_targets_mean": 6815.1, |
| "valid_targets_min": 1462 |
| }, |
| { |
| "epoch": 1.2857142857142856, |
| "grad_norm": 0.4440164128697404, |
| "learning_rate": 3.915751860494672e-05, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16493773460388184, |
| "step": 810, |
| "valid_targets_mean": 5028.6, |
| "valid_targets_min": 397 |
| }, |
| { |
| "epoch": 1.2936507936507937, |
| "grad_norm": 0.43322694583144405, |
| "learning_rate": 3.913463721395051e-05, |
| "loss": 0.2092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1892578899860382, |
| "step": 815, |
| "valid_targets_mean": 4793.7, |
| "valid_targets_min": 343 |
| }, |
| { |
| "epoch": 1.3015873015873016, |
| "grad_norm": 0.4113857371999088, |
| "learning_rate": 3.911145611572282e-05, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22850877046585083, |
| "step": 820, |
| "valid_targets_mean": 6205.9, |
| "valid_targets_min": 3119 |
| }, |
| { |
| "epoch": 1.3095238095238095, |
| "grad_norm": 0.4024454753442706, |
| "learning_rate": 3.908797567335089e-05, |
| "loss": 0.2043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1995319277048111, |
| "step": 825, |
| "valid_targets_mean": 6545.4, |
| "valid_targets_min": 2059 |
| }, |
| { |
| "epoch": 1.3174603174603174, |
| "grad_norm": 0.4766793634475361, |
| "learning_rate": 3.906419625461062e-05, |
| "loss": 0.1979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21162061393260956, |
| "step": 830, |
| "valid_targets_mean": 5270.3, |
| "valid_targets_min": 294 |
| }, |
| { |
| "epoch": 1.3253968253968254, |
| "grad_norm": 0.43124302476576, |
| "learning_rate": 3.90401182319608e-05, |
| "loss": 0.2112, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2024182230234146, |
| "step": 835, |
| "valid_targets_mean": 5587.5, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 1.3333333333333333, |
| "grad_norm": 0.37620838473431895, |
| "learning_rate": 3.9015741982537265e-05, |
| "loss": 0.1894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16263701021671295, |
| "step": 840, |
| "valid_targets_mean": 6486.5, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 1.3412698412698414, |
| "grad_norm": 0.4227366879146679, |
| "learning_rate": 3.899106788814701e-05, |
| "loss": 0.2324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19696393609046936, |
| "step": 845, |
| "valid_targets_mean": 5981.3, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 1.3492063492063493, |
| "grad_norm": 0.4396285787879683, |
| "learning_rate": 3.896609633526219e-05, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21186983585357666, |
| "step": 850, |
| "valid_targets_mean": 5076.4, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 1.3571428571428572, |
| "grad_norm": 0.4809038294139755, |
| "learning_rate": 3.894082771501407e-05, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.191837877035141, |
| "step": 855, |
| "valid_targets_mean": 5344.6, |
| "valid_targets_min": 3615 |
| }, |
| { |
| "epoch": 1.3650793650793651, |
| "grad_norm": 0.48473797503352833, |
| "learning_rate": 3.891526242318692e-05, |
| "loss": 0.1953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16904303431510925, |
| "step": 860, |
| "valid_targets_mean": 4677.6, |
| "valid_targets_min": 281 |
| }, |
| { |
| "epoch": 1.373015873015873, |
| "grad_norm": 0.3848141194705589, |
| "learning_rate": 3.8889400860211785e-05, |
| "loss": 0.2045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19609695672988892, |
| "step": 865, |
| "valid_targets_mean": 5797.4, |
| "valid_targets_min": 577 |
| }, |
| { |
| "epoch": 1.380952380952381, |
| "grad_norm": 0.43935568195512203, |
| "learning_rate": 3.886324343116023e-05, |
| "loss": 0.2004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21925979852676392, |
| "step": 870, |
| "valid_targets_mean": 5510.4, |
| "valid_targets_min": 2795 |
| }, |
| { |
| "epoch": 1.3888888888888888, |
| "grad_norm": 0.3787284592232413, |
| "learning_rate": 3.883679054573799e-05, |
| "loss": 0.1925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17324265837669373, |
| "step": 875, |
| "valid_targets_mean": 6371.8, |
| "valid_targets_min": 1851 |
| }, |
| { |
| "epoch": 1.3968253968253967, |
| "grad_norm": 0.48231311291457907, |
| "learning_rate": 3.881004261827856e-05, |
| "loss": 0.2057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22266656160354614, |
| "step": 880, |
| "valid_targets_mean": 5407.8, |
| "valid_targets_min": 247 |
| }, |
| { |
| "epoch": 1.4047619047619047, |
| "grad_norm": 0.39562200883867676, |
| "learning_rate": 3.878300006773669e-05, |
| "loss": 0.1996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19309642910957336, |
| "step": 885, |
| "valid_targets_mean": 6324.1, |
| "valid_targets_min": 3843 |
| }, |
| { |
| "epoch": 1.4126984126984126, |
| "grad_norm": 0.4536286972970636, |
| "learning_rate": 3.875566331768184e-05, |
| "loss": 0.1989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.205659881234169, |
| "step": 890, |
| "valid_targets_mean": 4451.7, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 1.4206349206349207, |
| "grad_norm": 0.40917484623660716, |
| "learning_rate": 3.872803279629155e-05, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21330603957176208, |
| "step": 895, |
| "valid_targets_mean": 5915.2, |
| "valid_targets_min": 2792 |
| }, |
| { |
| "epoch": 1.4285714285714286, |
| "grad_norm": 0.44208512274029477, |
| "learning_rate": 3.8700108936344705e-05, |
| "loss": 0.1981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21972954273223877, |
| "step": 900, |
| "valid_targets_mean": 4555.5, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 1.4365079365079365, |
| "grad_norm": 0.44093255819884136, |
| "learning_rate": 3.867189217521477e-05, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20141087472438812, |
| "step": 905, |
| "valid_targets_mean": 5635.6, |
| "valid_targets_min": 2966 |
| }, |
| { |
| "epoch": 1.4444444444444444, |
| "grad_norm": 0.4623153556330511, |
| "learning_rate": 3.864338295486297e-05, |
| "loss": 0.2042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21589690446853638, |
| "step": 910, |
| "valid_targets_mean": 4678.0, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 1.4523809523809523, |
| "grad_norm": 0.41249982388927653, |
| "learning_rate": 3.8614581721831316e-05, |
| "loss": 0.2027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2026449292898178, |
| "step": 915, |
| "valid_targets_mean": 5216.7, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 1.4603174603174602, |
| "grad_norm": 0.4104480770890901, |
| "learning_rate": 3.858548892723563e-05, |
| "loss": 0.1958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1731051206588745, |
| "step": 920, |
| "valid_targets_mean": 5339.4, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 1.4682539682539684, |
| "grad_norm": 0.41895380180198477, |
| "learning_rate": 3.855610502675851e-05, |
| "loss": 0.1987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2031707614660263, |
| "step": 925, |
| "valid_targets_mean": 5263.9, |
| "valid_targets_min": 1601 |
| }, |
| { |
| "epoch": 1.4761904761904763, |
| "grad_norm": 0.4261994122248901, |
| "learning_rate": 3.852643048064215e-05, |
| "loss": 0.2095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2084016501903534, |
| "step": 930, |
| "valid_targets_mean": 5398.7, |
| "valid_targets_min": 366 |
| }, |
| { |
| "epoch": 1.4841269841269842, |
| "grad_norm": 0.44461914330875957, |
| "learning_rate": 3.8496465753681145e-05, |
| "loss": 0.1898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.203968346118927, |
| "step": 935, |
| "valid_targets_mean": 5705.4, |
| "valid_targets_min": 293 |
| }, |
| { |
| "epoch": 1.492063492063492, |
| "grad_norm": 0.3619697764513735, |
| "learning_rate": 3.846621131521522e-05, |
| "loss": 0.1942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16397273540496826, |
| "step": 940, |
| "valid_targets_mean": 5586.3, |
| "valid_targets_min": 603 |
| }, |
| { |
| "epoch": 1.5, |
| "grad_norm": 0.47927964908668164, |
| "learning_rate": 3.843566763912187e-05, |
| "loss": 0.1938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19876304268836975, |
| "step": 945, |
| "valid_targets_mean": 5481.6, |
| "valid_targets_min": 2470 |
| }, |
| { |
| "epoch": 1.507936507936508, |
| "grad_norm": 0.43177345256816557, |
| "learning_rate": 3.840483520380896e-05, |
| "loss": 0.1979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19520597159862518, |
| "step": 950, |
| "valid_targets_mean": 5171.9, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 1.5158730158730158, |
| "grad_norm": 0.45814725913527155, |
| "learning_rate": 3.837371449220717e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.191867396235466, |
| "step": 955, |
| "valid_targets_mean": 6292.2, |
| "valid_targets_min": 3359 |
| }, |
| { |
| "epoch": 1.5238095238095237, |
| "grad_norm": 0.3660046705130465, |
| "learning_rate": 3.834230599176251e-05, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16699504852294922, |
| "step": 960, |
| "valid_targets_mean": 6213.4, |
| "valid_targets_min": 2488 |
| }, |
| { |
| "epoch": 1.5317460317460316, |
| "grad_norm": 0.3890844674038831, |
| "learning_rate": 3.831061019442864e-05, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20834946632385254, |
| "step": 965, |
| "valid_targets_mean": 5682.8, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 1.5396825396825395, |
| "grad_norm": 0.442290989827857, |
| "learning_rate": 3.827862759665916e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2266271859407425, |
| "step": 970, |
| "valid_targets_mean": 5248.5, |
| "valid_targets_min": 1995 |
| }, |
| { |
| "epoch": 1.5476190476190477, |
| "grad_norm": 0.4156925522612072, |
| "learning_rate": 3.8246358699399853e-05, |
| "loss": 0.1998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16675469279289246, |
| "step": 975, |
| "valid_targets_mean": 4952.9, |
| "valid_targets_min": 277 |
| }, |
| { |
| "epoch": 1.5555555555555556, |
| "grad_norm": 0.37604931667074504, |
| "learning_rate": 3.8213804008080824e-05, |
| "loss": 0.1981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18879935145378113, |
| "step": 980, |
| "valid_targets_mean": 6674.0, |
| "valid_targets_min": 3077 |
| }, |
| { |
| "epoch": 1.5634920634920635, |
| "grad_norm": 0.4287194995251398, |
| "learning_rate": 3.818096403260862e-05, |
| "loss": 0.1951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20438791811466217, |
| "step": 985, |
| "valid_targets_mean": 5784.4, |
| "valid_targets_min": 1565 |
| }, |
| { |
| "epoch": 1.5714285714285714, |
| "grad_norm": 0.44022259559851695, |
| "learning_rate": 3.8147839287358185e-05, |
| "loss": 0.2104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21569909155368805, |
| "step": 990, |
| "valid_targets_mean": 5262.6, |
| "valid_targets_min": 1953 |
| }, |
| { |
| "epoch": 1.5793650793650795, |
| "grad_norm": 0.466156003317299, |
| "learning_rate": 3.8114430291164836e-05, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1877652108669281, |
| "step": 995, |
| "valid_targets_mean": 4195.9, |
| "valid_targets_min": 361 |
| }, |
| { |
| "epoch": 1.5873015873015874, |
| "grad_norm": 0.38334955845745405, |
| "learning_rate": 3.808073756731615e-05, |
| "loss": 0.1842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1762232482433319, |
| "step": 1000, |
| "valid_targets_mean": 5545.6, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 1.5952380952380953, |
| "grad_norm": 0.5439994931547266, |
| "learning_rate": 3.8046761643543734e-05, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1913871467113495, |
| "step": 1005, |
| "valid_targets_mean": 4491.5, |
| "valid_targets_min": 369 |
| }, |
| { |
| "epoch": 1.6031746031746033, |
| "grad_norm": 0.40075365186274436, |
| "learning_rate": 3.8012503052014996e-05, |
| "loss": 0.2202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1946803331375122, |
| "step": 1010, |
| "valid_targets_mean": 5425.6, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 1.6111111111111112, |
| "grad_norm": 0.3877028365107908, |
| "learning_rate": 3.797796232932476e-05, |
| "loss": 0.203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21146497130393982, |
| "step": 1015, |
| "valid_targets_mean": 6453.6, |
| "valid_targets_min": 2839 |
| }, |
| { |
| "epoch": 1.619047619047619, |
| "grad_norm": 0.3668527782681026, |
| "learning_rate": 3.794314001648692e-05, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18072551488876343, |
| "step": 1020, |
| "valid_targets_mean": 6010.3, |
| "valid_targets_min": 2661 |
| }, |
| { |
| "epoch": 1.626984126984127, |
| "grad_norm": 0.44781816078627307, |
| "learning_rate": 3.7908036658925926e-05, |
| "loss": 0.1919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2001311182975769, |
| "step": 1025, |
| "valid_targets_mean": 5515.9, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 1.6349206349206349, |
| "grad_norm": 0.40397196550171016, |
| "learning_rate": 3.787265280646825e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19972187280654907, |
| "step": 1030, |
| "valid_targets_mean": 5461.7, |
| "valid_targets_min": 289 |
| }, |
| { |
| "epoch": 1.6428571428571428, |
| "grad_norm": 0.4356586536795959, |
| "learning_rate": 3.7836989013333776e-05, |
| "loss": 0.2041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1890064775943756, |
| "step": 1035, |
| "valid_targets_mean": 5751.4, |
| "valid_targets_min": 211 |
| }, |
| { |
| "epoch": 1.6507936507936507, |
| "grad_norm": 0.44136645672562447, |
| "learning_rate": 3.780104583812712e-05, |
| "loss": 0.1952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1881527304649353, |
| "step": 1040, |
| "valid_targets_mean": 5342.1, |
| "valid_targets_min": 827 |
| }, |
| { |
| "epoch": 1.6587301587301586, |
| "grad_norm": 0.4490662637016875, |
| "learning_rate": 3.7764823843828883e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20181840658187866, |
| "step": 1045, |
| "valid_targets_mean": 4998.9, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.414814689156328, |
| "learning_rate": 3.7728323597786834e-05, |
| "loss": 0.193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2113458514213562, |
| "step": 1050, |
| "valid_targets_mean": 5317.9, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 1.6746031746031746, |
| "grad_norm": 0.4002735439554692, |
| "learning_rate": 3.7691545671707007e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19339720904827118, |
| "step": 1055, |
| "valid_targets_mean": 5467.6, |
| "valid_targets_min": 304 |
| }, |
| { |
| "epoch": 1.6825396825396826, |
| "grad_norm": 0.34935950618209505, |
| "learning_rate": 3.765449064164477e-05, |
| "loss": 0.1992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16387102007865906, |
| "step": 1060, |
| "valid_targets_mean": 5961.0, |
| "valid_targets_min": 1397 |
| }, |
| { |
| "epoch": 1.6904761904761905, |
| "grad_norm": 0.4617875758265747, |
| "learning_rate": 3.7617159087995784e-05, |
| "loss": 0.1952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20451588928699493, |
| "step": 1065, |
| "valid_targets_mean": 5329.4, |
| "valid_targets_min": 1754 |
| }, |
| { |
| "epoch": 1.6984126984126984, |
| "grad_norm": 0.43000065083291655, |
| "learning_rate": 3.757955159548693e-05, |
| "loss": 0.2123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19835901260375977, |
| "step": 1070, |
| "valid_targets_mean": 5593.4, |
| "valid_targets_min": 1554 |
| }, |
| { |
| "epoch": 1.7063492063492065, |
| "grad_norm": 0.3606371311330236, |
| "learning_rate": 3.754166875316713e-05, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18690404295921326, |
| "step": 1075, |
| "valid_targets_mean": 6369.9, |
| "valid_targets_min": 2694 |
| }, |
| { |
| "epoch": 1.7142857142857144, |
| "grad_norm": 0.39285827605092777, |
| "learning_rate": 3.750351115439812e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20067650079727173, |
| "step": 1080, |
| "valid_targets_mean": 5648.6, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 1.7222222222222223, |
| "grad_norm": 0.38570908603943815, |
| "learning_rate": 3.746507939684519e-05, |
| "loss": 0.1901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19070516526699066, |
| "step": 1085, |
| "valid_targets_mean": 6492.1, |
| "valid_targets_min": 3263 |
| }, |
| { |
| "epoch": 1.7301587301587302, |
| "grad_norm": 0.39910170101731635, |
| "learning_rate": 3.742637408246779e-05, |
| "loss": 0.2, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21158373355865479, |
| "step": 1090, |
| "valid_targets_mean": 6281.1, |
| "valid_targets_min": 1277 |
| }, |
| { |
| "epoch": 1.7380952380952381, |
| "grad_norm": 0.49874739628178993, |
| "learning_rate": 3.73873958175101e-05, |
| "loss": 0.2025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20216044783592224, |
| "step": 1095, |
| "valid_targets_mean": 4570.4, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 1.746031746031746, |
| "grad_norm": 0.47674802821687573, |
| "learning_rate": 3.734814521249156e-05, |
| "loss": 0.2124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21278969943523407, |
| "step": 1100, |
| "valid_targets_mean": 6688.0, |
| "valid_targets_min": 4913 |
| }, |
| { |
| "epoch": 1.753968253968254, |
| "grad_norm": 0.4208345610037382, |
| "learning_rate": 3.7308622882197294e-05, |
| "loss": 0.2021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20342180132865906, |
| "step": 1105, |
| "valid_targets_mean": 4974.2, |
| "valid_targets_min": 1373 |
| }, |
| { |
| "epoch": 1.7619047619047619, |
| "grad_norm": 0.5036978972360446, |
| "learning_rate": 3.7268829445668456e-05, |
| "loss": 0.1913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19987335801124573, |
| "step": 1110, |
| "valid_targets_mean": 4656.1, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 1.7698412698412698, |
| "grad_norm": 0.4475822251477478, |
| "learning_rate": 3.722876552619257e-05, |
| "loss": 0.1953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1833523064851761, |
| "step": 1115, |
| "valid_targets_mean": 5454.4, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 1.7777777777777777, |
| "grad_norm": 0.42301407783978096, |
| "learning_rate": 3.718843175129378e-05, |
| "loss": 0.1906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1914646029472351, |
| "step": 1120, |
| "valid_targets_mean": 6252.5, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 1.7857142857142856, |
| "grad_norm": 0.3667105929189479, |
| "learning_rate": 3.7147828752722944e-05, |
| "loss": 0.1872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18096204102039337, |
| "step": 1125, |
| "valid_targets_mean": 5728.2, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 1.7936507936507935, |
| "grad_norm": 0.3988857634933404, |
| "learning_rate": 3.7106957166447834e-05, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20091086626052856, |
| "step": 1130, |
| "valid_targets_mean": 6323.2, |
| "valid_targets_min": 2797 |
| }, |
| { |
| "epoch": 1.8015873015873016, |
| "grad_norm": 0.4353965199064458, |
| "learning_rate": 3.7065817632643115e-05, |
| "loss": 0.1983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2031416893005371, |
| "step": 1135, |
| "valid_targets_mean": 5034.0, |
| "valid_targets_min": 1545 |
| }, |
| { |
| "epoch": 1.8095238095238095, |
| "grad_norm": 0.3835363845414605, |
| "learning_rate": 3.7024410795680326e-05, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20650315284729004, |
| "step": 1140, |
| "valid_targets_mean": 5709.4, |
| "valid_targets_min": 2868 |
| }, |
| { |
| "epoch": 1.8174603174603174, |
| "grad_norm": 0.6017933902148771, |
| "learning_rate": 3.698273730411782e-05, |
| "loss": 0.1895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21874158084392548, |
| "step": 1145, |
| "valid_targets_mean": 4664.8, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 1.8253968253968254, |
| "grad_norm": 0.5010674614611315, |
| "learning_rate": 3.694079781069053e-05, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22206932306289673, |
| "step": 1150, |
| "valid_targets_mean": 5182.3, |
| "valid_targets_min": 1754 |
| }, |
| { |
| "epoch": 1.8333333333333335, |
| "grad_norm": 0.3923636627441356, |
| "learning_rate": 3.6898592972299875e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17895236611366272, |
| "step": 1155, |
| "valid_targets_mean": 5307.1, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 1.8412698412698414, |
| "grad_norm": 0.46097320064253466, |
| "learning_rate": 3.6856123450003306e-05, |
| "loss": 0.1934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17629393935203552, |
| "step": 1160, |
| "valid_targets_mean": 5396.4, |
| "valid_targets_min": 1717 |
| }, |
| { |
| "epoch": 1.8492063492063493, |
| "grad_norm": 0.4118263198386797, |
| "learning_rate": 3.68133899090041e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21603277325630188, |
| "step": 1165, |
| "valid_targets_mean": 5743.1, |
| "valid_targets_min": 1944 |
| }, |
| { |
| "epoch": 1.8571428571428572, |
| "grad_norm": 0.40887713694857647, |
| "learning_rate": 3.677039301864085e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21704469621181488, |
| "step": 1170, |
| "valid_targets_mean": 5467.9, |
| "valid_targets_min": 1922 |
| }, |
| { |
| "epoch": 1.8650793650793651, |
| "grad_norm": 0.3934682878408651, |
| "learning_rate": 3.672713345237701e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19257432222366333, |
| "step": 1175, |
| "valid_targets_mean": 5539.5, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 1.873015873015873, |
| "grad_norm": 0.40297241825152724, |
| "learning_rate": 3.6683611887790356e-05, |
| "loss": 0.1949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22532138228416443, |
| "step": 1180, |
| "valid_targets_mean": 5603.6, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 1.880952380952381, |
| "grad_norm": 0.4525568905524082, |
| "learning_rate": 3.663982900656236e-05, |
| "loss": 0.1941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21516132354736328, |
| "step": 1185, |
| "valid_targets_mean": 4871.1, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 1.8888888888888888, |
| "grad_norm": 0.3826095420283405, |
| "learning_rate": 3.6595785494467516e-05, |
| "loss": 0.2033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2126571089029312, |
| "step": 1190, |
| "valid_targets_mean": 6149.8, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 1.8968253968253967, |
| "grad_norm": 0.49491876878445984, |
| "learning_rate": 3.655148204136259e-05, |
| "loss": 0.2157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1980828046798706, |
| "step": 1195, |
| "valid_targets_mean": 4812.1, |
| "valid_targets_min": 355 |
| }, |
| { |
| "epoch": 1.9047619047619047, |
| "grad_norm": 0.3844425255192722, |
| "learning_rate": 3.650691934117584e-05, |
| "loss": 0.1961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17985425889492035, |
| "step": 1200, |
| "valid_targets_mean": 5473.3, |
| "valid_targets_min": 2775 |
| }, |
| { |
| "epoch": 1.9126984126984126, |
| "grad_norm": 0.4025013315745311, |
| "learning_rate": 3.646209809189611e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2079595923423767, |
| "step": 1205, |
| "valid_targets_mean": 5829.4, |
| "valid_targets_min": 2090 |
| }, |
| { |
| "epoch": 1.9206349206349205, |
| "grad_norm": 0.3718395023938511, |
| "learning_rate": 3.641701899556192e-05, |
| "loss": 0.1909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20109693706035614, |
| "step": 1210, |
| "valid_targets_mean": 5616.2, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 1.9285714285714286, |
| "grad_norm": 0.41192663980117594, |
| "learning_rate": 3.63716827582505e-05, |
| "loss": 0.2066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19556891918182373, |
| "step": 1215, |
| "valid_targets_mean": 5405.4, |
| "valid_targets_min": 260 |
| }, |
| { |
| "epoch": 1.9365079365079365, |
| "grad_norm": 0.4061502796105446, |
| "learning_rate": 3.632609009006665e-05, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1885574758052826, |
| "step": 1220, |
| "valid_targets_mean": 4830.4, |
| "valid_targets_min": 1806 |
| }, |
| { |
| "epoch": 1.9444444444444444, |
| "grad_norm": 0.394449808870156, |
| "learning_rate": 3.62802417051317e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1800915151834488, |
| "step": 1225, |
| "valid_targets_mean": 5700.7, |
| "valid_targets_min": 403 |
| }, |
| { |
| "epoch": 1.9523809523809523, |
| "grad_norm": 0.4440079869221486, |
| "learning_rate": 3.6234138321572274e-05, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17726945877075195, |
| "step": 1230, |
| "valid_targets_mean": 5161.5, |
| "valid_targets_min": 1498 |
| }, |
| { |
| "epoch": 1.9603174603174605, |
| "grad_norm": 0.4620529228104198, |
| "learning_rate": 3.6187780661509074e-05, |
| "loss": 0.2106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22657737135887146, |
| "step": 1235, |
| "valid_targets_mean": 5007.8, |
| "valid_targets_min": 1843 |
| }, |
| { |
| "epoch": 1.9682539682539684, |
| "grad_norm": 0.4536224923690941, |
| "learning_rate": 3.6141169451045526e-05, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1943274736404419, |
| "step": 1240, |
| "valid_targets_mean": 4127.1, |
| "valid_targets_min": 391 |
| }, |
| { |
| "epoch": 1.9761904761904763, |
| "grad_norm": 0.46913089325037155, |
| "learning_rate": 3.609430542025646e-05, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17612981796264648, |
| "step": 1245, |
| "valid_targets_mean": 5872.5, |
| "valid_targets_min": 1386 |
| }, |
| { |
| "epoch": 1.9841269841269842, |
| "grad_norm": 0.40006665679686376, |
| "learning_rate": 3.604718930317664e-05, |
| "loss": 0.1935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21723848581314087, |
| "step": 1250, |
| "valid_targets_mean": 5627.9, |
| "valid_targets_min": 1877 |
| }, |
| { |
| "epoch": 1.992063492063492, |
| "grad_norm": 0.4171450102000576, |
| "learning_rate": 3.5999821837789275e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17687958478927612, |
| "step": 1255, |
| "valid_targets_mean": 4820.7, |
| "valid_targets_min": 275 |
| }, |
| { |
| "epoch": 2.0, |
| "grad_norm": 0.39376114464436146, |
| "learning_rate": 3.595220376601447e-05, |
| "loss": 0.1858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16747349500656128, |
| "step": 1260, |
| "valid_targets_mean": 5956.8, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 2.007936507936508, |
| "grad_norm": 0.42367770753786105, |
| "learning_rate": 3.590433583369758e-05, |
| "loss": 0.1755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.164157897233963, |
| "step": 1265, |
| "valid_targets_mean": 6732.4, |
| "valid_targets_min": 3077 |
| }, |
| { |
| "epoch": 2.015873015873016, |
| "grad_norm": 0.43491398653549607, |
| "learning_rate": 3.5856218790597554e-05, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16858386993408203, |
| "step": 1270, |
| "valid_targets_mean": 4635.7, |
| "valid_targets_min": 267 |
| }, |
| { |
| "epoch": 2.0238095238095237, |
| "grad_norm": 0.4336346848049278, |
| "learning_rate": 3.580785339037519e-05, |
| "loss": 0.1762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1782153844833374, |
| "step": 1275, |
| "valid_targets_mean": 5509.9, |
| "valid_targets_min": 2820 |
| }, |
| { |
| "epoch": 2.0317460317460316, |
| "grad_norm": 0.4219922314179232, |
| "learning_rate": 3.57592403905813e-05, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17715319991111755, |
| "step": 1280, |
| "valid_targets_mean": 5722.5, |
| "valid_targets_min": 269 |
| }, |
| { |
| "epoch": 2.0396825396825395, |
| "grad_norm": 0.3940209379170676, |
| "learning_rate": 3.571038055264489e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16919057071208954, |
| "step": 1285, |
| "valid_targets_mean": 5806.7, |
| "valid_targets_min": 2137 |
| }, |
| { |
| "epoch": 2.0476190476190474, |
| "grad_norm": 0.9513050625567275, |
| "learning_rate": 3.566127464186119e-05, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17070958018302917, |
| "step": 1290, |
| "valid_targets_mean": 6109.1, |
| "valid_targets_min": 2815 |
| }, |
| { |
| "epoch": 2.0555555555555554, |
| "grad_norm": 0.39178871800874376, |
| "learning_rate": 3.56119234273797e-05, |
| "loss": 0.1696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15980932116508484, |
| "step": 1295, |
| "valid_targets_mean": 6312.2, |
| "valid_targets_min": 2200 |
| }, |
| { |
| "epoch": 2.0634920634920633, |
| "grad_norm": 0.4545939454742837, |
| "learning_rate": 3.5562327682192134e-05, |
| "loss": 0.184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17266622185707092, |
| "step": 1300, |
| "valid_targets_mean": 5758.9, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 2.0714285714285716, |
| "grad_norm": 0.40752366743563423, |
| "learning_rate": 3.5512488183120286e-05, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18903039395809174, |
| "step": 1305, |
| "valid_targets_mean": 6031.5, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 2.0793650793650795, |
| "grad_norm": 0.43154212786267104, |
| "learning_rate": 3.54624057108039e-05, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1685219407081604, |
| "step": 1310, |
| "valid_targets_mean": 4359.1, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 2.0873015873015874, |
| "grad_norm": 0.41368733303715804, |
| "learning_rate": 3.5412081049688444e-05, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1651342809200287, |
| "step": 1315, |
| "valid_targets_mean": 5127.6, |
| "valid_targets_min": 1605 |
| }, |
| { |
| "epoch": 2.0952380952380953, |
| "grad_norm": 0.38589454302426857, |
| "learning_rate": 3.5361514988012774e-05, |
| "loss": 0.1771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1480841338634491, |
| "step": 1320, |
| "valid_targets_mean": 5874.6, |
| "valid_targets_min": 1503 |
| }, |
| { |
| "epoch": 2.1031746031746033, |
| "grad_norm": 0.43713259076728145, |
| "learning_rate": 3.5310708317796844e-05, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16304585337638855, |
| "step": 1325, |
| "valid_targets_mean": 5606.6, |
| "valid_targets_min": 2620 |
| }, |
| { |
| "epoch": 2.111111111111111, |
| "grad_norm": 0.5149351729670725, |
| "learning_rate": 3.5259661834829266e-05, |
| "loss": 0.1915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17917974293231964, |
| "step": 1330, |
| "valid_targets_mean": 6228.2, |
| "valid_targets_min": 1503 |
| }, |
| { |
| "epoch": 2.119047619047619, |
| "grad_norm": 0.3861389835108437, |
| "learning_rate": 3.5208376338654866e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16448023915290833, |
| "step": 1335, |
| "valid_targets_mean": 6666.1, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 2.126984126984127, |
| "grad_norm": 0.38207111066871835, |
| "learning_rate": 3.515685263256214e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17809657752513885, |
| "step": 1340, |
| "valid_targets_mean": 6127.4, |
| "valid_targets_min": 1544 |
| }, |
| { |
| "epoch": 2.134920634920635, |
| "grad_norm": 0.4127592358303544, |
| "learning_rate": 3.51050915235707e-05, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18220895528793335, |
| "step": 1345, |
| "valid_targets_mean": 5229.9, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 2.142857142857143, |
| "grad_norm": 0.42540313592591483, |
| "learning_rate": 3.5053093822418596e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1991414576768875, |
| "step": 1350, |
| "valid_targets_mean": 5462.2, |
| "valid_targets_min": 2257 |
| }, |
| { |
| "epoch": 2.1507936507936507, |
| "grad_norm": 0.39687138441854536, |
| "learning_rate": 3.500086034354966e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20256337523460388, |
| "step": 1355, |
| "valid_targets_mean": 5684.8, |
| "valid_targets_min": 2415 |
| }, |
| { |
| "epoch": 2.1587301587301586, |
| "grad_norm": 0.44932267888477845, |
| "learning_rate": 3.494839190510071e-05, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17283421754837036, |
| "step": 1360, |
| "valid_targets_mean": 4960.4, |
| "valid_targets_min": 2345 |
| }, |
| { |
| "epoch": 2.1666666666666665, |
| "grad_norm": 0.49624084160009224, |
| "learning_rate": 3.489568932888877e-05, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1903117299079895, |
| "step": 1365, |
| "valid_targets_mean": 5084.8, |
| "valid_targets_min": 301 |
| }, |
| { |
| "epoch": 2.1746031746031744, |
| "grad_norm": 0.42424536754472875, |
| "learning_rate": 3.484275344039815e-05, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1761750876903534, |
| "step": 1370, |
| "valid_targets_mean": 4764.8, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 2.1825396825396823, |
| "grad_norm": 0.3930655272562859, |
| "learning_rate": 3.478958506876759e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16021452844142914, |
| "step": 1375, |
| "valid_targets_mean": 5342.4, |
| "valid_targets_min": 2886 |
| }, |
| { |
| "epoch": 2.1904761904761907, |
| "grad_norm": 0.5253004636054942, |
| "learning_rate": 3.47361850467772e-05, |
| "loss": 0.1835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1926204413175583, |
| "step": 1380, |
| "valid_targets_mean": 5126.9, |
| "valid_targets_min": 2220 |
| }, |
| { |
| "epoch": 2.1984126984126986, |
| "grad_norm": 0.3913488618062026, |
| "learning_rate": 3.468255421083546e-05, |
| "loss": 0.1869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2079114466905594, |
| "step": 1385, |
| "valid_targets_mean": 6658.1, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 2.2063492063492065, |
| "grad_norm": 0.4343501732005746, |
| "learning_rate": 3.46286934009661e-05, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1819835603237152, |
| "step": 1390, |
| "valid_targets_mean": 4903.1, |
| "valid_targets_min": 1946 |
| }, |
| { |
| "epoch": 2.2142857142857144, |
| "grad_norm": 0.4642383235525826, |
| "learning_rate": 3.457460346079495e-05, |
| "loss": 0.174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1960304081439972, |
| "step": 1395, |
| "valid_targets_mean": 4859.3, |
| "valid_targets_min": 1756 |
| }, |
| { |
| "epoch": 2.2222222222222223, |
| "grad_norm": 0.39883822754099246, |
| "learning_rate": 3.452028523753673e-05, |
| "loss": 0.1821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1751224845647812, |
| "step": 1400, |
| "valid_targets_mean": 5698.9, |
| "valid_targets_min": 1531 |
| }, |
| { |
| "epoch": 2.2301587301587302, |
| "grad_norm": 0.37010389401431576, |
| "learning_rate": 3.446573958198176e-05, |
| "loss": 0.1812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18461816012859344, |
| "step": 1405, |
| "valid_targets_mean": 6230.6, |
| "valid_targets_min": 1700 |
| }, |
| { |
| "epoch": 2.238095238095238, |
| "grad_norm": 0.6181478614629903, |
| "learning_rate": 3.4410967348482666e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14911070466041565, |
| "step": 1410, |
| "valid_targets_mean": 4602.1, |
| "valid_targets_min": 1798 |
| }, |
| { |
| "epoch": 2.246031746031746, |
| "grad_norm": 0.43108429750485655, |
| "learning_rate": 3.435596939494098e-05, |
| "loss": 0.1786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1552506387233734, |
| "step": 1415, |
| "valid_targets_mean": 5343.7, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 2.253968253968254, |
| "grad_norm": 0.3655618940959395, |
| "learning_rate": 3.430074658279369e-05, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16736620664596558, |
| "step": 1420, |
| "valid_targets_mean": 6760.8, |
| "valid_targets_min": 4142 |
| }, |
| { |
| "epoch": 2.261904761904762, |
| "grad_norm": 0.43470898698901705, |
| "learning_rate": 3.424529977699977e-05, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18593010306358337, |
| "step": 1425, |
| "valid_targets_mean": 5456.4, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 2.2698412698412698, |
| "grad_norm": 0.4012757385555316, |
| "learning_rate": 3.418962984602661e-05, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2028789222240448, |
| "step": 1430, |
| "valid_targets_mean": 6217.8, |
| "valid_targets_min": 2538 |
| }, |
| { |
| "epoch": 2.2777777777777777, |
| "grad_norm": 0.422277687599635, |
| "learning_rate": 3.413373766183646e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17681989073753357, |
| "step": 1435, |
| "valid_targets_mean": 5242.7, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 2.2857142857142856, |
| "grad_norm": 0.4610732403739008, |
| "learning_rate": 3.40776240998727e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19924741983413696, |
| "step": 1440, |
| "valid_targets_mean": 5244.7, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 2.2936507936507935, |
| "grad_norm": 0.4230850293753159, |
| "learning_rate": 3.4021290039046184e-05, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18189997971057892, |
| "step": 1445, |
| "valid_targets_mean": 5056.2, |
| "valid_targets_min": 287 |
| }, |
| { |
| "epoch": 2.3015873015873014, |
| "grad_norm": 0.4282446015574262, |
| "learning_rate": 3.396473636172146e-05, |
| "loss": 0.1823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1614503115415573, |
| "step": 1450, |
| "valid_targets_mean": 5646.3, |
| "valid_targets_min": 1748 |
| }, |
| { |
| "epoch": 2.3095238095238093, |
| "grad_norm": 0.35393446023512337, |
| "learning_rate": 3.390796395370294e-05, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1533820927143097, |
| "step": 1455, |
| "valid_targets_mean": 6412.6, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 2.317460317460317, |
| "grad_norm": 0.4006705141341369, |
| "learning_rate": 3.385097370422102e-05, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17715230584144592, |
| "step": 1460, |
| "valid_targets_mean": 5679.0, |
| "valid_targets_min": 1403 |
| }, |
| { |
| "epoch": 2.3253968253968256, |
| "grad_norm": 0.41667317090980344, |
| "learning_rate": 3.3793766505918185e-05, |
| "loss": 0.1827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18403995037078857, |
| "step": 1465, |
| "valid_targets_mean": 5691.4, |
| "valid_targets_min": 1804 |
| }, |
| { |
| "epoch": 2.3333333333333335, |
| "grad_norm": 0.4438049911035154, |
| "learning_rate": 3.3736343254834994e-05, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16705909371376038, |
| "step": 1470, |
| "valid_targets_mean": 5163.1, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 2.3412698412698414, |
| "grad_norm": 0.41724254225439533, |
| "learning_rate": 3.3678704850396045e-05, |
| "loss": 0.1803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20384517312049866, |
| "step": 1475, |
| "valid_targets_mean": 5862.2, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 2.3492063492063493, |
| "grad_norm": 0.4965895506653012, |
| "learning_rate": 3.362085219539592e-05, |
| "loss": 0.1903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19839468598365784, |
| "step": 1480, |
| "valid_targets_mean": 5439.9, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 2.357142857142857, |
| "grad_norm": 0.38336740154664095, |
| "learning_rate": 3.3562786195985025e-05, |
| "loss": 0.1821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.190034419298172, |
| "step": 1485, |
| "valid_targets_mean": 6053.7, |
| "valid_targets_min": 3073 |
| }, |
| { |
| "epoch": 2.365079365079365, |
| "grad_norm": 0.42799053268182136, |
| "learning_rate": 3.350450776165535e-05, |
| "loss": 0.1843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17199914157390594, |
| "step": 1490, |
| "valid_targets_mean": 5109.0, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 2.373015873015873, |
| "grad_norm": 0.49042106827448145, |
| "learning_rate": 3.344601780522634e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18558023869991302, |
| "step": 1495, |
| "valid_targets_mean": 4502.5, |
| "valid_targets_min": 1358 |
| }, |
| { |
| "epoch": 2.380952380952381, |
| "grad_norm": 0.452178036330889, |
| "learning_rate": 3.3387317242830466e-05, |
| "loss": 0.1873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17586269974708557, |
| "step": 1500, |
| "valid_targets_mean": 5095.8, |
| "valid_targets_min": 271 |
| }, |
| { |
| "epoch": 2.388888888888889, |
| "grad_norm": 0.4167028985093456, |
| "learning_rate": 3.332840699389897e-05, |
| "loss": 0.1721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16293631494045258, |
| "step": 1505, |
| "valid_targets_mean": 5093.2, |
| "valid_targets_min": 1199 |
| }, |
| { |
| "epoch": 2.3968253968253967, |
| "grad_norm": 0.4134999974854722, |
| "learning_rate": 3.32692879811474e-05, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16504386067390442, |
| "step": 1510, |
| "valid_targets_mean": 4788.2, |
| "valid_targets_min": 281 |
| }, |
| { |
| "epoch": 2.4047619047619047, |
| "grad_norm": 0.38629332618116435, |
| "learning_rate": 3.320996113056123e-05, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16470927000045776, |
| "step": 1515, |
| "valid_targets_mean": 5480.1, |
| "valid_targets_min": 1382 |
| }, |
| { |
| "epoch": 2.4126984126984126, |
| "grad_norm": 0.4517489878934338, |
| "learning_rate": 3.315042737138128e-05, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19131216406822205, |
| "step": 1520, |
| "valid_targets_mean": 5177.0, |
| "valid_targets_min": 1427 |
| }, |
| { |
| "epoch": 2.4206349206349205, |
| "grad_norm": 0.3912437196261749, |
| "learning_rate": 3.309068763608919e-05, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15866073966026306, |
| "step": 1525, |
| "valid_targets_mean": 4809.5, |
| "valid_targets_min": 304 |
| }, |
| { |
| "epoch": 2.4285714285714284, |
| "grad_norm": 0.4287081470079961, |
| "learning_rate": 3.303074286039285e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18889503180980682, |
| "step": 1530, |
| "valid_targets_mean": 5050.8, |
| "valid_targets_min": 1050 |
| }, |
| { |
| "epoch": 2.4365079365079367, |
| "grad_norm": 0.5226823839069293, |
| "learning_rate": 3.2970593983211694e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17266133427619934, |
| "step": 1535, |
| "valid_targets_mean": 5716.3, |
| "valid_targets_min": 2116 |
| }, |
| { |
| "epoch": 2.4444444444444446, |
| "grad_norm": 0.4142977777917709, |
| "learning_rate": 3.2910241946661993e-05, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17832788825035095, |
| "step": 1540, |
| "valid_targets_mean": 5296.9, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 2.4523809523809526, |
| "grad_norm": 0.4094380830442922, |
| "learning_rate": 3.2849687696042165e-05, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16501125693321228, |
| "step": 1545, |
| "valid_targets_mean": 5243.6, |
| "valid_targets_min": 337 |
| }, |
| { |
| "epoch": 2.4603174603174605, |
| "grad_norm": 0.5264844857969575, |
| "learning_rate": 3.2788932179817886e-05, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19089126586914062, |
| "step": 1550, |
| "valid_targets_mean": 4228.1, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 2.4682539682539684, |
| "grad_norm": 0.3870078917146876, |
| "learning_rate": 3.2727976349607276e-05, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16617675125598907, |
| "step": 1555, |
| "valid_targets_mean": 5233.7, |
| "valid_targets_min": 283 |
| }, |
| { |
| "epoch": 2.4761904761904763, |
| "grad_norm": 0.37140129207143047, |
| "learning_rate": 3.266682116016599e-05, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15645205974578857, |
| "step": 1560, |
| "valid_targets_mean": 6038.5, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 2.484126984126984, |
| "grad_norm": 0.3972434967156975, |
| "learning_rate": 3.260546756937227e-05, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1872669756412506, |
| "step": 1565, |
| "valid_targets_mean": 5819.3, |
| "valid_targets_min": 343 |
| }, |
| { |
| "epoch": 2.492063492063492, |
| "grad_norm": 0.41540248633079907, |
| "learning_rate": 3.254391653821192e-05, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1847609579563141, |
| "step": 1570, |
| "valid_targets_mean": 5872.5, |
| "valid_targets_min": 366 |
| }, |
| { |
| "epoch": 2.5, |
| "grad_norm": 0.4326289822516213, |
| "learning_rate": 3.248216903076328e-05, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20463158190250397, |
| "step": 1575, |
| "valid_targets_mean": 5289.8, |
| "valid_targets_min": 279 |
| }, |
| { |
| "epoch": 2.507936507936508, |
| "grad_norm": 0.5002103630542671, |
| "learning_rate": 3.24202260141821e-05, |
| "loss": 0.1849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19607800245285034, |
| "step": 1580, |
| "valid_targets_mean": 4856.6, |
| "valid_targets_min": 377 |
| }, |
| { |
| "epoch": 2.515873015873016, |
| "grad_norm": 0.44088426161151917, |
| "learning_rate": 3.235808845868641e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17973065376281738, |
| "step": 1585, |
| "valid_targets_mean": 5105.2, |
| "valid_targets_min": 307 |
| }, |
| { |
| "epoch": 2.5238095238095237, |
| "grad_norm": 0.41586874944924196, |
| "learning_rate": 3.229575733754132e-05, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18156777322292328, |
| "step": 1590, |
| "valid_targets_mean": 5101.9, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 2.5317460317460316, |
| "grad_norm": 0.3977154984604151, |
| "learning_rate": 3.2233233627043765e-05, |
| "loss": 0.1802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19697993993759155, |
| "step": 1595, |
| "valid_targets_mean": 5949.2, |
| "valid_targets_min": 838 |
| }, |
| { |
| "epoch": 2.5396825396825395, |
| "grad_norm": 0.3893767013034315, |
| "learning_rate": 3.217051830650722e-05, |
| "loss": 0.1788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1648177206516266, |
| "step": 1600, |
| "valid_targets_mean": 5405.4, |
| "valid_targets_min": 633 |
| }, |
| { |
| "epoch": 2.5476190476190474, |
| "grad_norm": 0.4012855625129347, |
| "learning_rate": 3.210761235824639e-05, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1662881076335907, |
| "step": 1605, |
| "valid_targets_mean": 5683.6, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 2.5555555555555554, |
| "grad_norm": 0.41653714911973017, |
| "learning_rate": 3.204451676756175e-05, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1690150797367096, |
| "step": 1610, |
| "valid_targets_mean": 5188.4, |
| "valid_targets_min": 2353 |
| }, |
| { |
| "epoch": 2.5634920634920633, |
| "grad_norm": 0.43105631877085077, |
| "learning_rate": 3.198123252272419e-05, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1893271803855896, |
| "step": 1615, |
| "valid_targets_mean": 5241.9, |
| "valid_targets_min": 2285 |
| }, |
| { |
| "epoch": 2.571428571428571, |
| "grad_norm": 0.45967281455616704, |
| "learning_rate": 3.1917760614959505e-05, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19677485525608063, |
| "step": 1620, |
| "valid_targets_mean": 5801.2, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 2.5793650793650795, |
| "grad_norm": 0.40150052297597855, |
| "learning_rate": 3.1854102038432856e-05, |
| "loss": 0.1803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1876111626625061, |
| "step": 1625, |
| "valid_targets_mean": 5630.9, |
| "valid_targets_min": 404 |
| }, |
| { |
| "epoch": 2.5873015873015874, |
| "grad_norm": 0.352002911984159, |
| "learning_rate": 3.17902577902332e-05, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1494748890399933, |
| "step": 1630, |
| "valid_targets_mean": 5767.0, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 2.5952380952380953, |
| "grad_norm": 0.38659122601598817, |
| "learning_rate": 3.172622887035771e-05, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17912599444389343, |
| "step": 1635, |
| "valid_targets_mean": 5444.4, |
| "valid_targets_min": 260 |
| }, |
| { |
| "epoch": 2.6031746031746033, |
| "grad_norm": 0.566374914273737, |
| "learning_rate": 3.1662016281696073e-05, |
| "loss": 0.1954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1878930926322937, |
| "step": 1640, |
| "valid_targets_mean": 4545.0, |
| "valid_targets_min": 502 |
| }, |
| { |
| "epoch": 2.611111111111111, |
| "grad_norm": 0.40019696946056404, |
| "learning_rate": 3.15976210300148e-05, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19527481496334076, |
| "step": 1645, |
| "valid_targets_mean": 5715.0, |
| "valid_targets_min": 366 |
| }, |
| { |
| "epoch": 2.619047619047619, |
| "grad_norm": 0.39423172570166204, |
| "learning_rate": 3.153304412394143e-05, |
| "loss": 0.1652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1640002578496933, |
| "step": 1650, |
| "valid_targets_mean": 5794.7, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 2.626984126984127, |
| "grad_norm": 0.4024698863549588, |
| "learning_rate": 3.146828657494883e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1920669972896576, |
| "step": 1655, |
| "valid_targets_mean": 5749.9, |
| "valid_targets_min": 3138 |
| }, |
| { |
| "epoch": 2.634920634920635, |
| "grad_norm": 0.3925326135892127, |
| "learning_rate": 3.140334939733924e-05, |
| "loss": 0.1733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18373993039131165, |
| "step": 1660, |
| "valid_targets_mean": 5227.9, |
| "valid_targets_min": 2482 |
| }, |
| { |
| "epoch": 2.642857142857143, |
| "grad_norm": 0.46866690749449025, |
| "learning_rate": 3.1338233608228455e-05, |
| "loss": 0.1701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17870697379112244, |
| "step": 1665, |
| "valid_targets_mean": 5330.0, |
| "valid_targets_min": 609 |
| }, |
| { |
| "epoch": 2.6507936507936507, |
| "grad_norm": 0.3948699322229872, |
| "learning_rate": 3.127294022752988e-05, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16245272755622864, |
| "step": 1670, |
| "valid_targets_mean": 5712.2, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 2.6587301587301586, |
| "grad_norm": 0.33562761669358987, |
| "learning_rate": 3.120747027793854e-05, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1378447711467743, |
| "step": 1675, |
| "valid_targets_mean": 6322.2, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 2.6666666666666665, |
| "grad_norm": 0.4080788254926686, |
| "learning_rate": 3.114182478491509e-05, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16858676075935364, |
| "step": 1680, |
| "valid_targets_mean": 5623.9, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 2.674603174603175, |
| "grad_norm": 0.44788385062808955, |
| "learning_rate": 3.107600477666969e-05, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17567336559295654, |
| "step": 1685, |
| "valid_targets_mean": 5283.2, |
| "valid_targets_min": 2475 |
| }, |
| { |
| "epoch": 2.682539682539683, |
| "grad_norm": 0.3698134704035969, |
| "learning_rate": 3.1010011284146004e-05, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1585252285003662, |
| "step": 1690, |
| "valid_targets_mean": 5612.2, |
| "valid_targets_min": 1509 |
| }, |
| { |
| "epoch": 2.6904761904761907, |
| "grad_norm": 0.4744606363702609, |
| "learning_rate": 3.0943845341004944e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21260786056518555, |
| "step": 1695, |
| "valid_targets_mean": 4632.7, |
| "valid_targets_min": 268 |
| }, |
| { |
| "epoch": 2.6984126984126986, |
| "grad_norm": 0.3925483959574624, |
| "learning_rate": 3.087750798360856e-05, |
| "loss": 0.1717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1703377664089203, |
| "step": 1700, |
| "valid_targets_mean": 6203.7, |
| "valid_targets_min": 1733 |
| }, |
| { |
| "epoch": 2.7063492063492065, |
| "grad_norm": 0.423603961482913, |
| "learning_rate": 3.0811000251003774e-05, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1864738166332245, |
| "step": 1705, |
| "valid_targets_mean": 4999.4, |
| "valid_targets_min": 633 |
| }, |
| { |
| "epoch": 2.7142857142857144, |
| "grad_norm": 0.42173447744798365, |
| "learning_rate": 3.074432318490608e-05, |
| "loss": 0.1819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17015457153320312, |
| "step": 1710, |
| "valid_targets_mean": 4929.1, |
| "valid_targets_min": 1230 |
| }, |
| { |
| "epoch": 2.7222222222222223, |
| "grad_norm": 0.3656999014872132, |
| "learning_rate": 3.067747782968328e-05, |
| "loss": 0.1735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1662687063217163, |
| "step": 1715, |
| "valid_targets_mean": 5857.1, |
| "valid_targets_min": 1370 |
| }, |
| { |
| "epoch": 2.7301587301587302, |
| "grad_norm": 0.4250802423607952, |
| "learning_rate": 3.0610465232339096e-05, |
| "loss": 0.1802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17572614550590515, |
| "step": 1720, |
| "valid_targets_mean": 5605.6, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 2.738095238095238, |
| "grad_norm": 0.39832850275301074, |
| "learning_rate": 3.054328644249677e-05, |
| "loss": 0.174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17158354818820953, |
| "step": 1725, |
| "valid_targets_mean": 5492.9, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 2.746031746031746, |
| "grad_norm": 0.40611280034429587, |
| "learning_rate": 3.047594251238265e-05, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17876523733139038, |
| "step": 1730, |
| "valid_targets_mean": 5122.9, |
| "valid_targets_min": 1754 |
| }, |
| { |
| "epoch": 2.753968253968254, |
| "grad_norm": 0.3850213501848369, |
| "learning_rate": 3.0408434496809643e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1557503491640091, |
| "step": 1735, |
| "valid_targets_mean": 4817.9, |
| "valid_targets_min": 346 |
| }, |
| { |
| "epoch": 2.761904761904762, |
| "grad_norm": 0.43072814030855905, |
| "learning_rate": 3.034076345316079e-05, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1973961591720581, |
| "step": 1740, |
| "valid_targets_mean": 5802.5, |
| "valid_targets_min": 1788 |
| }, |
| { |
| "epoch": 2.7698412698412698, |
| "grad_norm": 0.4244003572959457, |
| "learning_rate": 3.0272930441372628e-05, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1777854859828949, |
| "step": 1745, |
| "valid_targets_mean": 5021.1, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 2.7777777777777777, |
| "grad_norm": 0.3968223319635917, |
| "learning_rate": 3.02049365239186e-05, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18718859553337097, |
| "step": 1750, |
| "valid_targets_mean": 5884.2, |
| "valid_targets_min": 3484 |
| }, |
| { |
| "epoch": 2.7857142857142856, |
| "grad_norm": 0.38979762153827907, |
| "learning_rate": 3.0136782765792455e-05, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.184782013297081, |
| "step": 1755, |
| "valid_targets_mean": 5326.1, |
| "valid_targets_min": 3768 |
| }, |
| { |
| "epoch": 2.7936507936507935, |
| "grad_norm": 0.401430603353089, |
| "learning_rate": 3.0068470234491517e-05, |
| "loss": 0.1816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18122202157974243, |
| "step": 1760, |
| "valid_targets_mean": 5606.8, |
| "valid_targets_min": 2889 |
| }, |
| { |
| "epoch": 2.8015873015873014, |
| "grad_norm": 0.46774432941464267, |
| "learning_rate": 3.0000000000000004e-05, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19038715958595276, |
| "step": 1765, |
| "valid_targets_mean": 5706.6, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 2.8095238095238093, |
| "grad_norm": 0.3900657231476483, |
| "learning_rate": 2.993137313477223e-05, |
| "loss": 0.1849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16720932722091675, |
| "step": 1770, |
| "valid_targets_mean": 5955.4, |
| "valid_targets_min": 229 |
| }, |
| { |
| "epoch": 2.817460317460317, |
| "grad_norm": 0.4671446489123995, |
| "learning_rate": 2.9862590713715837e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1919449269771576, |
| "step": 1775, |
| "valid_targets_mean": 4992.8, |
| "valid_targets_min": 1710 |
| }, |
| { |
| "epoch": 2.825396825396825, |
| "grad_norm": 0.4108207960556999, |
| "learning_rate": 2.9793653814174957e-05, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16805459558963776, |
| "step": 1780, |
| "valid_targets_mean": 5892.2, |
| "valid_targets_min": 1220 |
| }, |
| { |
| "epoch": 2.8333333333333335, |
| "grad_norm": 0.3878996578053704, |
| "learning_rate": 2.9724563515913317e-05, |
| "loss": 0.1669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16483880579471588, |
| "step": 1785, |
| "valid_targets_mean": 5715.8, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 2.8412698412698414, |
| "grad_norm": 0.3924118467590962, |
| "learning_rate": 2.9655320901097348e-05, |
| "loss": 0.1827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16196705400943756, |
| "step": 1790, |
| "valid_targets_mean": 5235.0, |
| "valid_targets_min": 2689 |
| }, |
| { |
| "epoch": 2.8492063492063493, |
| "grad_norm": 0.38981761916486113, |
| "learning_rate": 2.9585927054279224e-05, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1542998105287552, |
| "step": 1795, |
| "valid_targets_mean": 5381.4, |
| "valid_targets_min": 2263 |
| }, |
| { |
| "epoch": 2.857142857142857, |
| "grad_norm": 0.3581946508380772, |
| "learning_rate": 2.951638306237988e-05, |
| "loss": 0.1733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17149242758750916, |
| "step": 1800, |
| "valid_targets_mean": 6313.2, |
| "valid_targets_min": 1580 |
| }, |
| { |
| "epoch": 2.865079365079365, |
| "grad_norm": 0.4494970197989124, |
| "learning_rate": 2.9446690014671976e-05, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1602257341146469, |
| "step": 1805, |
| "valid_targets_mean": 5223.4, |
| "valid_targets_min": 935 |
| }, |
| { |
| "epoch": 2.873015873015873, |
| "grad_norm": 0.37530142354886875, |
| "learning_rate": 2.937684900276285e-05, |
| "loss": 0.17, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15792617201805115, |
| "step": 1810, |
| "valid_targets_mean": 5738.4, |
| "valid_targets_min": 2336 |
| }, |
| { |
| "epoch": 2.880952380952381, |
| "grad_norm": 0.39396887510337375, |
| "learning_rate": 2.9306861120577416e-05, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15244446694850922, |
| "step": 1815, |
| "valid_targets_mean": 5644.9, |
| "valid_targets_min": 1221 |
| }, |
| { |
| "epoch": 2.888888888888889, |
| "grad_norm": 0.3706798220884454, |
| "learning_rate": 2.923672746434103e-05, |
| "loss": 0.1754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1762312352657318, |
| "step": 1820, |
| "valid_targets_mean": 6201.0, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 2.8968253968253967, |
| "grad_norm": 0.4021984022426286, |
| "learning_rate": 2.9166449132562303e-05, |
| "loss": 0.1915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2141510546207428, |
| "step": 1825, |
| "valid_targets_mean": 5325.4, |
| "valid_targets_min": 1539 |
| }, |
| { |
| "epoch": 2.9047619047619047, |
| "grad_norm": 0.42224038990358104, |
| "learning_rate": 2.9096027226015927e-05, |
| "loss": 0.1742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18177683651447296, |
| "step": 1830, |
| "valid_targets_mean": 4708.6, |
| "valid_targets_min": 1117 |
| }, |
| { |
| "epoch": 2.9126984126984126, |
| "grad_norm": 0.3819006419400972, |
| "learning_rate": 2.9025462847725405e-05, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16706177592277527, |
| "step": 1835, |
| "valid_targets_mean": 6122.9, |
| "valid_targets_min": 2503 |
| }, |
| { |
| "epoch": 2.9206349206349205, |
| "grad_norm": 0.4410064177919863, |
| "learning_rate": 2.8954757102945798e-05, |
| "loss": 0.1898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2258429080247879, |
| "step": 1840, |
| "valid_targets_mean": 4895.2, |
| "valid_targets_min": 833 |
| }, |
| { |
| "epoch": 2.928571428571429, |
| "grad_norm": 0.39487518735853117, |
| "learning_rate": 2.888391109914638e-05, |
| "loss": 0.18, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17937694489955902, |
| "step": 1845, |
| "valid_targets_mean": 5114.6, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 2.9365079365079367, |
| "grad_norm": 0.38265019511969883, |
| "learning_rate": 2.8812925945993333e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17933601140975952, |
| "step": 1850, |
| "valid_targets_mean": 5663.7, |
| "valid_targets_min": 1513 |
| }, |
| { |
| "epoch": 2.9444444444444446, |
| "grad_norm": 0.402651671534175, |
| "learning_rate": 2.8741802755332332e-05, |
| "loss": 0.1891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17298966646194458, |
| "step": 1855, |
| "valid_targets_mean": 4725.4, |
| "valid_targets_min": 403 |
| }, |
| { |
| "epoch": 2.9523809523809526, |
| "grad_norm": 0.43929484251032125, |
| "learning_rate": 2.8670542641171155e-05, |
| "loss": 0.1949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19994154572486877, |
| "step": 1860, |
| "valid_targets_mean": 4797.8, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 2.9603174603174605, |
| "grad_norm": 0.40410989413843573, |
| "learning_rate": 2.859914671966221e-05, |
| "loss": 0.1717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17386558651924133, |
| "step": 1865, |
| "valid_targets_mean": 4977.1, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 2.9682539682539684, |
| "grad_norm": 0.346301301173511, |
| "learning_rate": 2.8527616109085082e-05, |
| "loss": 0.1743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15783601999282837, |
| "step": 1870, |
| "valid_targets_mean": 5833.5, |
| "valid_targets_min": 1896 |
| }, |
| { |
| "epoch": 2.9761904761904763, |
| "grad_norm": 0.38049759940528577, |
| "learning_rate": 2.8455951929828977e-05, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15591737627983093, |
| "step": 1875, |
| "valid_targets_mean": 5575.6, |
| "valid_targets_min": 295 |
| }, |
| { |
| "epoch": 2.984126984126984, |
| "grad_norm": 0.3831654484686578, |
| "learning_rate": 2.8384155304375223e-05, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19842402637004852, |
| "step": 1880, |
| "valid_targets_mean": 6079.8, |
| "valid_targets_min": 1937 |
| }, |
| { |
| "epoch": 2.992063492063492, |
| "grad_norm": 0.487008799638132, |
| "learning_rate": 2.8312227357279646e-05, |
| "loss": 0.1851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.192101389169693, |
| "step": 1885, |
| "valid_targets_mean": 4321.4, |
| "valid_targets_min": 342 |
| }, |
| { |
| "epoch": 3.0, |
| "grad_norm": 0.5184260476406786, |
| "learning_rate": 2.8240169215154977e-05, |
| "loss": 0.1692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1595619022846222, |
| "step": 1890, |
| "valid_targets_mean": 5334.9, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 3.007936507936508, |
| "grad_norm": 0.3405314330974361, |
| "learning_rate": 2.8167982006653196e-05, |
| "loss": 0.1623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15521922707557678, |
| "step": 1895, |
| "valid_targets_mean": 6951.9, |
| "valid_targets_min": 3834 |
| }, |
| { |
| "epoch": 3.015873015873016, |
| "grad_norm": 0.44531826407382213, |
| "learning_rate": 2.8095666862447876e-05, |
| "loss": 0.161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18891948461532593, |
| "step": 1900, |
| "valid_targets_mean": 5601.6, |
| "valid_targets_min": 2266 |
| }, |
| { |
| "epoch": 3.0238095238095237, |
| "grad_norm": 0.3667355362457471, |
| "learning_rate": 2.8023224915216442e-05, |
| "loss": 0.1613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13565120100975037, |
| "step": 1905, |
| "valid_targets_mean": 6374.4, |
| "valid_targets_min": 1807 |
| }, |
| { |
| "epoch": 3.0317460317460316, |
| "grad_norm": 0.36488467668267915, |
| "learning_rate": 2.795065729962244e-05, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15088070929050446, |
| "step": 1910, |
| "valid_targets_mean": 6743.3, |
| "valid_targets_min": 3371 |
| }, |
| { |
| "epoch": 3.0396825396825395, |
| "grad_norm": 0.5240072304479968, |
| "learning_rate": 2.7877965152297785e-05, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16858817636966705, |
| "step": 1915, |
| "valid_targets_mean": 5218.3, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 3.0476190476190474, |
| "grad_norm": 0.4345088557078499, |
| "learning_rate": 2.780514961182492e-05, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18977370858192444, |
| "step": 1920, |
| "valid_targets_mean": 6161.9, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 3.0555555555555554, |
| "grad_norm": 0.43067510343421206, |
| "learning_rate": 2.773221181871903e-05, |
| "loss": 0.145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15231278538703918, |
| "step": 1925, |
| "valid_targets_mean": 5256.0, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 3.0634920634920633, |
| "grad_norm": 0.4329109482212343, |
| "learning_rate": 2.765915291541013e-05, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1648765504360199, |
| "step": 1930, |
| "valid_targets_mean": 5768.6, |
| "valid_targets_min": 2664 |
| }, |
| { |
| "epoch": 3.0714285714285716, |
| "grad_norm": 0.4360393225780438, |
| "learning_rate": 2.7585974046225206e-05, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16902469098567963, |
| "step": 1935, |
| "valid_targets_mean": 4864.1, |
| "valid_targets_min": 1763 |
| }, |
| { |
| "epoch": 3.0793650793650795, |
| "grad_norm": 0.42242563176181436, |
| "learning_rate": 2.751267635737027e-05, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15772101283073425, |
| "step": 1940, |
| "valid_targets_mean": 5512.9, |
| "valid_targets_min": 340 |
| }, |
| { |
| "epoch": 3.0873015873015874, |
| "grad_norm": 0.38359983981254425, |
| "learning_rate": 2.7439260996912423e-05, |
| "loss": 0.1646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.171489417552948, |
| "step": 1945, |
| "valid_targets_mean": 5938.1, |
| "valid_targets_min": 2752 |
| }, |
| { |
| "epoch": 3.0952380952380953, |
| "grad_norm": 0.41322753491472525, |
| "learning_rate": 2.7365729114761862e-05, |
| "loss": 0.1582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15758131444454193, |
| "step": 1950, |
| "valid_targets_mean": 5200.1, |
| "valid_targets_min": 370 |
| }, |
| { |
| "epoch": 3.1031746031746033, |
| "grad_norm": 0.4186192867390412, |
| "learning_rate": 2.729208186265386e-05, |
| "loss": 0.1546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14994092285633087, |
| "step": 1955, |
| "valid_targets_mean": 5166.9, |
| "valid_targets_min": 251 |
| }, |
| { |
| "epoch": 3.111111111111111, |
| "grad_norm": 0.3644255779428956, |
| "learning_rate": 2.721832039413077e-05, |
| "loss": 0.1513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14574278891086578, |
| "step": 1960, |
| "valid_targets_mean": 6365.3, |
| "valid_targets_min": 1939 |
| }, |
| { |
| "epoch": 3.119047619047619, |
| "grad_norm": 0.41549829471711147, |
| "learning_rate": 2.7144445864523887e-05, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15822090208530426, |
| "step": 1965, |
| "valid_targets_mean": 5193.6, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 3.126984126984127, |
| "grad_norm": 0.4080754517778744, |
| "learning_rate": 2.7070459430935407e-05, |
| "loss": 0.1743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18438664078712463, |
| "step": 1970, |
| "valid_targets_mean": 6076.5, |
| "valid_targets_min": 366 |
| }, |
| { |
| "epoch": 3.134920634920635, |
| "grad_norm": 0.34845655756539395, |
| "learning_rate": 2.69963622522203e-05, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1505107879638672, |
| "step": 1975, |
| "valid_targets_mean": 7000.2, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 3.142857142857143, |
| "grad_norm": 0.3957443526395654, |
| "learning_rate": 2.6922155488968117e-05, |
| "loss": 0.1558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15863436460494995, |
| "step": 1980, |
| "valid_targets_mean": 6114.2, |
| "valid_targets_min": 1754 |
| }, |
| { |
| "epoch": 3.1507936507936507, |
| "grad_norm": 0.3987157816987954, |
| "learning_rate": 2.684784030348486e-05, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1591426432132721, |
| "step": 1985, |
| "valid_targets_mean": 5729.1, |
| "valid_targets_min": 2795 |
| }, |
| { |
| "epoch": 3.1587301587301586, |
| "grad_norm": 0.3311471215567983, |
| "learning_rate": 2.6773417859774755e-05, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13412167131900787, |
| "step": 1990, |
| "valid_targets_mean": 7218.6, |
| "valid_targets_min": 5066 |
| }, |
| { |
| "epoch": 3.1666666666666665, |
| "grad_norm": 0.44452141015453234, |
| "learning_rate": 2.669888932352201e-05, |
| "loss": 0.1525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14640459418296814, |
| "step": 1995, |
| "valid_targets_mean": 4116.0, |
| "valid_targets_min": 582 |
| }, |
| { |
| "epoch": 3.1746031746031744, |
| "grad_norm": 0.4296245823041024, |
| "learning_rate": 2.662425586207259e-05, |
| "loss": 0.1587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18060961365699768, |
| "step": 2000, |
| "valid_targets_mean": 5717.8, |
| "valid_targets_min": 2684 |
| }, |
| { |
| "epoch": 3.1825396825396823, |
| "grad_norm": 0.44161933967338207, |
| "learning_rate": 2.6549518644415876e-05, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13894905149936676, |
| "step": 2005, |
| "valid_targets_mean": 5385.4, |
| "valid_targets_min": 1651 |
| }, |
| { |
| "epoch": 3.1904761904761907, |
| "grad_norm": 0.4402027862054312, |
| "learning_rate": 2.6474678841166426e-05, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15985198318958282, |
| "step": 2010, |
| "valid_targets_mean": 4908.7, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 3.1984126984126986, |
| "grad_norm": 0.4521093840332604, |
| "learning_rate": 2.639973762454558e-05, |
| "loss": 0.1565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17308469116687775, |
| "step": 2015, |
| "valid_targets_mean": 5940.6, |
| "valid_targets_min": 2224 |
| }, |
| { |
| "epoch": 3.2063492063492065, |
| "grad_norm": 0.44949779778305143, |
| "learning_rate": 2.6324696168363134e-05, |
| "loss": 0.1588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16031065583229065, |
| "step": 2020, |
| "valid_targets_mean": 4588.2, |
| "valid_targets_min": 1570 |
| }, |
| { |
| "epoch": 3.2142857142857144, |
| "grad_norm": 0.44736879299802484, |
| "learning_rate": 2.624955564799894e-05, |
| "loss": 0.1687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18750852346420288, |
| "step": 2025, |
| "valid_targets_mean": 4769.4, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 3.2222222222222223, |
| "grad_norm": 0.4063469374069734, |
| "learning_rate": 2.617431724038451e-05, |
| "loss": 0.1592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15944424271583557, |
| "step": 2030, |
| "valid_targets_mean": 5581.2, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 3.2301587301587302, |
| "grad_norm": 0.4237562908407849, |
| "learning_rate": 2.609898212398455e-05, |
| "loss": 0.1532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15621069073677063, |
| "step": 2035, |
| "valid_targets_mean": 5366.9, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 3.238095238095238, |
| "grad_norm": 0.39370444783531333, |
| "learning_rate": 2.6023551478778535e-05, |
| "loss": 0.1508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14452454447746277, |
| "step": 2040, |
| "valid_targets_mean": 5937.5, |
| "valid_targets_min": 225 |
| }, |
| { |
| "epoch": 3.246031746031746, |
| "grad_norm": 0.49270720514980915, |
| "learning_rate": 2.5948026486242225e-05, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1724134087562561, |
| "step": 2045, |
| "valid_targets_mean": 3770.9, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 3.253968253968254, |
| "grad_norm": 0.4577588443456724, |
| "learning_rate": 2.5872408329329136e-05, |
| "loss": 0.1606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13135287165641785, |
| "step": 2050, |
| "valid_targets_mean": 5848.4, |
| "valid_targets_min": 2027 |
| }, |
| { |
| "epoch": 3.261904761904762, |
| "grad_norm": 0.44271121122885954, |
| "learning_rate": 2.5796698192452016e-05, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16199621558189392, |
| "step": 2055, |
| "valid_targets_mean": 4766.6, |
| "valid_targets_min": 404 |
| }, |
| { |
| "epoch": 3.2698412698412698, |
| "grad_norm": 0.39031087916457097, |
| "learning_rate": 2.572089726146432e-05, |
| "loss": 0.1632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16037863492965698, |
| "step": 2060, |
| "valid_targets_mean": 5805.1, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 3.2777777777777777, |
| "grad_norm": 0.4646573659873822, |
| "learning_rate": 2.564500672364162e-05, |
| "loss": 0.1647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.162231907248497, |
| "step": 2065, |
| "valid_targets_mean": 4860.0, |
| "valid_targets_min": 260 |
| }, |
| { |
| "epoch": 3.2857142857142856, |
| "grad_norm": 0.3990327001371696, |
| "learning_rate": 2.556902776766298e-05, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15069621801376343, |
| "step": 2070, |
| "valid_targets_mean": 5909.9, |
| "valid_targets_min": 1698 |
| }, |
| { |
| "epoch": 3.2936507936507935, |
| "grad_norm": 0.43271648198961715, |
| "learning_rate": 2.5492961583592397e-05, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.170293927192688, |
| "step": 2075, |
| "valid_targets_mean": 5133.9, |
| "valid_targets_min": 1647 |
| }, |
| { |
| "epoch": 3.3015873015873014, |
| "grad_norm": 0.44977807483400484, |
| "learning_rate": 2.5416809362860107e-05, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18963780999183655, |
| "step": 2080, |
| "valid_targets_mean": 4750.8, |
| "valid_targets_min": 559 |
| }, |
| { |
| "epoch": 3.3095238095238093, |
| "grad_norm": 0.3681715462106892, |
| "learning_rate": 2.5340572298243946e-05, |
| "loss": 0.1484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1364738941192627, |
| "step": 2085, |
| "valid_targets_mean": 6450.1, |
| "valid_targets_min": 4105 |
| }, |
| { |
| "epoch": 3.317460317460317, |
| "grad_norm": 0.45380051213619826, |
| "learning_rate": 2.5264251583850677e-05, |
| "loss": 0.1728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1766563057899475, |
| "step": 2090, |
| "valid_targets_mean": 4932.4, |
| "valid_targets_min": 342 |
| }, |
| { |
| "epoch": 3.3253968253968256, |
| "grad_norm": 0.34929908788411107, |
| "learning_rate": 2.518784841509726e-05, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.142880380153656, |
| "step": 2095, |
| "valid_targets_mean": 7236.7, |
| "valid_targets_min": 3519 |
| }, |
| { |
| "epoch": 3.3333333333333335, |
| "grad_norm": 0.42494242702127294, |
| "learning_rate": 2.511136398869216e-05, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1457439363002777, |
| "step": 2100, |
| "valid_targets_mean": 5273.4, |
| "valid_targets_min": 2522 |
| }, |
| { |
| "epoch": 3.3412698412698414, |
| "grad_norm": 0.41871282992961945, |
| "learning_rate": 2.503479950261658e-05, |
| "loss": 0.1564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14400547742843628, |
| "step": 2105, |
| "valid_targets_mean": 5479.6, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 3.3492063492063493, |
| "grad_norm": 0.41199941257756795, |
| "learning_rate": 2.4958156156105693e-05, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16985690593719482, |
| "step": 2110, |
| "valid_targets_mean": 5431.3, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 3.357142857142857, |
| "grad_norm": 0.41511677551741843, |
| "learning_rate": 2.4881435149629892e-05, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15738296508789062, |
| "step": 2115, |
| "valid_targets_mean": 5947.6, |
| "valid_targets_min": 1723 |
| }, |
| { |
| "epoch": 3.365079365079365, |
| "grad_norm": 0.3658736974288424, |
| "learning_rate": 2.4804637684875937e-05, |
| "loss": 0.1643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1301427185535431, |
| "step": 2120, |
| "valid_targets_mean": 7314.8, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 3.373015873015873, |
| "grad_norm": 0.4048532254523095, |
| "learning_rate": 2.4727764964728177e-05, |
| "loss": 0.1538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15161439776420593, |
| "step": 2125, |
| "valid_targets_mean": 5149.5, |
| "valid_targets_min": 2014 |
| }, |
| { |
| "epoch": 3.380952380952381, |
| "grad_norm": 0.3829760082289399, |
| "learning_rate": 2.4650818193249693e-05, |
| "loss": 0.1596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14068162441253662, |
| "step": 2130, |
| "valid_targets_mean": 5836.1, |
| "valid_targets_min": 1685 |
| }, |
| { |
| "epoch": 3.388888888888889, |
| "grad_norm": 0.4507430940791641, |
| "learning_rate": 2.4573798575663425e-05, |
| "loss": 0.1671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16859221458435059, |
| "step": 2135, |
| "valid_targets_mean": 5247.2, |
| "valid_targets_min": 311 |
| }, |
| { |
| "epoch": 3.3968253968253967, |
| "grad_norm": 0.47784011418612515, |
| "learning_rate": 2.4496707318333323e-05, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.176387220621109, |
| "step": 2140, |
| "valid_targets_mean": 4379.1, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 3.4047619047619047, |
| "grad_norm": 0.41751426715134293, |
| "learning_rate": 2.441954562874541e-05, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1648518145084381, |
| "step": 2145, |
| "valid_targets_mean": 5245.0, |
| "valid_targets_min": 1607 |
| }, |
| { |
| "epoch": 3.4126984126984126, |
| "grad_norm": 0.34417394477532504, |
| "learning_rate": 2.434231471548893e-05, |
| "loss": 0.1565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16924996674060822, |
| "step": 2150, |
| "valid_targets_mean": 7679.7, |
| "valid_targets_min": 4644 |
| }, |
| { |
| "epoch": 3.4206349206349205, |
| "grad_norm": 0.4099313742801725, |
| "learning_rate": 2.4265015788237348e-05, |
| "loss": 0.1638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1553308665752411, |
| "step": 2155, |
| "valid_targets_mean": 5291.8, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 3.4285714285714284, |
| "grad_norm": 0.3644179150651529, |
| "learning_rate": 2.4187650057729465e-05, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13109582662582397, |
| "step": 2160, |
| "valid_targets_mean": 6145.5, |
| "valid_targets_min": 395 |
| }, |
| { |
| "epoch": 3.4365079365079367, |
| "grad_norm": 0.4344903235604141, |
| "learning_rate": 2.4110218735750403e-05, |
| "loss": 0.1547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16567984223365784, |
| "step": 2165, |
| "valid_targets_mean": 5219.4, |
| "valid_targets_min": 272 |
| }, |
| { |
| "epoch": 3.4444444444444446, |
| "grad_norm": 0.44162025985134756, |
| "learning_rate": 2.4032723035112667e-05, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17561107873916626, |
| "step": 2170, |
| "valid_targets_mean": 4544.6, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 3.4523809523809526, |
| "grad_norm": 0.3932602300074192, |
| "learning_rate": 2.3955164169637124e-05, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15324220061302185, |
| "step": 2175, |
| "valid_targets_mean": 5706.5, |
| "valid_targets_min": 347 |
| }, |
| { |
| "epoch": 3.4603174603174605, |
| "grad_norm": 0.42827386189990235, |
| "learning_rate": 2.387754335413398e-05, |
| "loss": 0.1606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15386894345283508, |
| "step": 2180, |
| "valid_targets_mean": 4324.1, |
| "valid_targets_min": 373 |
| }, |
| { |
| "epoch": 3.4682539682539684, |
| "grad_norm": 0.41357075683918504, |
| "learning_rate": 2.3799861804383807e-05, |
| "loss": 0.1632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15950973331928253, |
| "step": 2185, |
| "valid_targets_mean": 5571.4, |
| "valid_targets_min": 1700 |
| }, |
| { |
| "epoch": 3.4761904761904763, |
| "grad_norm": 0.4041812547912995, |
| "learning_rate": 2.3722120737118414e-05, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1401449292898178, |
| "step": 2190, |
| "valid_targets_mean": 5355.0, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 3.484126984126984, |
| "grad_norm": 0.4349818563348464, |
| "learning_rate": 2.3644321370001868e-05, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16082270443439484, |
| "step": 2195, |
| "valid_targets_mean": 4887.8, |
| "valid_targets_min": 201 |
| }, |
| { |
| "epoch": 3.492063492063492, |
| "grad_norm": 0.41308220488892183, |
| "learning_rate": 2.3566464921611393e-05, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16265086829662323, |
| "step": 2200, |
| "valid_targets_mean": 5437.2, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 3.5, |
| "grad_norm": 0.4212037346610392, |
| "learning_rate": 2.348855261141827e-05, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16348662972450256, |
| "step": 2205, |
| "valid_targets_mean": 4889.4, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 3.507936507936508, |
| "grad_norm": 0.4704570906062029, |
| "learning_rate": 2.341058565976874e-05, |
| "loss": 0.1644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20820948481559753, |
| "step": 2210, |
| "valid_targets_mean": 5980.6, |
| "valid_targets_min": 961 |
| }, |
| { |
| "epoch": 3.515873015873016, |
| "grad_norm": 0.5036481968595117, |
| "learning_rate": 2.3332565287864918e-05, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15473511815071106, |
| "step": 2215, |
| "valid_targets_mean": 5321.4, |
| "valid_targets_min": 1443 |
| }, |
| { |
| "epoch": 3.5238095238095237, |
| "grad_norm": 0.3735233109636718, |
| "learning_rate": 2.325449271774563e-05, |
| "loss": 0.1555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14910230040550232, |
| "step": 2220, |
| "valid_targets_mean": 6132.2, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 3.5317460317460316, |
| "grad_norm": 0.444413935820999, |
| "learning_rate": 2.3176369172267286e-05, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17016586661338806, |
| "step": 2225, |
| "valid_targets_mean": 4620.8, |
| "valid_targets_min": 1621 |
| }, |
| { |
| "epoch": 3.5396825396825395, |
| "grad_norm": 0.3953957921849172, |
| "learning_rate": 2.3098195875084732e-05, |
| "loss": 0.1598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15769408643245697, |
| "step": 2230, |
| "valid_targets_mean": 5690.9, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 3.5476190476190474, |
| "grad_norm": 0.5077199865444484, |
| "learning_rate": 2.301997405063208e-05, |
| "loss": 0.1739, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15993595123291016, |
| "step": 2235, |
| "valid_targets_mean": 5084.5, |
| "valid_targets_min": 281 |
| }, |
| { |
| "epoch": 3.5555555555555554, |
| "grad_norm": 0.4086230414672359, |
| "learning_rate": 2.2941704924103535e-05, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1494399756193161, |
| "step": 2240, |
| "valid_targets_mean": 5467.4, |
| "valid_targets_min": 327 |
| }, |
| { |
| "epoch": 3.5634920634920633, |
| "grad_norm": 0.42370220867636965, |
| "learning_rate": 2.2863389721434165e-05, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16436323523521423, |
| "step": 2245, |
| "valid_targets_mean": 6613.1, |
| "valid_targets_min": 301 |
| }, |
| { |
| "epoch": 3.571428571428571, |
| "grad_norm": 0.47414264477785967, |
| "learning_rate": 2.2785029669280775e-05, |
| "loss": 0.1463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16836649179458618, |
| "step": 2250, |
| "valid_targets_mean": 4143.4, |
| "valid_targets_min": 1765 |
| }, |
| { |
| "epoch": 3.5793650793650795, |
| "grad_norm": 0.4279968424111969, |
| "learning_rate": 2.2706625995002626e-05, |
| "loss": 0.1602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15963539481163025, |
| "step": 2255, |
| "valid_targets_mean": 5683.1, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 3.5873015873015874, |
| "grad_norm": 0.43551657194367943, |
| "learning_rate": 2.262817992664224e-05, |
| "loss": 0.1558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15465790033340454, |
| "step": 2260, |
| "valid_targets_mean": 5270.2, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 3.5952380952380953, |
| "grad_norm": 0.473618019837446, |
| "learning_rate": 2.2549692692906158e-05, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19456999003887177, |
| "step": 2265, |
| "valid_targets_mean": 4033.5, |
| "valid_targets_min": 1118 |
| }, |
| { |
| "epoch": 3.6031746031746033, |
| "grad_norm": 0.4610864812937639, |
| "learning_rate": 2.24711655231457e-05, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16838069260120392, |
| "step": 2270, |
| "valid_targets_mean": 4850.8, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 3.611111111111111, |
| "grad_norm": 0.4183921042676627, |
| "learning_rate": 2.2392599647337724e-05, |
| "loss": 0.1696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15832781791687012, |
| "step": 2275, |
| "valid_targets_mean": 5614.7, |
| "valid_targets_min": 2089 |
| }, |
| { |
| "epoch": 3.619047619047619, |
| "grad_norm": 0.4746926085970967, |
| "learning_rate": 2.23139962960653e-05, |
| "loss": 0.1667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17942070960998535, |
| "step": 2280, |
| "valid_targets_mean": 4651.3, |
| "valid_targets_min": 217 |
| }, |
| { |
| "epoch": 3.626984126984127, |
| "grad_norm": 0.42504033178119727, |
| "learning_rate": 2.2235356700498528e-05, |
| "loss": 0.1622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1609695851802826, |
| "step": 2285, |
| "valid_targets_mean": 5650.9, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 3.634920634920635, |
| "grad_norm": 0.35104401078143266, |
| "learning_rate": 2.2156682092375175e-05, |
| "loss": 0.1593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14197728037834167, |
| "step": 2290, |
| "valid_targets_mean": 6449.4, |
| "valid_targets_min": 2699 |
| }, |
| { |
| "epoch": 3.642857142857143, |
| "grad_norm": 0.48629893819073916, |
| "learning_rate": 2.2077973703981423e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.171891987323761, |
| "step": 2295, |
| "valid_targets_mean": 5000.9, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 3.6507936507936507, |
| "grad_norm": 0.38982495934645944, |
| "learning_rate": 2.1999232768132552e-05, |
| "loss": 0.1622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15166640281677246, |
| "step": 2300, |
| "valid_targets_mean": 5598.8, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 3.6587301587301586, |
| "grad_norm": 0.4538805178933535, |
| "learning_rate": 2.1920460518153637e-05, |
| "loss": 0.1667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13476833701133728, |
| "step": 2305, |
| "valid_targets_mean": 4883.2, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 3.6666666666666665, |
| "grad_norm": 0.4650060205808812, |
| "learning_rate": 2.1841658187860232e-05, |
| "loss": 0.1706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1431887298822403, |
| "step": 2310, |
| "valid_targets_mean": 5863.8, |
| "valid_targets_min": 2487 |
| }, |
| { |
| "epoch": 3.674603174603175, |
| "grad_norm": 0.40827307741804697, |
| "learning_rate": 2.176282701153904e-05, |
| "loss": 0.1567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16187241673469543, |
| "step": 2315, |
| "valid_targets_mean": 5186.4, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 3.682539682539683, |
| "grad_norm": 0.40111783297909087, |
| "learning_rate": 2.1683968223928572e-05, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1610245704650879, |
| "step": 2320, |
| "valid_targets_mean": 5193.5, |
| "valid_targets_min": 2007 |
| }, |
| { |
| "epoch": 3.6904761904761907, |
| "grad_norm": 0.4108636912566655, |
| "learning_rate": 2.1605083060199835e-05, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19376526772975922, |
| "step": 2325, |
| "valid_targets_mean": 5273.6, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 3.6984126984126986, |
| "grad_norm": 0.4090720045772208, |
| "learning_rate": 2.152617275593694e-05, |
| "loss": 0.1581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1690284013748169, |
| "step": 2330, |
| "valid_targets_mean": 5263.3, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 3.7063492063492065, |
| "grad_norm": 0.37473461724981033, |
| "learning_rate": 2.144723854711781e-05, |
| "loss": 0.1513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14938317239284515, |
| "step": 2335, |
| "valid_targets_mean": 5389.9, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 3.7142857142857144, |
| "grad_norm": 0.4843387089458587, |
| "learning_rate": 2.1368281670094766e-05, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17382203042507172, |
| "step": 2340, |
| "valid_targets_mean": 4600.9, |
| "valid_targets_min": 1981 |
| }, |
| { |
| "epoch": 3.7222222222222223, |
| "grad_norm": 0.4119585290716737, |
| "learning_rate": 2.1289303361575175e-05, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15374284982681274, |
| "step": 2345, |
| "valid_targets_mean": 5633.0, |
| "valid_targets_min": 2046 |
| }, |
| { |
| "epoch": 3.7301587301587302, |
| "grad_norm": 0.3952648176140555, |
| "learning_rate": 2.121030485860211e-05, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17831559479236603, |
| "step": 2350, |
| "valid_targets_mean": 5893.4, |
| "valid_targets_min": 2787 |
| }, |
| { |
| "epoch": 3.738095238095238, |
| "grad_norm": 0.41411933208876145, |
| "learning_rate": 2.113128739853493e-05, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17142191529273987, |
| "step": 2355, |
| "valid_targets_mean": 5256.2, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 3.746031746031746, |
| "grad_norm": 0.45575184540137365, |
| "learning_rate": 2.1052252219029944e-05, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1489437222480774, |
| "step": 2360, |
| "valid_targets_mean": 5599.4, |
| "valid_targets_min": 360 |
| }, |
| { |
| "epoch": 3.753968253968254, |
| "grad_norm": 0.38228242544809465, |
| "learning_rate": 2.0973200558020967e-05, |
| "loss": 0.1561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1508997082710266, |
| "step": 2365, |
| "valid_targets_mean": 5869.1, |
| "valid_targets_min": 3409 |
| }, |
| { |
| "epoch": 3.761904761904762, |
| "grad_norm": 0.4148754628490215, |
| "learning_rate": 2.0894133653700005e-05, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1601417064666748, |
| "step": 2370, |
| "valid_targets_mean": 5959.2, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 3.7698412698412698, |
| "grad_norm": 0.39421365324647456, |
| "learning_rate": 2.0815052744497795e-05, |
| "loss": 0.1647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16802407801151276, |
| "step": 2375, |
| "valid_targets_mean": 5507.4, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 3.7777777777777777, |
| "grad_norm": 0.4179727695736473, |
| "learning_rate": 2.0735959069064434e-05, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1505141705274582, |
| "step": 2380, |
| "valid_targets_mean": 4560.2, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 3.7857142857142856, |
| "grad_norm": 0.4025223262448166, |
| "learning_rate": 2.065685386624999e-05, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16200333833694458, |
| "step": 2385, |
| "valid_targets_mean": 5546.6, |
| "valid_targets_min": 2114 |
| }, |
| { |
| "epoch": 3.7936507936507935, |
| "grad_norm": 0.42971080125523514, |
| "learning_rate": 2.0577738375085076e-05, |
| "loss": 0.1539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13847434520721436, |
| "step": 2390, |
| "valid_targets_mean": 4286.1, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 3.8015873015873014, |
| "grad_norm": 0.4040671130609569, |
| "learning_rate": 2.0498613834761462e-05, |
| "loss": 0.1709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16613656282424927, |
| "step": 2395, |
| "valid_targets_mean": 5606.1, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 3.8095238095238093, |
| "grad_norm": 0.4104422551171815, |
| "learning_rate": 2.041948148461264e-05, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16815027594566345, |
| "step": 2400, |
| "valid_targets_mean": 6071.4, |
| "valid_targets_min": 1424 |
| }, |
| { |
| "epoch": 3.817460317460317, |
| "grad_norm": 0.433862516805992, |
| "learning_rate": 2.0340342564094436e-05, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1456870138645172, |
| "step": 2405, |
| "valid_targets_mean": 4660.6, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 3.825396825396825, |
| "grad_norm": 0.37026873619906453, |
| "learning_rate": 2.0261198312765597e-05, |
| "loss": 0.1569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17130400240421295, |
| "step": 2410, |
| "valid_targets_mean": 7170.6, |
| "valid_targets_min": 3870 |
| }, |
| { |
| "epoch": 3.8333333333333335, |
| "grad_norm": 0.37774101351813544, |
| "learning_rate": 2.0182049970268355e-05, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1540232002735138, |
| "step": 2415, |
| "valid_targets_mean": 5801.1, |
| "valid_targets_min": 2004 |
| }, |
| { |
| "epoch": 3.8412698412698414, |
| "grad_norm": 0.40806762468519775, |
| "learning_rate": 2.010289877630902e-05, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1633833944797516, |
| "step": 2420, |
| "valid_targets_mean": 6180.1, |
| "valid_targets_min": 278 |
| }, |
| { |
| "epoch": 3.8492063492063493, |
| "grad_norm": 0.4658635857688465, |
| "learning_rate": 2.002374597063858e-05, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14994177222251892, |
| "step": 2425, |
| "valid_targets_mean": 5532.7, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 3.857142857142857, |
| "grad_norm": 0.48235346332409923, |
| "learning_rate": 1.9944592793033255e-05, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1955932080745697, |
| "step": 2430, |
| "valid_targets_mean": 4724.8, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 3.865079365079365, |
| "grad_norm": 0.8801286649564228, |
| "learning_rate": 1.9865440483275086e-05, |
| "loss": 0.1609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1733412742614746, |
| "step": 2435, |
| "valid_targets_mean": 5920.0, |
| "valid_targets_min": 2207 |
| }, |
| { |
| "epoch": 3.873015873015873, |
| "grad_norm": 0.4518531270411737, |
| "learning_rate": 1.978629028113254e-05, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15560846030712128, |
| "step": 2440, |
| "valid_targets_mean": 4698.5, |
| "valid_targets_min": 369 |
| }, |
| { |
| "epoch": 3.880952380952381, |
| "grad_norm": 0.4095907564342567, |
| "learning_rate": 1.9707143426341058e-05, |
| "loss": 0.1596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14006567001342773, |
| "step": 2445, |
| "valid_targets_mean": 5711.9, |
| "valid_targets_min": 1934 |
| }, |
| { |
| "epoch": 3.888888888888889, |
| "grad_norm": 0.38371188352350993, |
| "learning_rate": 1.962800115858364e-05, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15609079599380493, |
| "step": 2450, |
| "valid_targets_mean": 6032.2, |
| "valid_targets_min": 1733 |
| }, |
| { |
| "epoch": 3.8968253968253967, |
| "grad_norm": 0.4118539842920471, |
| "learning_rate": 1.9548864717471472e-05, |
| "loss": 0.1641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14997440576553345, |
| "step": 2455, |
| "valid_targets_mean": 4638.2, |
| "valid_targets_min": 2217 |
| }, |
| { |
| "epoch": 3.9047619047619047, |
| "grad_norm": 0.4025039557270683, |
| "learning_rate": 1.9469735342524454e-05, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1860060691833496, |
| "step": 2460, |
| "valid_targets_mean": 5977.4, |
| "valid_targets_min": 1525 |
| }, |
| { |
| "epoch": 3.9126984126984126, |
| "grad_norm": 0.4033220910310328, |
| "learning_rate": 1.939061427315179e-05, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1573881059885025, |
| "step": 2465, |
| "valid_targets_mean": 5562.9, |
| "valid_targets_min": 466 |
| }, |
| { |
| "epoch": 3.9206349206349205, |
| "grad_norm": 0.40909002728066796, |
| "learning_rate": 1.931150274863265e-05, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1574082374572754, |
| "step": 2470, |
| "valid_targets_mean": 5320.6, |
| "valid_targets_min": 397 |
| }, |
| { |
| "epoch": 3.928571428571429, |
| "grad_norm": 0.42869522285562844, |
| "learning_rate": 1.9232402008096643e-05, |
| "loss": 0.175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19264186918735504, |
| "step": 2475, |
| "valid_targets_mean": 5145.9, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 3.9365079365079367, |
| "grad_norm": 0.40381020748858665, |
| "learning_rate": 1.9153313290504495e-05, |
| "loss": 0.1588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13736480474472046, |
| "step": 2480, |
| "valid_targets_mean": 5991.2, |
| "valid_targets_min": 1935 |
| }, |
| { |
| "epoch": 3.9444444444444446, |
| "grad_norm": 0.44514859085692043, |
| "learning_rate": 1.9074237834628623e-05, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14704057574272156, |
| "step": 2485, |
| "valid_targets_mean": 5541.5, |
| "valid_targets_min": 2647 |
| }, |
| { |
| "epoch": 3.9523809523809526, |
| "grad_norm": 0.4265501479636169, |
| "learning_rate": 1.8995176879033698e-05, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18036606907844543, |
| "step": 2490, |
| "valid_targets_mean": 5466.8, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 3.9603174603174605, |
| "grad_norm": 0.4487206178934192, |
| "learning_rate": 1.89161316620573e-05, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17454467713832855, |
| "step": 2495, |
| "valid_targets_mean": 5006.6, |
| "valid_targets_min": 287 |
| }, |
| { |
| "epoch": 3.9682539682539684, |
| "grad_norm": 0.4033222789710387, |
| "learning_rate": 1.8837103421790486e-05, |
| "loss": 0.1582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15375812351703644, |
| "step": 2500, |
| "valid_targets_mean": 6142.2, |
| "valid_targets_min": 1358 |
| }, |
| { |
| "epoch": 3.9761904761904763, |
| "grad_norm": 0.46326929396533706, |
| "learning_rate": 1.8758093396058386e-05, |
| "loss": 0.1687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17514026165008545, |
| "step": 2505, |
| "valid_targets_mean": 5165.4, |
| "valid_targets_min": 2275 |
| }, |
| { |
| "epoch": 3.984126984126984, |
| "grad_norm": 0.40301115402832177, |
| "learning_rate": 1.8679102822400874e-05, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15668317675590515, |
| "step": 2510, |
| "valid_targets_mean": 5199.4, |
| "valid_targets_min": 211 |
| }, |
| { |
| "epoch": 3.992063492063492, |
| "grad_norm": 0.4789393713046297, |
| "learning_rate": 1.8600132938053098e-05, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19280311465263367, |
| "step": 2515, |
| "valid_targets_mean": 4916.7, |
| "valid_targets_min": 1007 |
| }, |
| { |
| "epoch": 4.0, |
| "grad_norm": 0.46667355097734303, |
| "learning_rate": 1.8521184979926177e-05, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1989072561264038, |
| "step": 2520, |
| "valid_targets_mean": 5119.9, |
| "valid_targets_min": 207 |
| }, |
| { |
| "epoch": 4.007936507936508, |
| "grad_norm": 0.3847916291760838, |
| "learning_rate": 1.8442260184587804e-05, |
| "loss": 0.1508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16161227226257324, |
| "step": 2525, |
| "valid_targets_mean": 6026.6, |
| "valid_targets_min": 2419 |
| }, |
| { |
| "epoch": 4.015873015873016, |
| "grad_norm": 0.4090621169152007, |
| "learning_rate": 1.8363359788242842e-05, |
| "loss": 0.1388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14368446171283722, |
| "step": 2530, |
| "valid_targets_mean": 5862.6, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 4.023809523809524, |
| "grad_norm": 0.6141566166940376, |
| "learning_rate": 1.8284485026714013e-05, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13589806854724884, |
| "step": 2535, |
| "valid_targets_mean": 6541.5, |
| "valid_targets_min": 1485 |
| }, |
| { |
| "epoch": 4.031746031746032, |
| "grad_norm": 0.4391239898708553, |
| "learning_rate": 1.8205637135422525e-05, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15070083737373352, |
| "step": 2540, |
| "valid_targets_mean": 5536.8, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 4.0396825396825395, |
| "grad_norm": 0.41333666376927736, |
| "learning_rate": 1.8126817349368697e-05, |
| "loss": 0.1569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1329149305820465, |
| "step": 2545, |
| "valid_targets_mean": 5577.3, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 4.0476190476190474, |
| "grad_norm": 0.42756859856165286, |
| "learning_rate": 1.8048026903112632e-05, |
| "loss": 0.1485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1718430519104004, |
| "step": 2550, |
| "valid_targets_mean": 5278.7, |
| "valid_targets_min": 1393 |
| }, |
| { |
| "epoch": 4.055555555555555, |
| "grad_norm": 0.7929559502540676, |
| "learning_rate": 1.7969267030754903e-05, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1519625186920166, |
| "step": 2555, |
| "valid_targets_mean": 4177.6, |
| "valid_targets_min": 290 |
| }, |
| { |
| "epoch": 4.063492063492063, |
| "grad_norm": 0.43339872921712147, |
| "learning_rate": 1.7890538965917184e-05, |
| "loss": 0.1359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12034216523170471, |
| "step": 2560, |
| "valid_targets_mean": 5259.5, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 4.071428571428571, |
| "grad_norm": 0.4431280646696749, |
| "learning_rate": 1.7811843941722952e-05, |
| "loss": 0.1485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16165150701999664, |
| "step": 2565, |
| "valid_targets_mean": 5233.3, |
| "valid_targets_min": 343 |
| }, |
| { |
| "epoch": 4.079365079365079, |
| "grad_norm": 0.4733813623577339, |
| "learning_rate": 1.7733183190778174e-05, |
| "loss": 0.1478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17020142078399658, |
| "step": 2570, |
| "valid_targets_mean": 4545.4, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 4.087301587301587, |
| "grad_norm": 0.4256609723968049, |
| "learning_rate": 1.7654557945151968e-05, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16018405556678772, |
| "step": 2575, |
| "valid_targets_mean": 5520.1, |
| "valid_targets_min": 2986 |
| }, |
| { |
| "epoch": 4.095238095238095, |
| "grad_norm": 0.41262793853257446, |
| "learning_rate": 1.7575969436357352e-05, |
| "loss": 0.1561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13311775028705597, |
| "step": 2580, |
| "valid_targets_mean": 5285.7, |
| "valid_targets_min": 1788 |
| }, |
| { |
| "epoch": 4.103174603174603, |
| "grad_norm": 0.45945223536796, |
| "learning_rate": 1.7497418895331934e-05, |
| "loss": 0.1438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14666880667209625, |
| "step": 2585, |
| "valid_targets_mean": 4386.4, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 4.111111111111111, |
| "grad_norm": 0.4675580885936456, |
| "learning_rate": 1.7418907552418597e-05, |
| "loss": 0.1505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15302041172981262, |
| "step": 2590, |
| "valid_targets_mean": 5458.4, |
| "valid_targets_min": 2918 |
| }, |
| { |
| "epoch": 4.119047619047619, |
| "grad_norm": 0.43934364103885165, |
| "learning_rate": 1.7340436637346315e-05, |
| "loss": 0.1473, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14084570109844208, |
| "step": 2595, |
| "valid_targets_mean": 4983.3, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 4.1269841269841265, |
| "grad_norm": 0.4164892763919611, |
| "learning_rate": 1.726200737921079e-05, |
| "loss": 0.1429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12312793731689453, |
| "step": 2600, |
| "valid_targets_mean": 6296.2, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 4.134920634920635, |
| "grad_norm": 0.4532045098767217, |
| "learning_rate": 1.718362100645527e-05, |
| "loss": 0.1453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13698981702327728, |
| "step": 2605, |
| "valid_targets_mean": 4957.6, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 4.142857142857143, |
| "grad_norm": 0.4006124579380861, |
| "learning_rate": 1.710527874685129e-05, |
| "loss": 0.1497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13815411925315857, |
| "step": 2610, |
| "valid_targets_mean": 6126.5, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 4.150793650793651, |
| "grad_norm": 0.4714675135702414, |
| "learning_rate": 1.702698182747942e-05, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14571262896060944, |
| "step": 2615, |
| "valid_targets_mean": 4147.3, |
| "valid_targets_min": 284 |
| }, |
| { |
| "epoch": 4.158730158730159, |
| "grad_norm": 0.42920831749050425, |
| "learning_rate": 1.6948731474710075e-05, |
| "loss": 0.1328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13257333636283875, |
| "step": 2620, |
| "valid_targets_mean": 5335.2, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 4.166666666666667, |
| "grad_norm": 0.48356837750736714, |
| "learning_rate": 1.68705289141843e-05, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1508401334285736, |
| "step": 2625, |
| "valid_targets_mean": 6277.6, |
| "valid_targets_min": 2995 |
| }, |
| { |
| "epoch": 4.174603174603175, |
| "grad_norm": 0.4755928358851968, |
| "learning_rate": 1.679237537079454e-05, |
| "loss": 0.1413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14255402982234955, |
| "step": 2630, |
| "valid_targets_mean": 4744.4, |
| "valid_targets_min": 466 |
| }, |
| { |
| "epoch": 4.182539682539683, |
| "grad_norm": 0.41585215382481877, |
| "learning_rate": 1.6714272068665526e-05, |
| "loss": 0.1503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13894084095954895, |
| "step": 2635, |
| "valid_targets_mean": 5902.4, |
| "valid_targets_min": 838 |
| }, |
| { |
| "epoch": 4.190476190476191, |
| "grad_norm": 0.4189696451329358, |
| "learning_rate": 1.663622023113501e-05, |
| "loss": 0.1598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1487642228603363, |
| "step": 2640, |
| "valid_targets_mean": 6358.3, |
| "valid_targets_min": 3083 |
| }, |
| { |
| "epoch": 4.198412698412699, |
| "grad_norm": 0.44087488345238157, |
| "learning_rate": 1.655822108073467e-05, |
| "loss": 0.1503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14662505686283112, |
| "step": 2645, |
| "valid_targets_mean": 5523.2, |
| "valid_targets_min": 1561 |
| }, |
| { |
| "epoch": 4.2063492063492065, |
| "grad_norm": 0.47060099939704136, |
| "learning_rate": 1.648027583917095e-05, |
| "loss": 0.1427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13752037286758423, |
| "step": 2650, |
| "valid_targets_mean": 5949.6, |
| "valid_targets_min": 2002 |
| }, |
| { |
| "epoch": 4.214285714285714, |
| "grad_norm": 0.4223944809526827, |
| "learning_rate": 1.640238572730591e-05, |
| "loss": 0.1464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14241717755794525, |
| "step": 2655, |
| "valid_targets_mean": 5939.1, |
| "valid_targets_min": 1808 |
| }, |
| { |
| "epoch": 4.222222222222222, |
| "grad_norm": 0.3989848199161138, |
| "learning_rate": 1.632455196513809e-05, |
| "loss": 0.1457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15084542334079742, |
| "step": 2660, |
| "valid_targets_mean": 6282.1, |
| "valid_targets_min": 3096 |
| }, |
| { |
| "epoch": 4.23015873015873, |
| "grad_norm": 0.4334279841268595, |
| "learning_rate": 1.624677577178345e-05, |
| "loss": 0.1518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15273742377758026, |
| "step": 2665, |
| "valid_targets_mean": 5628.8, |
| "valid_targets_min": 2067 |
| }, |
| { |
| "epoch": 4.238095238095238, |
| "grad_norm": 0.5090603717967935, |
| "learning_rate": 1.616905836545624e-05, |
| "loss": 0.1463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14674241840839386, |
| "step": 2670, |
| "valid_targets_mean": 4538.6, |
| "valid_targets_min": 294 |
| }, |
| { |
| "epoch": 4.246031746031746, |
| "grad_norm": 0.40233869436893316, |
| "learning_rate": 1.6091400963449894e-05, |
| "loss": 0.1499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16291236877441406, |
| "step": 2675, |
| "valid_targets_mean": 5911.8, |
| "valid_targets_min": 1450 |
| }, |
| { |
| "epoch": 4.253968253968254, |
| "grad_norm": 0.46919428409154407, |
| "learning_rate": 1.6013804782118043e-05, |
| "loss": 0.1523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15669263899326324, |
| "step": 2680, |
| "valid_targets_mean": 4653.7, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 4.261904761904762, |
| "grad_norm": 0.46975419177737526, |
| "learning_rate": 1.5936271036855372e-05, |
| "loss": 0.155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15147748589515686, |
| "step": 2685, |
| "valid_targets_mean": 6341.4, |
| "valid_targets_min": 3029 |
| }, |
| { |
| "epoch": 4.26984126984127, |
| "grad_norm": 0.416023668049094, |
| "learning_rate": 1.585880094207864e-05, |
| "loss": 0.1493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15425267815589905, |
| "step": 2690, |
| "valid_targets_mean": 5568.8, |
| "valid_targets_min": 2137 |
| }, |
| { |
| "epoch": 4.277777777777778, |
| "grad_norm": 0.48941294002103736, |
| "learning_rate": 1.5781395711207664e-05, |
| "loss": 0.1483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16209441423416138, |
| "step": 2695, |
| "valid_targets_mean": 5182.4, |
| "valid_targets_min": 3065 |
| }, |
| { |
| "epoch": 4.285714285714286, |
| "grad_norm": 0.4233678017768594, |
| "learning_rate": 1.5704056556646255e-05, |
| "loss": 0.1486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15272748470306396, |
| "step": 2700, |
| "valid_targets_mean": 6165.9, |
| "valid_targets_min": 289 |
| }, |
| { |
| "epoch": 4.2936507936507935, |
| "grad_norm": 0.4883272680118086, |
| "learning_rate": 1.562678468976329e-05, |
| "loss": 0.1558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14731578528881073, |
| "step": 2705, |
| "valid_targets_mean": 3793.1, |
| "valid_targets_min": 268 |
| }, |
| { |
| "epoch": 4.301587301587301, |
| "grad_norm": 0.4278181836239168, |
| "learning_rate": 1.5549581320873715e-05, |
| "loss": 0.1442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14064767956733704, |
| "step": 2710, |
| "valid_targets_mean": 6504.5, |
| "valid_targets_min": 2638 |
| }, |
| { |
| "epoch": 4.309523809523809, |
| "grad_norm": 0.44190091334584447, |
| "learning_rate": 1.5472447659219573e-05, |
| "loss": 0.1501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1606476753950119, |
| "step": 2715, |
| "valid_targets_mean": 5205.2, |
| "valid_targets_min": 1350 |
| }, |
| { |
| "epoch": 4.317460317460317, |
| "grad_norm": 0.4287418443341925, |
| "learning_rate": 1.5395384912951096e-05, |
| "loss": 0.1558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.143661230802536, |
| "step": 2720, |
| "valid_targets_mean": 5759.1, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 4.325396825396825, |
| "grad_norm": 0.431052688233739, |
| "learning_rate": 1.531839428910774e-05, |
| "loss": 0.1431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13569197058677673, |
| "step": 2725, |
| "valid_targets_mean": 5779.1, |
| "valid_targets_min": 2902 |
| }, |
| { |
| "epoch": 4.333333333333333, |
| "grad_norm": 0.4462658898939222, |
| "learning_rate": 1.5241476993599318e-05, |
| "loss": 0.1399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15712681412696838, |
| "step": 2730, |
| "valid_targets_mean": 5659.5, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 4.341269841269841, |
| "grad_norm": 0.4365063885634691, |
| "learning_rate": 1.5164634231187106e-05, |
| "loss": 0.1418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14231045544147491, |
| "step": 2735, |
| "valid_targets_mean": 5411.6, |
| "valid_targets_min": 1293 |
| }, |
| { |
| "epoch": 4.349206349206349, |
| "grad_norm": 0.3675606877485401, |
| "learning_rate": 1.5087867205464933e-05, |
| "loss": 0.1409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12964603304862976, |
| "step": 2740, |
| "valid_targets_mean": 6364.4, |
| "valid_targets_min": 281 |
| }, |
| { |
| "epoch": 4.357142857142857, |
| "grad_norm": 0.44160911003260395, |
| "learning_rate": 1.5011177118840376e-05, |
| "loss": 0.1414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1406039297580719, |
| "step": 2745, |
| "valid_targets_mean": 5633.9, |
| "valid_targets_min": 403 |
| }, |
| { |
| "epoch": 4.365079365079365, |
| "grad_norm": 0.45789145016787364, |
| "learning_rate": 1.4934565172515917e-05, |
| "loss": 0.1638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16867199540138245, |
| "step": 2750, |
| "valid_targets_mean": 4970.6, |
| "valid_targets_min": 2561 |
| }, |
| { |
| "epoch": 4.3730158730158735, |
| "grad_norm": 0.41734019364461133, |
| "learning_rate": 1.4858032566470107e-05, |
| "loss": 0.1429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14065919816493988, |
| "step": 2755, |
| "valid_targets_mean": 6324.4, |
| "valid_targets_min": 2455 |
| }, |
| { |
| "epoch": 4.380952380952381, |
| "grad_norm": 0.40415096511524873, |
| "learning_rate": 1.4781580499438794e-05, |
| "loss": 0.1518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13654825091362, |
| "step": 2760, |
| "valid_targets_mean": 5964.2, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 4.388888888888889, |
| "grad_norm": 0.40778882084936363, |
| "learning_rate": 1.4705210168896327e-05, |
| "loss": 0.1517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12639005482196808, |
| "step": 2765, |
| "valid_targets_mean": 5996.9, |
| "valid_targets_min": 2114 |
| }, |
| { |
| "epoch": 4.396825396825397, |
| "grad_norm": 0.44063352236267495, |
| "learning_rate": 1.462892277103681e-05, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14338403940200806, |
| "step": 2770, |
| "valid_targets_mean": 5152.0, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 4.404761904761905, |
| "grad_norm": 0.3874565040882736, |
| "learning_rate": 1.455271950075539e-05, |
| "loss": 0.1383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14000162482261658, |
| "step": 2775, |
| "valid_targets_mean": 5943.4, |
| "valid_targets_min": 3591 |
| }, |
| { |
| "epoch": 4.412698412698413, |
| "grad_norm": 0.3941349722942052, |
| "learning_rate": 1.4476601551629493e-05, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1478402018547058, |
| "step": 2780, |
| "valid_targets_mean": 6708.7, |
| "valid_targets_min": 3502 |
| }, |
| { |
| "epoch": 4.420634920634921, |
| "grad_norm": 0.41875630131970193, |
| "learning_rate": 1.4400570115900147e-05, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15849897265434265, |
| "step": 2785, |
| "valid_targets_mean": 5522.6, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 4.428571428571429, |
| "grad_norm": 0.5412264352868692, |
| "learning_rate": 1.4324626384453345e-05, |
| "loss": 0.1476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12859734892845154, |
| "step": 2790, |
| "valid_targets_mean": 4754.4, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 4.436507936507937, |
| "grad_norm": 0.42316575140054596, |
| "learning_rate": 1.4248771546801339e-05, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14226463437080383, |
| "step": 2795, |
| "valid_targets_mean": 5423.4, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 4.444444444444445, |
| "grad_norm": 0.431013383627872, |
| "learning_rate": 1.4173006791064023e-05, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14574524760246277, |
| "step": 2800, |
| "valid_targets_mean": 5876.1, |
| "valid_targets_min": 2317 |
| }, |
| { |
| "epoch": 4.4523809523809526, |
| "grad_norm": 0.4037541081664408, |
| "learning_rate": 1.4097333303950368e-05, |
| "loss": 0.153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1440451443195343, |
| "step": 2805, |
| "valid_targets_mean": 5450.2, |
| "valid_targets_min": 1747 |
| }, |
| { |
| "epoch": 4.4603174603174605, |
| "grad_norm": 0.3978151834112168, |
| "learning_rate": 1.4021752270739759e-05, |
| "loss": 0.1533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14280155301094055, |
| "step": 2810, |
| "valid_targets_mean": 6047.3, |
| "valid_targets_min": 2885 |
| }, |
| { |
| "epoch": 4.468253968253968, |
| "grad_norm": 0.39606766776930213, |
| "learning_rate": 1.3946264875263485e-05, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13499273359775543, |
| "step": 2815, |
| "valid_targets_mean": 5398.1, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 4.476190476190476, |
| "grad_norm": 0.41951195439714245, |
| "learning_rate": 1.3870872299886184e-05, |
| "loss": 0.1522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15680038928985596, |
| "step": 2820, |
| "valid_targets_mean": 6016.8, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 4.484126984126984, |
| "grad_norm": 0.6264261787683508, |
| "learning_rate": 1.3795575725487303e-05, |
| "loss": 0.1435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16164864599704742, |
| "step": 2825, |
| "valid_targets_mean": 5240.9, |
| "valid_targets_min": 1700 |
| }, |
| { |
| "epoch": 4.492063492063492, |
| "grad_norm": 0.8311634034364538, |
| "learning_rate": 1.3720376331442652e-05, |
| "loss": 0.1527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18453676998615265, |
| "step": 2830, |
| "valid_targets_mean": 6361.3, |
| "valid_targets_min": 3395 |
| }, |
| { |
| "epoch": 4.5, |
| "grad_norm": 0.42732218297283503, |
| "learning_rate": 1.364527529560586e-05, |
| "loss": 0.1537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15269696712493896, |
| "step": 2835, |
| "valid_targets_mean": 5456.8, |
| "valid_targets_min": 297 |
| }, |
| { |
| "epoch": 4.507936507936508, |
| "grad_norm": 0.39922258358961354, |
| "learning_rate": 1.3570273794289978e-05, |
| "loss": 0.1582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15746167302131653, |
| "step": 2840, |
| "valid_targets_mean": 5865.9, |
| "valid_targets_min": 1646 |
| }, |
| { |
| "epoch": 4.515873015873016, |
| "grad_norm": 0.4249607848655103, |
| "learning_rate": 1.3495373002249061e-05, |
| "loss": 0.1431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14502134919166565, |
| "step": 2845, |
| "valid_targets_mean": 5561.5, |
| "valid_targets_min": 2046 |
| }, |
| { |
| "epoch": 4.523809523809524, |
| "grad_norm": 0.45992538161194857, |
| "learning_rate": 1.3420574092659713e-05, |
| "loss": 0.1507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13943564891815186, |
| "step": 2850, |
| "valid_targets_mean": 4809.2, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 4.531746031746032, |
| "grad_norm": 0.4849743503805474, |
| "learning_rate": 1.3345878237102766e-05, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.140847310423851, |
| "step": 2855, |
| "valid_targets_mean": 4423.5, |
| "valid_targets_min": 566 |
| }, |
| { |
| "epoch": 4.5396825396825395, |
| "grad_norm": 0.4337324469927627, |
| "learning_rate": 1.3271286605544906e-05, |
| "loss": 0.1446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1428968906402588, |
| "step": 2860, |
| "valid_targets_mean": 5831.9, |
| "valid_targets_min": 1871 |
| }, |
| { |
| "epoch": 4.5476190476190474, |
| "grad_norm": 0.46560324944354126, |
| "learning_rate": 1.3196800366320357e-05, |
| "loss": 0.1486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14274823665618896, |
| "step": 2865, |
| "valid_targets_mean": 4730.6, |
| "valid_targets_min": 283 |
| }, |
| { |
| "epoch": 4.555555555555555, |
| "grad_norm": 0.44153707002684167, |
| "learning_rate": 1.3122420686112554e-05, |
| "loss": 0.1528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14780506491661072, |
| "step": 2870, |
| "valid_targets_mean": 4814.2, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 4.563492063492063, |
| "grad_norm": 0.4539431427613466, |
| "learning_rate": 1.3048148729935917e-05, |
| "loss": 0.1518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18015024065971375, |
| "step": 2875, |
| "valid_targets_mean": 5631.1, |
| "valid_targets_min": 275 |
| }, |
| { |
| "epoch": 4.571428571428571, |
| "grad_norm": 0.42536670553586153, |
| "learning_rate": 1.297398566111756e-05, |
| "loss": 0.1435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14803089201450348, |
| "step": 2880, |
| "valid_targets_mean": 5638.5, |
| "valid_targets_min": 2487 |
| }, |
| { |
| "epoch": 4.579365079365079, |
| "grad_norm": 0.42937048670828487, |
| "learning_rate": 1.2899932641279082e-05, |
| "loss": 0.149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13798286020755768, |
| "step": 2885, |
| "valid_targets_mean": 4947.8, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 4.587301587301587, |
| "grad_norm": 0.4404250376238387, |
| "learning_rate": 1.2825990830318395e-05, |
| "loss": 0.1533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17519637942314148, |
| "step": 2890, |
| "valid_targets_mean": 5130.4, |
| "valid_targets_min": 1535 |
| }, |
| { |
| "epoch": 4.595238095238095, |
| "grad_norm": 0.4758481215827844, |
| "learning_rate": 1.2752161386391526e-05, |
| "loss": 0.1427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13737112283706665, |
| "step": 2895, |
| "valid_targets_mean": 4636.4, |
| "valid_targets_min": 293 |
| }, |
| { |
| "epoch": 4.603174603174603, |
| "grad_norm": 0.4767645902681976, |
| "learning_rate": 1.2678445465894491e-05, |
| "loss": 0.1561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16972827911376953, |
| "step": 2900, |
| "valid_targets_mean": 4518.6, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 4.611111111111111, |
| "grad_norm": 0.4257119901155639, |
| "learning_rate": 1.2604844223445181e-05, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15088322758674622, |
| "step": 2905, |
| "valid_targets_mean": 5354.5, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 4.619047619047619, |
| "grad_norm": 0.42846734809049425, |
| "learning_rate": 1.2531358811865268e-05, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15017569065093994, |
| "step": 2910, |
| "valid_targets_mean": 5312.0, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 4.6269841269841265, |
| "grad_norm": 0.4925025724969061, |
| "learning_rate": 1.2457990382162173e-05, |
| "loss": 0.1437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1452239453792572, |
| "step": 2915, |
| "valid_targets_mean": 4835.2, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 4.634920634920634, |
| "grad_norm": 0.4662611029234124, |
| "learning_rate": 1.238474008351101e-05, |
| "loss": 0.1533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15926414728164673, |
| "step": 2920, |
| "valid_targets_mean": 5120.9, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 4.642857142857143, |
| "grad_norm": 0.4322145630104494, |
| "learning_rate": 1.2311609063236594e-05, |
| "loss": 0.1413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1390167623758316, |
| "step": 2925, |
| "valid_targets_mean": 4672.6, |
| "valid_targets_min": 1746 |
| }, |
| { |
| "epoch": 4.650793650793651, |
| "grad_norm": 0.4130969360637945, |
| "learning_rate": 1.2238598466795493e-05, |
| "loss": 0.1386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12715992331504822, |
| "step": 2930, |
| "valid_targets_mean": 5706.3, |
| "valid_targets_min": 1765 |
| }, |
| { |
| "epoch": 4.658730158730159, |
| "grad_norm": 0.3829382672782595, |
| "learning_rate": 1.2165709437758042e-05, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14774689078330994, |
| "step": 2935, |
| "valid_targets_mean": 6549.7, |
| "valid_targets_min": 3799 |
| }, |
| { |
| "epoch": 4.666666666666667, |
| "grad_norm": 0.38939915661022567, |
| "learning_rate": 1.209294311779047e-05, |
| "loss": 0.1519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14104187488555908, |
| "step": 2940, |
| "valid_targets_mean": 6312.2, |
| "valid_targets_min": 2275 |
| }, |
| { |
| "epoch": 4.674603174603175, |
| "grad_norm": 0.43181417781915576, |
| "learning_rate": 1.2020300646637018e-05, |
| "loss": 0.1499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11396326869726181, |
| "step": 2945, |
| "valid_targets_mean": 5581.9, |
| "valid_targets_min": 260 |
| }, |
| { |
| "epoch": 4.682539682539683, |
| "grad_norm": 0.44410129386120123, |
| "learning_rate": 1.1947783162102043e-05, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1418922394514084, |
| "step": 2950, |
| "valid_targets_mean": 4655.8, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 4.690476190476191, |
| "grad_norm": 0.48458127033747794, |
| "learning_rate": 1.1875391800032248e-05, |
| "loss": 0.1577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1841154396533966, |
| "step": 2955, |
| "valid_targets_mean": 4632.9, |
| "valid_targets_min": 313 |
| }, |
| { |
| "epoch": 4.698412698412699, |
| "grad_norm": 0.4032339427441577, |
| "learning_rate": 1.1803127694298873e-05, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14213016629219055, |
| "step": 2960, |
| "valid_targets_mean": 5584.8, |
| "valid_targets_min": 934 |
| }, |
| { |
| "epoch": 4.7063492063492065, |
| "grad_norm": 0.4419975398132066, |
| "learning_rate": 1.173099197677992e-05, |
| "loss": 0.1437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1430945247411728, |
| "step": 2965, |
| "valid_targets_mean": 5749.8, |
| "valid_targets_min": 2081 |
| }, |
| { |
| "epoch": 4.714285714285714, |
| "grad_norm": 0.43503178571092443, |
| "learning_rate": 1.1658985777342458e-05, |
| "loss": 0.1449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14752447605133057, |
| "step": 2970, |
| "valid_targets_mean": 5720.0, |
| "valid_targets_min": 1862 |
| }, |
| { |
| "epoch": 4.722222222222222, |
| "grad_norm": 0.42023994518841934, |
| "learning_rate": 1.1587110223824874e-05, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15875454246997833, |
| "step": 2975, |
| "valid_targets_mean": 5639.4, |
| "valid_targets_min": 1270 |
| }, |
| { |
| "epoch": 4.73015873015873, |
| "grad_norm": 0.37363144454032915, |
| "learning_rate": 1.151536644201925e-05, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11643218994140625, |
| "step": 2980, |
| "valid_targets_mean": 5878.9, |
| "valid_targets_min": 1841 |
| }, |
| { |
| "epoch": 4.738095238095238, |
| "grad_norm": 0.44030969849082424, |
| "learning_rate": 1.1443755555653751e-05, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15411710739135742, |
| "step": 2985, |
| "valid_targets_mean": 4914.2, |
| "valid_targets_min": 1221 |
| }, |
| { |
| "epoch": 4.746031746031746, |
| "grad_norm": 0.41262993153981603, |
| "learning_rate": 1.1372278686374935e-05, |
| "loss": 0.1457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1678827404975891, |
| "step": 2990, |
| "valid_targets_mean": 5873.3, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 4.753968253968254, |
| "grad_norm": 0.4311749330104684, |
| "learning_rate": 1.1300936953730273e-05, |
| "loss": 0.1535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.143174409866333, |
| "step": 2995, |
| "valid_targets_mean": 5119.6, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 4.761904761904762, |
| "grad_norm": 0.361954540458806, |
| "learning_rate": 1.1229731475150594e-05, |
| "loss": 0.1523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13922378420829773, |
| "step": 3000, |
| "valid_targets_mean": 6611.1, |
| "valid_targets_min": 3655 |
| }, |
| { |
| "epoch": 4.76984126984127, |
| "grad_norm": 0.3966366790173581, |
| "learning_rate": 1.1158663365932529e-05, |
| "loss": 0.1448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15058225393295288, |
| "step": 3005, |
| "valid_targets_mean": 5934.8, |
| "valid_targets_min": 3133 |
| }, |
| { |
| "epoch": 4.777777777777778, |
| "grad_norm": 0.4612543471363477, |
| "learning_rate": 1.1087733739221109e-05, |
| "loss": 0.15, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15629416704177856, |
| "step": 3010, |
| "valid_targets_mean": 4712.2, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 4.785714285714286, |
| "grad_norm": 0.38989272621213816, |
| "learning_rate": 1.1016943705992311e-05, |
| "loss": 0.1496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1398439258337021, |
| "step": 3015, |
| "valid_targets_mean": 6174.9, |
| "valid_targets_min": 2064 |
| }, |
| { |
| "epoch": 4.7936507936507935, |
| "grad_norm": 0.4371800342017838, |
| "learning_rate": 1.0946294375035639e-05, |
| "loss": 0.1503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1522529125213623, |
| "step": 3020, |
| "valid_targets_mean": 4937.9, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 4.801587301587301, |
| "grad_norm": 0.5205141553470364, |
| "learning_rate": 1.087578685293674e-05, |
| "loss": 0.1497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15628096461296082, |
| "step": 3025, |
| "valid_targets_mean": 5111.9, |
| "valid_targets_min": 295 |
| }, |
| { |
| "epoch": 4.809523809523809, |
| "grad_norm": 0.4077302471049976, |
| "learning_rate": 1.080542224406015e-05, |
| "loss": 0.1458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14736653864383698, |
| "step": 3030, |
| "valid_targets_mean": 5978.1, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 4.817460317460317, |
| "grad_norm": 0.4091248100895989, |
| "learning_rate": 1.0735201650531915e-05, |
| "loss": 0.1473, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1352832168340683, |
| "step": 3035, |
| "valid_targets_mean": 5664.2, |
| "valid_targets_min": 2353 |
| }, |
| { |
| "epoch": 4.825396825396825, |
| "grad_norm": 0.3968540500697524, |
| "learning_rate": 1.066512617222235e-05, |
| "loss": 0.1401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12752054631710052, |
| "step": 3040, |
| "valid_targets_mean": 6093.6, |
| "valid_targets_min": 1203 |
| }, |
| { |
| "epoch": 4.833333333333333, |
| "grad_norm": 0.3642854376590935, |
| "learning_rate": 1.059519690672884e-05, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15932929515838623, |
| "step": 3045, |
| "valid_targets_mean": 7128.1, |
| "valid_targets_min": 2558 |
| }, |
| { |
| "epoch": 4.841269841269841, |
| "grad_norm": 0.38602348967427114, |
| "learning_rate": 1.0525414949358614e-05, |
| "loss": 0.1473, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1197904720902443, |
| "step": 3050, |
| "valid_targets_mean": 5888.0, |
| "valid_targets_min": 2560 |
| }, |
| { |
| "epoch": 4.849206349206349, |
| "grad_norm": 0.510022835675847, |
| "learning_rate": 1.0455781393111613e-05, |
| "loss": 0.1471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14147284626960754, |
| "step": 3055, |
| "valid_targets_mean": 5739.3, |
| "valid_targets_min": 1793 |
| }, |
| { |
| "epoch": 4.857142857142857, |
| "grad_norm": 0.6751258587414498, |
| "learning_rate": 1.0386297328663353e-05, |
| "loss": 0.1507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16436898708343506, |
| "step": 3060, |
| "valid_targets_mean": 6290.2, |
| "valid_targets_min": 440 |
| }, |
| { |
| "epoch": 4.865079365079366, |
| "grad_norm": 0.4424084854510193, |
| "learning_rate": 1.0316963844347843e-05, |
| "loss": 0.1522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15425124764442444, |
| "step": 3065, |
| "valid_targets_mean": 5844.6, |
| "valid_targets_min": 2170 |
| }, |
| { |
| "epoch": 4.8730158730158735, |
| "grad_norm": 0.4168794838811193, |
| "learning_rate": 1.0247782026140576e-05, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13188251852989197, |
| "step": 3070, |
| "valid_targets_mean": 5396.5, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 4.880952380952381, |
| "grad_norm": 0.49315142334278483, |
| "learning_rate": 1.017875295764144e-05, |
| "loss": 0.1503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13740713894367218, |
| "step": 3075, |
| "valid_targets_mean": 5882.2, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 4.888888888888889, |
| "grad_norm": 0.4543689569217225, |
| "learning_rate": 1.0109877720057818e-05, |
| "loss": 0.1567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16015523672103882, |
| "step": 3080, |
| "valid_targets_mean": 5451.6, |
| "valid_targets_min": 2056 |
| }, |
| { |
| "epoch": 4.896825396825397, |
| "grad_norm": 0.36802504019714555, |
| "learning_rate": 1.0041157392187651e-05, |
| "loss": 0.145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11829912662506104, |
| "step": 3085, |
| "valid_targets_mean": 5831.1, |
| "valid_targets_min": 2830 |
| }, |
| { |
| "epoch": 4.904761904761905, |
| "grad_norm": 0.3966134482676806, |
| "learning_rate": 9.972593050402471e-06, |
| "loss": 0.1412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14243818819522858, |
| "step": 3090, |
| "valid_targets_mean": 6406.8, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 4.912698412698413, |
| "grad_norm": 0.4183961944811586, |
| "learning_rate": 9.904185768630612e-06, |
| "loss": 0.1418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16794633865356445, |
| "step": 3095, |
| "valid_targets_mean": 6009.8, |
| "valid_targets_min": 3070 |
| }, |
| { |
| "epoch": 4.920634920634921, |
| "grad_norm": 0.44212723748685295, |
| "learning_rate": 9.835936618340377e-06, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14964662492275238, |
| "step": 3100, |
| "valid_targets_mean": 4590.1, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 4.928571428571429, |
| "grad_norm": 0.41070340267056166, |
| "learning_rate": 9.76784666852323e-06, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12387900054454803, |
| "step": 3105, |
| "valid_targets_mean": 6402.7, |
| "valid_targets_min": 3540 |
| }, |
| { |
| "epoch": 4.936507936507937, |
| "grad_norm": 0.44233711675764437, |
| "learning_rate": 9.699916985677062e-06, |
| "loss": 0.1482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1574784517288208, |
| "step": 3110, |
| "valid_targets_mean": 4382.4, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 4.944444444444445, |
| "grad_norm": 0.46887051592133433, |
| "learning_rate": 9.6321486337895e-06, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15827694535255432, |
| "step": 3115, |
| "valid_targets_mean": 5222.6, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 4.9523809523809526, |
| "grad_norm": 0.41511980613828253, |
| "learning_rate": 9.564542674321228e-06, |
| "loss": 0.1479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14313764870166779, |
| "step": 3120, |
| "valid_targets_mean": 5663.2, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 4.9603174603174605, |
| "grad_norm": 0.4621864142346036, |
| "learning_rate": 9.49710016618937e-06, |
| "loss": 0.1517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15151920914649963, |
| "step": 3125, |
| "valid_targets_mean": 5380.6, |
| "valid_targets_min": 313 |
| }, |
| { |
| "epoch": 4.968253968253968, |
| "grad_norm": 0.48527019717345327, |
| "learning_rate": 9.429822165750893e-06, |
| "loss": 0.1509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14661577343940735, |
| "step": 3130, |
| "valid_targets_mean": 4398.2, |
| "valid_targets_min": 633 |
| }, |
| { |
| "epoch": 4.976190476190476, |
| "grad_norm": 0.3831996919641483, |
| "learning_rate": 9.36270972678607e-06, |
| "loss": 0.1398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13461735844612122, |
| "step": 3135, |
| "valid_targets_mean": 6052.1, |
| "valid_targets_min": 1578 |
| }, |
| { |
| "epoch": 4.984126984126984, |
| "grad_norm": 0.4100072649060219, |
| "learning_rate": 9.295763900481977e-06, |
| "loss": 0.1449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12445595860481262, |
| "step": 3140, |
| "valid_targets_mean": 5427.4, |
| "valid_targets_min": 307 |
| }, |
| { |
| "epoch": 4.992063492063492, |
| "grad_norm": 0.46254552204793853, |
| "learning_rate": 9.22898573541602e-06, |
| "loss": 0.1485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16388916969299316, |
| "step": 3145, |
| "valid_targets_mean": 5861.9, |
| "valid_targets_min": 2467 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.40795669884699387, |
| "learning_rate": 9.162376277539513e-06, |
| "loss": 0.1439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15090236067771912, |
| "step": 3150, |
| "valid_targets_mean": 5592.5, |
| "valid_targets_min": 1990 |
| }, |
| { |
| "epoch": 5.007936507936508, |
| "grad_norm": 0.3857823068068869, |
| "learning_rate": 9.095936570161301e-06, |
| "loss": 0.138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14320944249629974, |
| "step": 3155, |
| "valid_targets_mean": 5639.6, |
| "valid_targets_min": 260 |
| }, |
| { |
| "epoch": 5.015873015873016, |
| "grad_norm": 0.5435449453461013, |
| "learning_rate": 9.029667653931411e-06, |
| "loss": 0.1325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1401306390762329, |
| "step": 3160, |
| "valid_targets_mean": 5760.2, |
| "valid_targets_min": 371 |
| }, |
| { |
| "epoch": 5.023809523809524, |
| "grad_norm": 0.6789857642195729, |
| "learning_rate": 8.96357056682475e-06, |
| "loss": 0.1367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12801998853683472, |
| "step": 3165, |
| "valid_targets_mean": 5610.3, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 5.031746031746032, |
| "grad_norm": 0.38873846063838485, |
| "learning_rate": 8.897646344124882e-06, |
| "loss": 0.1304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11531123518943787, |
| "step": 3170, |
| "valid_targets_mean": 6343.7, |
| "valid_targets_min": 2461 |
| }, |
| { |
| "epoch": 5.0396825396825395, |
| "grad_norm": 0.4632360566976383, |
| "learning_rate": 8.83189601840773e-06, |
| "loss": 0.1416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14523249864578247, |
| "step": 3175, |
| "valid_targets_mean": 5589.1, |
| "valid_targets_min": 1310 |
| }, |
| { |
| "epoch": 5.0476190476190474, |
| "grad_norm": 0.44480606265136036, |
| "learning_rate": 8.766320619525511e-06, |
| "loss": 0.1405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1437515914440155, |
| "step": 3180, |
| "valid_targets_mean": 5137.6, |
| "valid_targets_min": 1450 |
| }, |
| { |
| "epoch": 5.055555555555555, |
| "grad_norm": 0.40620681435947337, |
| "learning_rate": 8.700921174590525e-06, |
| "loss": 0.1357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13447782397270203, |
| "step": 3185, |
| "valid_targets_mean": 6346.1, |
| "valid_targets_min": 4150 |
| }, |
| { |
| "epoch": 5.063492063492063, |
| "grad_norm": 0.46662620571823504, |
| "learning_rate": 8.63569870795907e-06, |
| "loss": 0.138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14662285149097443, |
| "step": 3190, |
| "valid_targets_mean": 6060.2, |
| "valid_targets_min": 1308 |
| }, |
| { |
| "epoch": 5.071428571428571, |
| "grad_norm": 0.4654130995805731, |
| "learning_rate": 8.570654241215466e-06, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14438563585281372, |
| "step": 3195, |
| "valid_targets_mean": 5318.1, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 5.079365079365079, |
| "grad_norm": 0.40240677129462593, |
| "learning_rate": 8.505788793155978e-06, |
| "loss": 0.1285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11840318888425827, |
| "step": 3200, |
| "valid_targets_mean": 6147.7, |
| "valid_targets_min": 403 |
| }, |
| { |
| "epoch": 5.087301587301587, |
| "grad_norm": 0.5552645220273652, |
| "learning_rate": 8.441103379772893e-06, |
| "loss": 0.1433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15520301461219788, |
| "step": 3205, |
| "valid_targets_mean": 5761.9, |
| "valid_targets_min": 1220 |
| }, |
| { |
| "epoch": 5.095238095238095, |
| "grad_norm": 0.4847744229611747, |
| "learning_rate": 8.376599014238605e-06, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12781260907649994, |
| "step": 3210, |
| "valid_targets_mean": 5049.5, |
| "valid_targets_min": 2182 |
| }, |
| { |
| "epoch": 5.103174603174603, |
| "grad_norm": 0.4448058887555173, |
| "learning_rate": 8.312276706889738e-06, |
| "loss": 0.1409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14810214936733246, |
| "step": 3215, |
| "valid_targets_mean": 4893.2, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 5.111111111111111, |
| "grad_norm": 0.3769447002552102, |
| "learning_rate": 8.24813746521133e-06, |
| "loss": 0.1442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11988615989685059, |
| "step": 3220, |
| "valid_targets_mean": 6354.1, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 5.119047619047619, |
| "grad_norm": 0.40775763269992454, |
| "learning_rate": 8.184182293821046e-06, |
| "loss": 0.1335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13774478435516357, |
| "step": 3225, |
| "valid_targets_mean": 6155.4, |
| "valid_targets_min": 1769 |
| }, |
| { |
| "epoch": 5.1269841269841265, |
| "grad_norm": 0.4621791306803943, |
| "learning_rate": 8.120412194453442e-06, |
| "loss": 0.1297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13131381571292877, |
| "step": 3230, |
| "valid_targets_mean": 5662.6, |
| "valid_targets_min": 1704 |
| }, |
| { |
| "epoch": 5.134920634920635, |
| "grad_norm": 0.47477190317994294, |
| "learning_rate": 8.056828165944282e-06, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11765207350254059, |
| "step": 3235, |
| "valid_targets_mean": 4793.4, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 5.142857142857143, |
| "grad_norm": 0.4211817590749248, |
| "learning_rate": 7.993431204214883e-06, |
| "loss": 0.144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.140112042427063, |
| "step": 3240, |
| "valid_targets_mean": 6042.8, |
| "valid_targets_min": 2069 |
| }, |
| { |
| "epoch": 5.150793650793651, |
| "grad_norm": 0.4100200812051378, |
| "learning_rate": 7.93022230225652e-06, |
| "loss": 0.1364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1306135654449463, |
| "step": 3245, |
| "valid_targets_mean": 5446.9, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 5.158730158730159, |
| "grad_norm": 0.4654477832902761, |
| "learning_rate": 7.867202450114892e-06, |
| "loss": 0.1469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1470104455947876, |
| "step": 3250, |
| "valid_targets_mean": 4906.9, |
| "valid_targets_min": 483 |
| }, |
| { |
| "epoch": 5.166666666666667, |
| "grad_norm": 0.523468892447528, |
| "learning_rate": 7.804372634874582e-06, |
| "loss": 0.1356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13795553147792816, |
| "step": 3255, |
| "valid_targets_mean": 4284.5, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 5.174603174603175, |
| "grad_norm": 0.6078996381505655, |
| "learning_rate": 7.74173384064359e-06, |
| "loss": 0.1355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1462775468826294, |
| "step": 3260, |
| "valid_targets_mean": 5041.4, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 5.182539682539683, |
| "grad_norm": 0.4607675067323951, |
| "learning_rate": 7.679287048537987e-06, |
| "loss": 0.1433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1391090750694275, |
| "step": 3265, |
| "valid_targets_mean": 5745.2, |
| "valid_targets_min": 336 |
| }, |
| { |
| "epoch": 5.190476190476191, |
| "grad_norm": 0.4923341770949091, |
| "learning_rate": 7.617033236666469e-06, |
| "loss": 0.1331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1512683480978012, |
| "step": 3270, |
| "valid_targets_mean": 4856.6, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 5.198412698412699, |
| "grad_norm": 0.4823935955118556, |
| "learning_rate": 7.55497338011506e-06, |
| "loss": 0.133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12928101420402527, |
| "step": 3275, |
| "valid_targets_mean": 5083.1, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 5.2063492063492065, |
| "grad_norm": 0.4571859304803118, |
| "learning_rate": 7.493108450931879e-06, |
| "loss": 0.1409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.147546648979187, |
| "step": 3280, |
| "valid_targets_mean": 5298.1, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 5.214285714285714, |
| "grad_norm": 0.4656323081387472, |
| "learning_rate": 7.4314394181118636e-06, |
| "loss": 0.1455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13368697464466095, |
| "step": 3285, |
| "valid_targets_mean": 5323.8, |
| "valid_targets_min": 1007 |
| }, |
| { |
| "epoch": 5.222222222222222, |
| "grad_norm": 0.47778320363976773, |
| "learning_rate": 7.369967247581611e-06, |
| "loss": 0.1363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14050470292568207, |
| "step": 3290, |
| "valid_targets_mean": 4988.6, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 5.23015873015873, |
| "grad_norm": 0.47185902185121587, |
| "learning_rate": 7.3086929021842575e-06, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14221060276031494, |
| "step": 3295, |
| "valid_targets_mean": 4921.3, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 5.238095238095238, |
| "grad_norm": 0.40677949622794063, |
| "learning_rate": 7.247617341664384e-06, |
| "loss": 0.141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15191778540611267, |
| "step": 3300, |
| "valid_targets_mean": 6783.2, |
| "valid_targets_min": 2108 |
| }, |
| { |
| "epoch": 5.246031746031746, |
| "grad_norm": 0.5597275095189963, |
| "learning_rate": 7.186741522652994e-06, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1412215381860733, |
| "step": 3305, |
| "valid_targets_mean": 5306.6, |
| "valid_targets_min": 1796 |
| }, |
| { |
| "epoch": 5.253968253968254, |
| "grad_norm": 0.4136667615907917, |
| "learning_rate": 7.12606639865252e-06, |
| "loss": 0.1349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13404718041419983, |
| "step": 3310, |
| "valid_targets_mean": 5412.3, |
| "valid_targets_min": 838 |
| }, |
| { |
| "epoch": 5.261904761904762, |
| "grad_norm": 0.5072282174178516, |
| "learning_rate": 7.065592920021893e-06, |
| "loss": 0.1453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1653522104024887, |
| "step": 3315, |
| "valid_targets_mean": 5170.6, |
| "valid_targets_min": 1293 |
| }, |
| { |
| "epoch": 5.26984126984127, |
| "grad_norm": 0.43649425013960674, |
| "learning_rate": 7.005322033961679e-06, |
| "loss": 0.1421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14359837770462036, |
| "step": 3320, |
| "valid_targets_mean": 5731.9, |
| "valid_targets_min": 2041 |
| }, |
| { |
| "epoch": 5.277777777777778, |
| "grad_norm": 0.4609844808793299, |
| "learning_rate": 6.945254684499185e-06, |
| "loss": 0.1388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14887037873268127, |
| "step": 3325, |
| "valid_targets_mean": 5072.8, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 5.285714285714286, |
| "grad_norm": 0.4423681058460165, |
| "learning_rate": 6.8853918124737274e-06, |
| "loss": 0.1378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1400473713874817, |
| "step": 3330, |
| "valid_targets_mean": 5419.5, |
| "valid_targets_min": 461 |
| }, |
| { |
| "epoch": 5.2936507936507935, |
| "grad_norm": 0.4833740463102983, |
| "learning_rate": 6.825734355521898e-06, |
| "loss": 0.1438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1373916119337082, |
| "step": 3335, |
| "valid_targets_mean": 5413.9, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 5.301587301587301, |
| "grad_norm": 0.46607539050074326, |
| "learning_rate": 6.766283248062817e-06, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14503991603851318, |
| "step": 3340, |
| "valid_targets_mean": 5005.1, |
| "valid_targets_min": 1372 |
| }, |
| { |
| "epoch": 5.309523809523809, |
| "grad_norm": 0.46602580090763035, |
| "learning_rate": 6.707039421283559e-06, |
| "loss": 0.1362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1407843828201294, |
| "step": 3345, |
| "valid_targets_mean": 4867.7, |
| "valid_targets_min": 279 |
| }, |
| { |
| "epoch": 5.317460317460317, |
| "grad_norm": 0.4977380166852099, |
| "learning_rate": 6.648003803124559e-06, |
| "loss": 0.1417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18442052602767944, |
| "step": 3350, |
| "valid_targets_mean": 4517.1, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 5.325396825396825, |
| "grad_norm": 0.45300213871690015, |
| "learning_rate": 6.589177318265047e-06, |
| "loss": 0.133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13406887650489807, |
| "step": 3355, |
| "valid_targets_mean": 5391.9, |
| "valid_targets_min": 501 |
| }, |
| { |
| "epoch": 5.333333333333333, |
| "grad_norm": 0.4255524573366613, |
| "learning_rate": 6.53056088810857e-06, |
| "loss": 0.1469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14955641329288483, |
| "step": 3360, |
| "valid_targets_mean": 5542.8, |
| "valid_targets_min": 2458 |
| }, |
| { |
| "epoch": 5.341269841269841, |
| "grad_norm": 0.5534775234199173, |
| "learning_rate": 6.472155430768608e-06, |
| "loss": 0.1378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12088638544082642, |
| "step": 3365, |
| "valid_targets_mean": 6366.4, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 5.349206349206349, |
| "grad_norm": 0.4364437395513567, |
| "learning_rate": 6.413961861054132e-06, |
| "loss": 0.1329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15652699768543243, |
| "step": 3370, |
| "valid_targets_mean": 5471.2, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 5.357142857142857, |
| "grad_norm": 0.45770813360412227, |
| "learning_rate": 6.3559810904553095e-06, |
| "loss": 0.1361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14036116003990173, |
| "step": 3375, |
| "valid_targets_mean": 5520.9, |
| "valid_targets_min": 256 |
| }, |
| { |
| "epoch": 5.365079365079365, |
| "grad_norm": 0.4153555346953972, |
| "learning_rate": 6.298214027129219e-06, |
| "loss": 0.1341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13151246309280396, |
| "step": 3380, |
| "valid_targets_mean": 6010.9, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 5.3730158730158735, |
| "grad_norm": 0.4451350722143499, |
| "learning_rate": 6.240661575885629e-06, |
| "loss": 0.1374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1685609072446823, |
| "step": 3385, |
| "valid_targets_mean": 5214.2, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 5.380952380952381, |
| "grad_norm": 0.46292596088927307, |
| "learning_rate": 6.183324638172819e-06, |
| "loss": 0.1438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15203514695167542, |
| "step": 3390, |
| "valid_targets_mean": 5266.0, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 5.388888888888889, |
| "grad_norm": 0.4676464235157195, |
| "learning_rate": 6.126204112063463e-06, |
| "loss": 0.1353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13088193535804749, |
| "step": 3395, |
| "valid_targets_mean": 4737.1, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 5.396825396825397, |
| "grad_norm": 0.6797962177962652, |
| "learning_rate": 6.069300892240564e-06, |
| "loss": 0.1514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16591420769691467, |
| "step": 3400, |
| "valid_targets_mean": 4606.3, |
| "valid_targets_min": 377 |
| }, |
| { |
| "epoch": 5.404761904761905, |
| "grad_norm": 0.47267093685643496, |
| "learning_rate": 6.0126158699834625e-06, |
| "loss": 0.146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13353607058525085, |
| "step": 3405, |
| "valid_targets_mean": 5052.6, |
| "valid_targets_min": 2020 |
| }, |
| { |
| "epoch": 5.412698412698413, |
| "grad_norm": 0.428442687908954, |
| "learning_rate": 5.956149933153816e-06, |
| "loss": 0.1318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12273760139942169, |
| "step": 3410, |
| "valid_targets_mean": 5588.0, |
| "valid_targets_min": 2053 |
| }, |
| { |
| "epoch": 5.420634920634921, |
| "grad_norm": 0.4412367255518039, |
| "learning_rate": 5.899903966181751e-06, |
| "loss": 0.1398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14523178339004517, |
| "step": 3415, |
| "valid_targets_mean": 5505.2, |
| "valid_targets_min": 2042 |
| }, |
| { |
| "epoch": 5.428571428571429, |
| "grad_norm": 0.43781568976305363, |
| "learning_rate": 5.843878850052007e-06, |
| "loss": 0.1261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14099499583244324, |
| "step": 3420, |
| "valid_targets_mean": 5586.9, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 5.436507936507937, |
| "grad_norm": 0.46059817758019467, |
| "learning_rate": 5.788075462290084e-06, |
| "loss": 0.1333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1432957500219345, |
| "step": 3425, |
| "valid_targets_mean": 4740.2, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 5.444444444444445, |
| "grad_norm": 0.415134511085044, |
| "learning_rate": 5.732494676948554e-06, |
| "loss": 0.1303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12942150235176086, |
| "step": 3430, |
| "valid_targets_mean": 6054.6, |
| "valid_targets_min": 608 |
| }, |
| { |
| "epoch": 5.4523809523809526, |
| "grad_norm": 0.41001838037825894, |
| "learning_rate": 5.677137364593363e-06, |
| "loss": 0.1379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14375941455364227, |
| "step": 3435, |
| "valid_targets_mean": 5782.4, |
| "valid_targets_min": 2362 |
| }, |
| { |
| "epoch": 5.4603174603174605, |
| "grad_norm": 0.4462203270648477, |
| "learning_rate": 5.622004392290163e-06, |
| "loss": 0.1409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13974609971046448, |
| "step": 3440, |
| "valid_targets_mean": 5166.1, |
| "valid_targets_min": 1105 |
| }, |
| { |
| "epoch": 5.468253968253968, |
| "grad_norm": 0.5621286314149347, |
| "learning_rate": 5.567096623590758e-06, |
| "loss": 0.1432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14251437783241272, |
| "step": 3445, |
| "valid_targets_mean": 5521.8, |
| "valid_targets_min": 1822 |
| }, |
| { |
| "epoch": 5.476190476190476, |
| "grad_norm": 0.3951253389087575, |
| "learning_rate": 5.512414918519573e-06, |
| "loss": 0.1375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.138666570186615, |
| "step": 3450, |
| "valid_targets_mean": 6410.9, |
| "valid_targets_min": 2903 |
| }, |
| { |
| "epoch": 5.484126984126984, |
| "grad_norm": 0.42978600879401685, |
| "learning_rate": 5.457960133560179e-06, |
| "loss": 0.1395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13873498141765594, |
| "step": 3455, |
| "valid_targets_mean": 5563.0, |
| "valid_targets_min": 2443 |
| }, |
| { |
| "epoch": 5.492063492063492, |
| "grad_norm": 0.4763755663272107, |
| "learning_rate": 5.403733121641883e-06, |
| "loss": 0.1413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14260432124137878, |
| "step": 3460, |
| "valid_targets_mean": 5387.6, |
| "valid_targets_min": 1680 |
| }, |
| { |
| "epoch": 5.5, |
| "grad_norm": 0.45865214891995293, |
| "learning_rate": 5.349734732126366e-06, |
| "loss": 0.1299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15055881440639496, |
| "step": 3465, |
| "valid_targets_mean": 5297.8, |
| "valid_targets_min": 247 |
| }, |
| { |
| "epoch": 5.507936507936508, |
| "grad_norm": 0.4739801326379873, |
| "learning_rate": 5.295965810794376e-06, |
| "loss": 0.1415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1341158002614975, |
| "step": 3470, |
| "valid_targets_mean": 4671.8, |
| "valid_targets_min": 1946 |
| }, |
| { |
| "epoch": 5.515873015873016, |
| "grad_norm": 0.4054624348563083, |
| "learning_rate": 5.2424271998324895e-06, |
| "loss": 0.1305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13239628076553345, |
| "step": 3475, |
| "valid_targets_mean": 5538.2, |
| "valid_targets_min": 2317 |
| }, |
| { |
| "epoch": 5.523809523809524, |
| "grad_norm": 0.47822327586671515, |
| "learning_rate": 5.189119737819912e-06, |
| "loss": 0.1359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13307338953018188, |
| "step": 3480, |
| "valid_targets_mean": 5326.6, |
| "valid_targets_min": 1927 |
| }, |
| { |
| "epoch": 5.531746031746032, |
| "grad_norm": 0.45640673731159975, |
| "learning_rate": 5.136044259715342e-06, |
| "loss": 0.1411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1569247543811798, |
| "step": 3485, |
| "valid_targets_mean": 5192.1, |
| "valid_targets_min": 1402 |
| }, |
| { |
| "epoch": 5.5396825396825395, |
| "grad_norm": 0.47606206142121826, |
| "learning_rate": 5.083201596843905e-06, |
| "loss": 0.1301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13270564377307892, |
| "step": 3490, |
| "valid_targets_mean": 5579.8, |
| "valid_targets_min": 1802 |
| }, |
| { |
| "epoch": 5.5476190476190474, |
| "grad_norm": 0.48207429223420034, |
| "learning_rate": 5.030592576884117e-06, |
| "loss": 0.1479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1469019204378128, |
| "step": 3495, |
| "valid_targets_mean": 5300.8, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 5.555555555555555, |
| "grad_norm": 0.46920831785621236, |
| "learning_rate": 4.978218023854928e-06, |
| "loss": 0.1355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14404523372650146, |
| "step": 3500, |
| "valid_targets_mean": 4518.9, |
| "valid_targets_min": 229 |
| }, |
| { |
| "epoch": 5.563492063492063, |
| "grad_norm": 0.42912173167963297, |
| "learning_rate": 4.926078758102834e-06, |
| "loss": 0.1417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1521531045436859, |
| "step": 3505, |
| "valid_targets_mean": 5723.4, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 5.571428571428571, |
| "grad_norm": 0.503182430334019, |
| "learning_rate": 4.87417559628897e-06, |
| "loss": 0.1304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13956725597381592, |
| "step": 3510, |
| "valid_targets_mean": 5755.2, |
| "valid_targets_min": 342 |
| }, |
| { |
| "epoch": 5.579365079365079, |
| "grad_norm": 0.483615956667945, |
| "learning_rate": 4.822509351376399e-06, |
| "loss": 0.1484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15917867422103882, |
| "step": 3515, |
| "valid_targets_mean": 4745.8, |
| "valid_targets_min": 871 |
| }, |
| { |
| "epoch": 5.587301587301587, |
| "grad_norm": 0.44843746346045477, |
| "learning_rate": 4.7710808326173115e-06, |
| "loss": 0.1376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14553232491016388, |
| "step": 3520, |
| "valid_targets_mean": 5322.7, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 5.595238095238095, |
| "grad_norm": 0.4446428825967545, |
| "learning_rate": 4.719890845540385e-06, |
| "loss": 0.1414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1446400284767151, |
| "step": 3525, |
| "valid_targets_mean": 5464.6, |
| "valid_targets_min": 1876 |
| }, |
| { |
| "epoch": 5.603174603174603, |
| "grad_norm": 0.44461133087445714, |
| "learning_rate": 4.668940191938156e-06, |
| "loss": 0.1374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12743496894836426, |
| "step": 3530, |
| "valid_targets_mean": 5617.1, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 5.611111111111111, |
| "grad_norm": 0.46893046808084937, |
| "learning_rate": 4.618229669854464e-06, |
| "loss": 0.1357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1406087577342987, |
| "step": 3535, |
| "valid_targets_mean": 5965.8, |
| "valid_targets_min": 2904 |
| }, |
| { |
| "epoch": 5.619047619047619, |
| "grad_norm": 0.49547441030459144, |
| "learning_rate": 4.567760073571947e-06, |
| "loss": 0.136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14891457557678223, |
| "step": 3540, |
| "valid_targets_mean": 4223.9, |
| "valid_targets_min": 1503 |
| }, |
| { |
| "epoch": 5.6269841269841265, |
| "grad_norm": 0.48451923979691575, |
| "learning_rate": 4.51753219359961e-06, |
| "loss": 0.1392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14008775353431702, |
| "step": 3545, |
| "valid_targets_mean": 5037.8, |
| "valid_targets_min": 2496 |
| }, |
| { |
| "epoch": 5.634920634920634, |
| "grad_norm": 0.4290885471458542, |
| "learning_rate": 4.467546816660433e-06, |
| "loss": 0.1383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1463758647441864, |
| "step": 3550, |
| "valid_targets_mean": 6069.6, |
| "valid_targets_min": 2782 |
| }, |
| { |
| "epoch": 5.642857142857143, |
| "grad_norm": 0.4422867985916354, |
| "learning_rate": 4.417804725679058e-06, |
| "loss": 0.1441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1522657573223114, |
| "step": 3555, |
| "valid_targets_mean": 7388.6, |
| "valid_targets_min": 2410 |
| }, |
| { |
| "epoch": 5.650793650793651, |
| "grad_norm": 0.4326771572943575, |
| "learning_rate": 4.368306699769518e-06, |
| "loss": 0.1362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13901498913764954, |
| "step": 3560, |
| "valid_targets_mean": 5687.3, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 5.658730158730159, |
| "grad_norm": 0.5184808560608285, |
| "learning_rate": 4.319053514223033e-06, |
| "loss": 0.1301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12393245846033096, |
| "step": 3565, |
| "valid_targets_mean": 4805.2, |
| "valid_targets_min": 277 |
| }, |
| { |
| "epoch": 5.666666666666667, |
| "grad_norm": 0.4747228961326593, |
| "learning_rate": 4.270045940495879e-06, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1519310176372528, |
| "step": 3570, |
| "valid_targets_mean": 4909.6, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 5.674603174603175, |
| "grad_norm": 0.4817480251050087, |
| "learning_rate": 4.221284746197292e-06, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14879171550273895, |
| "step": 3575, |
| "valid_targets_mean": 5205.3, |
| "valid_targets_min": 512 |
| }, |
| { |
| "epoch": 5.682539682539683, |
| "grad_norm": 0.5206783763038453, |
| "learning_rate": 4.172770695077437e-06, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16022273898124695, |
| "step": 3580, |
| "valid_targets_mean": 4187.7, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 5.690476190476191, |
| "grad_norm": 0.42530942051464743, |
| "learning_rate": 4.124504547015487e-06, |
| "loss": 0.1403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1300957351922989, |
| "step": 3585, |
| "valid_targets_mean": 6382.3, |
| "valid_targets_min": 2232 |
| }, |
| { |
| "epoch": 5.698412698412699, |
| "grad_norm": 0.4773846019671863, |
| "learning_rate": 4.0764870580076675e-06, |
| "loss": 0.1527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17422491312026978, |
| "step": 3590, |
| "valid_targets_mean": 5224.0, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 5.7063492063492065, |
| "grad_norm": 0.3861656168881239, |
| "learning_rate": 4.0287189801554304e-06, |
| "loss": 0.1436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12745806574821472, |
| "step": 3595, |
| "valid_targets_mean": 6368.2, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 5.714285714285714, |
| "grad_norm": 0.41849044348707654, |
| "learning_rate": 3.98120106165371e-06, |
| "loss": 0.1425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13698044419288635, |
| "step": 3600, |
| "valid_targets_mean": 5723.8, |
| "valid_targets_min": 2689 |
| }, |
| { |
| "epoch": 5.722222222222222, |
| "grad_norm": 0.5006534631008478, |
| "learning_rate": 3.933934046779164e-06, |
| "loss": 0.1449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15041181445121765, |
| "step": 3605, |
| "valid_targets_mean": 4726.2, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 5.73015873015873, |
| "grad_norm": 0.5390021957931794, |
| "learning_rate": 3.886918675878513e-06, |
| "loss": 0.1352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15215769410133362, |
| "step": 3610, |
| "valid_targets_mean": 5078.9, |
| "valid_targets_min": 355 |
| }, |
| { |
| "epoch": 5.738095238095238, |
| "grad_norm": 0.4242218655638763, |
| "learning_rate": 3.840155685356983e-06, |
| "loss": 0.1313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12816202640533447, |
| "step": 3615, |
| "valid_targets_mean": 5724.1, |
| "valid_targets_min": 2290 |
| }, |
| { |
| "epoch": 5.746031746031746, |
| "grad_norm": 0.40905901981368425, |
| "learning_rate": 3.793645807666735e-06, |
| "loss": 0.1399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12471656501293182, |
| "step": 3620, |
| "valid_targets_mean": 6163.4, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 5.753968253968254, |
| "grad_norm": 0.5134066612062572, |
| "learning_rate": 3.747389771295411e-06, |
| "loss": 0.1316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13810807466506958, |
| "step": 3625, |
| "valid_targets_mean": 5215.5, |
| "valid_targets_min": 320 |
| }, |
| { |
| "epoch": 5.761904761904762, |
| "grad_norm": 0.44176531273164726, |
| "learning_rate": 3.701388300754709e-06, |
| "loss": 0.149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15570278465747833, |
| "step": 3630, |
| "valid_targets_mean": 5831.4, |
| "valid_targets_min": 1928 |
| }, |
| { |
| "epoch": 5.76984126984127, |
| "grad_norm": 0.4552213038987976, |
| "learning_rate": 3.6556421165690516e-06, |
| "loss": 0.132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13112439215183258, |
| "step": 3635, |
| "valid_targets_mean": 5127.6, |
| "valid_targets_min": 1412 |
| }, |
| { |
| "epoch": 5.777777777777778, |
| "grad_norm": 0.5475459293945621, |
| "learning_rate": 3.610151935264288e-06, |
| "loss": 0.1321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13923147320747375, |
| "step": 3640, |
| "valid_targets_mean": 5058.1, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 5.785714285714286, |
| "grad_norm": 0.4062383720325422, |
| "learning_rate": 3.5649184693564797e-06, |
| "loss": 0.1413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12178117781877518, |
| "step": 3645, |
| "valid_targets_mean": 6188.1, |
| "valid_targets_min": 2820 |
| }, |
| { |
| "epoch": 5.7936507936507935, |
| "grad_norm": 0.41210477208428037, |
| "learning_rate": 3.5199424273407277e-06, |
| "loss": 0.1329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11573171615600586, |
| "step": 3650, |
| "valid_targets_mean": 5608.1, |
| "valid_targets_min": 291 |
| }, |
| { |
| "epoch": 5.801587301587301, |
| "grad_norm": 0.39026902409095005, |
| "learning_rate": 3.4752245136801065e-06, |
| "loss": 0.138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11422628164291382, |
| "step": 3655, |
| "valid_targets_mean": 6121.1, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 5.809523809523809, |
| "grad_norm": 0.44136839976284375, |
| "learning_rate": 3.430765428794569e-06, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15087169408798218, |
| "step": 3660, |
| "valid_targets_mean": 5458.3, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 5.817460317460317, |
| "grad_norm": 0.47272488901004456, |
| "learning_rate": 3.3865658690500424e-06, |
| "loss": 0.1342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12730719149112701, |
| "step": 3665, |
| "valid_targets_mean": 5489.8, |
| "valid_targets_min": 266 |
| }, |
| { |
| "epoch": 5.825396825396825, |
| "grad_norm": 0.4286583074647361, |
| "learning_rate": 3.34262652674749e-06, |
| "loss": 0.1399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13272640109062195, |
| "step": 3670, |
| "valid_targets_mean": 5855.3, |
| "valid_targets_min": 3739 |
| }, |
| { |
| "epoch": 5.833333333333333, |
| "grad_norm": 0.4961674424548416, |
| "learning_rate": 3.2989480901120684e-06, |
| "loss": 0.1305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14517953991889954, |
| "step": 3675, |
| "valid_targets_mean": 5103.6, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 5.841269841269841, |
| "grad_norm": 0.5038921133963972, |
| "learning_rate": 3.2555312432823283e-06, |
| "loss": 0.1381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14607466757297516, |
| "step": 3680, |
| "valid_targets_mean": 4695.1, |
| "valid_targets_min": 2224 |
| }, |
| { |
| "epoch": 5.849206349206349, |
| "grad_norm": 0.4516355692524723, |
| "learning_rate": 3.2123766662995572e-06, |
| "loss": 0.1382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13942056894302368, |
| "step": 3685, |
| "valid_targets_mean": 5577.4, |
| "valid_targets_min": 1295 |
| }, |
| { |
| "epoch": 5.857142857142857, |
| "grad_norm": 0.43990400419076664, |
| "learning_rate": 3.1694850350970686e-06, |
| "loss": 0.1373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14388282597064972, |
| "step": 3690, |
| "valid_targets_mean": 5896.1, |
| "valid_targets_min": 1277 |
| }, |
| { |
| "epoch": 5.865079365079366, |
| "grad_norm": 0.4430961156309604, |
| "learning_rate": 3.1268570214896265e-06, |
| "loss": 0.1454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16903355717658997, |
| "step": 3695, |
| "valid_targets_mean": 5768.0, |
| "valid_targets_min": 309 |
| }, |
| { |
| "epoch": 5.8730158730158735, |
| "grad_norm": 0.4687413821050724, |
| "learning_rate": 3.0844932931629602e-06, |
| "loss": 0.1389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12664330005645752, |
| "step": 3700, |
| "valid_targets_mean": 5469.9, |
| "valid_targets_min": 582 |
| }, |
| { |
| "epoch": 5.880952380952381, |
| "grad_norm": 0.4251478406093825, |
| "learning_rate": 3.0423945136632626e-06, |
| "loss": 0.1371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14676138758659363, |
| "step": 3705, |
| "valid_targets_mean": 6292.8, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 5.888888888888889, |
| "grad_norm": 0.4418913815124218, |
| "learning_rate": 3.000561342386814e-06, |
| "loss": 0.1459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1596686840057373, |
| "step": 3710, |
| "valid_targets_mean": 5276.0, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 5.896825396825397, |
| "grad_norm": 0.46832139188754646, |
| "learning_rate": 2.9589944345696596e-06, |
| "loss": 0.1346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12101615965366364, |
| "step": 3715, |
| "valid_targets_mean": 4913.4, |
| "valid_targets_min": 343 |
| }, |
| { |
| "epoch": 5.904761904761905, |
| "grad_norm": 0.4657929056680499, |
| "learning_rate": 2.9176944412773322e-06, |
| "loss": 0.149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17338143289089203, |
| "step": 3720, |
| "valid_targets_mean": 5412.4, |
| "valid_targets_min": 554 |
| }, |
| { |
| "epoch": 5.912698412698413, |
| "grad_norm": 0.4449595143164407, |
| "learning_rate": 2.876662009394673e-06, |
| "loss": 0.1346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15727762877941132, |
| "step": 3725, |
| "valid_targets_mean": 5328.9, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 5.920634920634921, |
| "grad_norm": 0.39696814679103, |
| "learning_rate": 2.8358977816156796e-06, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11638738214969635, |
| "step": 3730, |
| "valid_targets_mean": 6867.2, |
| "valid_targets_min": 3676 |
| }, |
| { |
| "epoch": 5.928571428571429, |
| "grad_norm": 0.47195292364800606, |
| "learning_rate": 2.7954023964334485e-06, |
| "loss": 0.1349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1505923867225647, |
| "step": 3735, |
| "valid_targets_mean": 5757.2, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 5.936507936507937, |
| "grad_norm": 0.4486759780229958, |
| "learning_rate": 2.7551764881301955e-06, |
| "loss": 0.1246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13487672805786133, |
| "step": 3740, |
| "valid_targets_mean": 5926.0, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 5.944444444444445, |
| "grad_norm": 0.45150456684299833, |
| "learning_rate": 2.715220686767268e-06, |
| "loss": 0.1325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13316667079925537, |
| "step": 3745, |
| "valid_targets_mean": 5609.4, |
| "valid_targets_min": 2528 |
| }, |
| { |
| "epoch": 5.9523809523809526, |
| "grad_norm": 0.4612924420161714, |
| "learning_rate": 2.6755356181753247e-06, |
| "loss": 0.1555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17791566252708435, |
| "step": 3750, |
| "valid_targets_mean": 5493.9, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 5.9603174603174605, |
| "grad_norm": 0.4466679622369211, |
| "learning_rate": 2.6361219039445328e-06, |
| "loss": 0.1425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1417991816997528, |
| "step": 3755, |
| "valid_targets_mean": 5531.8, |
| "valid_targets_min": 3560 |
| }, |
| { |
| "epoch": 5.968253968253968, |
| "grad_norm": 0.46290951572004435, |
| "learning_rate": 2.5969801614147838e-06, |
| "loss": 0.1455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1562907099723816, |
| "step": 3760, |
| "valid_targets_mean": 5726.4, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 5.976190476190476, |
| "grad_norm": 0.41130105503656605, |
| "learning_rate": 2.558111003666075e-06, |
| "loss": 0.1451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13213077187538147, |
| "step": 3765, |
| "valid_targets_mean": 5965.7, |
| "valid_targets_min": 1546 |
| }, |
| { |
| "epoch": 5.984126984126984, |
| "grad_norm": 0.4305429547314029, |
| "learning_rate": 2.519515039508893e-06, |
| "loss": 0.1328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11605265736579895, |
| "step": 3770, |
| "valid_targets_mean": 5509.0, |
| "valid_targets_min": 290 |
| }, |
| { |
| "epoch": 5.992063492063492, |
| "grad_norm": 0.43615187162481, |
| "learning_rate": 2.481192873474667e-06, |
| "loss": 0.1365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13950824737548828, |
| "step": 3775, |
| "valid_targets_mean": 5780.9, |
| "valid_targets_min": 1479 |
| }, |
| { |
| "epoch": 6.0, |
| "grad_norm": 0.39743183112610925, |
| "learning_rate": 2.4431451058062928e-06, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1134757548570633, |
| "step": 3780, |
| "valid_targets_mean": 5882.9, |
| "valid_targets_min": 2457 |
| }, |
| { |
| "epoch": 6.007936507936508, |
| "grad_norm": 0.4320579605085731, |
| "learning_rate": 2.4053723324487677e-06, |
| "loss": 0.1308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12739768624305725, |
| "step": 3785, |
| "valid_targets_mean": 4568.0, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 6.015873015873016, |
| "grad_norm": 0.45806291042546377, |
| "learning_rate": 2.3678751450398196e-06, |
| "loss": 0.1348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1493530422449112, |
| "step": 3790, |
| "valid_targets_mean": 5264.6, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 6.023809523809524, |
| "grad_norm": 0.4440865317653884, |
| "learning_rate": 2.330654130900656e-06, |
| "loss": 0.1324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13022762537002563, |
| "step": 3795, |
| "valid_targets_mean": 4942.4, |
| "valid_targets_min": 2199 |
| }, |
| { |
| "epoch": 6.031746031746032, |
| "grad_norm": 0.4289001750038118, |
| "learning_rate": 2.2937098730267572e-06, |
| "loss": 0.134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11798284202814102, |
| "step": 3800, |
| "valid_targets_mean": 5962.4, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 6.0396825396825395, |
| "grad_norm": 0.4804416865960379, |
| "learning_rate": 2.2570429500787604e-06, |
| "loss": 0.1359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13769641518592834, |
| "step": 3805, |
| "valid_targets_mean": 4876.4, |
| "valid_targets_min": 2078 |
| }, |
| { |
| "epoch": 6.0476190476190474, |
| "grad_norm": 0.4248137219988032, |
| "learning_rate": 2.2206539363733738e-06, |
| "loss": 0.1265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09792445600032806, |
| "step": 3810, |
| "valid_targets_mean": 6735.6, |
| "valid_targets_min": 2875 |
| }, |
| { |
| "epoch": 6.055555555555555, |
| "grad_norm": 0.4458277839797382, |
| "learning_rate": 2.1845434018744038e-06, |
| "loss": 0.1336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13032405078411102, |
| "step": 3815, |
| "valid_targets_mean": 5100.5, |
| "valid_targets_min": 1711 |
| }, |
| { |
| "epoch": 6.063492063492063, |
| "grad_norm": 0.46870997489479654, |
| "learning_rate": 2.148711912183803e-06, |
| "loss": 0.1349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1340586543083191, |
| "step": 3820, |
| "valid_targets_mean": 6257.2, |
| "valid_targets_min": 3713 |
| }, |
| { |
| "epoch": 6.071428571428571, |
| "grad_norm": 0.43220936389411174, |
| "learning_rate": 2.1131600285328458e-06, |
| "loss": 0.1372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13491111993789673, |
| "step": 3825, |
| "valid_targets_mean": 5652.9, |
| "valid_targets_min": 2291 |
| }, |
| { |
| "epoch": 6.079365079365079, |
| "grad_norm": 0.4938619349035986, |
| "learning_rate": 2.0778883077732903e-06, |
| "loss": 0.1221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12590594589710236, |
| "step": 3830, |
| "valid_targets_mean": 5837.1, |
| "valid_targets_min": 1277 |
| }, |
| { |
| "epoch": 6.087301587301587, |
| "grad_norm": 0.4461842204628299, |
| "learning_rate": 2.0428973023686983e-06, |
| "loss": 0.1301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12995757162570953, |
| "step": 3835, |
| "valid_targets_mean": 5839.1, |
| "valid_targets_min": 2495 |
| }, |
| { |
| "epoch": 6.095238095238095, |
| "grad_norm": 0.4514403709392358, |
| "learning_rate": 2.0081875603857726e-06, |
| "loss": 0.1271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11519353836774826, |
| "step": 3840, |
| "valid_targets_mean": 5285.4, |
| "valid_targets_min": 1198 |
| }, |
| { |
| "epoch": 6.103174603174603, |
| "grad_norm": 0.5872250143318944, |
| "learning_rate": 1.973759625485743e-06, |
| "loss": 0.1295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12013471126556396, |
| "step": 3845, |
| "valid_targets_mean": 3976.3, |
| "valid_targets_min": 1509 |
| }, |
| { |
| "epoch": 6.111111111111111, |
| "grad_norm": 0.5053201570927205, |
| "learning_rate": 1.9396140369159e-06, |
| "loss": 0.1314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14312024414539337, |
| "step": 3850, |
| "valid_targets_mean": 5034.4, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 6.119047619047619, |
| "grad_norm": 0.4254491047353564, |
| "learning_rate": 1.9057513295011087e-06, |
| "loss": 0.1249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11980589479207993, |
| "step": 3855, |
| "valid_targets_mean": 5230.5, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 6.1269841269841265, |
| "grad_norm": 0.45350019220553667, |
| "learning_rate": 1.8721720336354487e-06, |
| "loss": 0.1306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1343933343887329, |
| "step": 3860, |
| "valid_targets_mean": 5310.0, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 6.134920634920635, |
| "grad_norm": 0.44908680436264514, |
| "learning_rate": 1.8388766752739017e-06, |
| "loss": 0.1298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13214536011219025, |
| "step": 3865, |
| "valid_targets_mean": 4819.6, |
| "valid_targets_min": 360 |
| }, |
| { |
| "epoch": 6.142857142857143, |
| "grad_norm": 0.43728782320626974, |
| "learning_rate": 1.805865775924116e-06, |
| "loss": 0.137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12990088760852814, |
| "step": 3870, |
| "valid_targets_mean": 5668.4, |
| "valid_targets_min": 2900 |
| }, |
| { |
| "epoch": 6.150793650793651, |
| "grad_norm": 0.46855550237931853, |
| "learning_rate": 1.7731398526382416e-06, |
| "loss": 0.1278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11653086543083191, |
| "step": 3875, |
| "valid_targets_mean": 5082.9, |
| "valid_targets_min": 278 |
| }, |
| { |
| "epoch": 6.158730158730159, |
| "grad_norm": 0.4633118493365201, |
| "learning_rate": 1.7406994180048231e-06, |
| "loss": 0.1302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1214178055524826, |
| "step": 3880, |
| "valid_targets_mean": 5079.4, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 6.166666666666667, |
| "grad_norm": 0.4324845887042187, |
| "learning_rate": 1.7085449801407783e-06, |
| "loss": 0.1242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11891638487577438, |
| "step": 3885, |
| "valid_targets_mean": 5482.2, |
| "valid_targets_min": 630 |
| }, |
| { |
| "epoch": 6.174603174603175, |
| "grad_norm": 0.4593597812117515, |
| "learning_rate": 1.67667704268343e-06, |
| "loss": 0.1302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12844383716583252, |
| "step": 3890, |
| "valid_targets_mean": 5304.3, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 6.182539682539683, |
| "grad_norm": 1.0409294151451973, |
| "learning_rate": 1.6450961047826353e-06, |
| "loss": 0.127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14141665399074554, |
| "step": 3895, |
| "valid_targets_mean": 4083.4, |
| "valid_targets_min": 287 |
| }, |
| { |
| "epoch": 6.190476190476191, |
| "grad_norm": 0.4147176475336051, |
| "learning_rate": 1.6138026610929446e-06, |
| "loss": 0.1377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12204622477293015, |
| "step": 3900, |
| "valid_targets_mean": 6026.9, |
| "valid_targets_min": 1789 |
| }, |
| { |
| "epoch": 6.198412698412699, |
| "grad_norm": 0.7688468165385852, |
| "learning_rate": 1.5827972017658732e-06, |
| "loss": 0.1434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14009518921375275, |
| "step": 3905, |
| "valid_targets_mean": 5232.4, |
| "valid_targets_min": 609 |
| }, |
| { |
| "epoch": 6.2063492063492065, |
| "grad_norm": 0.5742634408323547, |
| "learning_rate": 1.5520802124422108e-06, |
| "loss": 0.1284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11271405220031738, |
| "step": 3910, |
| "valid_targets_mean": 5412.1, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 6.214285714285714, |
| "grad_norm": 0.4434637011482024, |
| "learning_rate": 1.5216521742444236e-06, |
| "loss": 0.1266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15959657728672028, |
| "step": 3915, |
| "valid_targets_mean": 5545.5, |
| "valid_targets_min": 366 |
| }, |
| { |
| "epoch": 6.222222222222222, |
| "grad_norm": 0.4473257762920866, |
| "learning_rate": 1.491513563769118e-06, |
| "loss": 0.1277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13596297800540924, |
| "step": 3920, |
| "valid_targets_mean": 6079.2, |
| "valid_targets_min": 1352 |
| }, |
| { |
| "epoch": 6.23015873015873, |
| "grad_norm": 0.40218956890406166, |
| "learning_rate": 1.4616648530795673e-06, |
| "loss": 0.1367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13123834133148193, |
| "step": 3925, |
| "valid_targets_mean": 6588.4, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 6.238095238095238, |
| "grad_norm": 0.4665917089898694, |
| "learning_rate": 1.432106509698319e-06, |
| "loss": 0.1403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14458967745304108, |
| "step": 3930, |
| "valid_targets_mean": 5620.0, |
| "valid_targets_min": 2860 |
| }, |
| { |
| "epoch": 6.246031746031746, |
| "grad_norm": 0.4804278259544632, |
| "learning_rate": 1.4028389965998867e-06, |
| "loss": 0.1322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13646945357322693, |
| "step": 3935, |
| "valid_targets_mean": 4918.8, |
| "valid_targets_min": 2109 |
| }, |
| { |
| "epoch": 6.253968253968254, |
| "grad_norm": 0.4573452936493578, |
| "learning_rate": 1.3738627722034848e-06, |
| "loss": 0.1378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12479956448078156, |
| "step": 3940, |
| "valid_targets_mean": 5664.0, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 6.261904761904762, |
| "grad_norm": 0.4112194821979111, |
| "learning_rate": 1.345178290365845e-06, |
| "loss": 0.1303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12601318955421448, |
| "step": 3945, |
| "valid_targets_mean": 5897.8, |
| "valid_targets_min": 2441 |
| }, |
| { |
| "epoch": 6.26984126984127, |
| "grad_norm": 0.43770788181094994, |
| "learning_rate": 1.3167860003741218e-06, |
| "loss": 0.1333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13687068223953247, |
| "step": 3950, |
| "valid_targets_mean": 5294.8, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 6.277777777777778, |
| "grad_norm": 0.43651984734406524, |
| "learning_rate": 1.2886863469388389e-06, |
| "loss": 0.1357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13095057010650635, |
| "step": 3955, |
| "valid_targets_mean": 5041.6, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 6.285714285714286, |
| "grad_norm": 0.4407006248372022, |
| "learning_rate": 1.2608797701869425e-06, |
| "loss": 0.1454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13327287137508392, |
| "step": 3960, |
| "valid_targets_mean": 5152.8, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 6.2936507936507935, |
| "grad_norm": 0.4830750093647113, |
| "learning_rate": 1.2333667056548881e-06, |
| "loss": 0.1391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12351542711257935, |
| "step": 3965, |
| "valid_targets_mean": 4494.3, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 6.301587301587301, |
| "grad_norm": 0.4721717415354756, |
| "learning_rate": 1.2061475842818337e-06, |
| "loss": 0.1466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15659388899803162, |
| "step": 3970, |
| "valid_targets_mean": 5026.2, |
| "valid_targets_min": 1775 |
| }, |
| { |
| "epoch": 6.309523809523809, |
| "grad_norm": 0.42311493337432965, |
| "learning_rate": 1.1792228324028776e-06, |
| "loss": 0.1289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15567630529403687, |
| "step": 3975, |
| "valid_targets_mean": 5791.2, |
| "valid_targets_min": 3515 |
| }, |
| { |
| "epoch": 6.317460317460317, |
| "grad_norm": 1.4585742478929205, |
| "learning_rate": 1.152592871742395e-06, |
| "loss": 0.133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13825181126594543, |
| "step": 3980, |
| "valid_targets_mean": 5244.9, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 6.325396825396825, |
| "grad_norm": 0.461117951811656, |
| "learning_rate": 1.1262581194074152e-06, |
| "loss": 0.131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11796639859676361, |
| "step": 3985, |
| "valid_targets_mean": 5554.2, |
| "valid_targets_min": 2245 |
| }, |
| { |
| "epoch": 6.333333333333333, |
| "grad_norm": 0.47633924217416224, |
| "learning_rate": 1.100218987881112e-06, |
| "loss": 0.1325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12955845892429352, |
| "step": 3990, |
| "valid_targets_mean": 6029.9, |
| "valid_targets_min": 2670 |
| }, |
| { |
| "epoch": 6.341269841269841, |
| "grad_norm": 0.45154703338066743, |
| "learning_rate": 1.0744758850163085e-06, |
| "loss": 0.1408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13291522860527039, |
| "step": 3995, |
| "valid_targets_mean": 5422.9, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 6.349206349206349, |
| "grad_norm": 0.5119900863580499, |
| "learning_rate": 1.0490292140291247e-06, |
| "loss": 0.1382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13096119463443756, |
| "step": 4000, |
| "valid_targets_mean": 5480.8, |
| "valid_targets_min": 291 |
| }, |
| { |
| "epoch": 6.357142857142857, |
| "grad_norm": 0.5126206204332201, |
| "learning_rate": 1.0238793734926467e-06, |
| "loss": 0.13, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14911425113677979, |
| "step": 4005, |
| "valid_targets_mean": 4797.0, |
| "valid_targets_min": 1266 |
| }, |
| { |
| "epoch": 6.365079365079365, |
| "grad_norm": 0.4880357246785836, |
| "learning_rate": 9.990267573306745e-07, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1387421041727066, |
| "step": 4010, |
| "valid_targets_mean": 4544.9, |
| "valid_targets_min": 690 |
| }, |
| { |
| "epoch": 6.3730158730158735, |
| "grad_norm": 0.40558138018757806, |
| "learning_rate": 9.744717548115613e-07, |
| "loss": 0.1278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12570391595363617, |
| "step": 4015, |
| "valid_targets_mean": 6268.6, |
| "valid_targets_min": 3291 |
| }, |
| { |
| "epoch": 6.380952380952381, |
| "grad_norm": 0.41810620070165866, |
| "learning_rate": 9.502147505421244e-07, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1270408034324646, |
| "step": 4020, |
| "valid_targets_mean": 6078.6, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 6.388888888888889, |
| "grad_norm": 0.4496644146071595, |
| "learning_rate": 9.262561244616108e-07, |
| "loss": 0.133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14739742875099182, |
| "step": 4025, |
| "valid_targets_mean": 5835.8, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 6.396825396825397, |
| "grad_norm": 0.45373871441149133, |
| "learning_rate": 9.025962518357323e-07, |
| "loss": 0.1241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11742935329675674, |
| "step": 4030, |
| "valid_targets_mean": 4566.4, |
| "valid_targets_min": 290 |
| }, |
| { |
| "epoch": 6.404761904761905, |
| "grad_norm": 0.4617395683182264, |
| "learning_rate": 8.792355032508282e-07, |
| "loss": 0.1362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12306074798107147, |
| "step": 4035, |
| "valid_targets_mean": 5038.2, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 6.412698412698413, |
| "grad_norm": 0.4644079416505595, |
| "learning_rate": 8.561742446080168e-07, |
| "loss": 0.1282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1280827522277832, |
| "step": 4040, |
| "valid_targets_mean": 5057.6, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 6.420634920634921, |
| "grad_norm": 0.425213082782362, |
| "learning_rate": 8.334128371174955e-07, |
| "loss": 0.1418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14657798409461975, |
| "step": 4045, |
| "valid_targets_mean": 6001.6, |
| "valid_targets_min": 582 |
| }, |
| { |
| "epoch": 6.428571428571429, |
| "grad_norm": 0.428425934530618, |
| "learning_rate": 8.109516372928605e-07, |
| "loss": 0.1309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13139371573925018, |
| "step": 4050, |
| "valid_targets_mean": 5651.9, |
| "valid_targets_min": 2298 |
| }, |
| { |
| "epoch": 6.436507936507937, |
| "grad_norm": 0.4405821827658464, |
| "learning_rate": 7.887909969455366e-07, |
| "loss": 0.1326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12469398230314255, |
| "step": 4055, |
| "valid_targets_mean": 5376.2, |
| "valid_targets_min": 267 |
| }, |
| { |
| "epoch": 6.444444444444445, |
| "grad_norm": 0.5057128403035726, |
| "learning_rate": 7.669312631792758e-07, |
| "loss": 0.14, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14254549145698547, |
| "step": 4060, |
| "valid_targets_mean": 5674.9, |
| "valid_targets_min": 2241 |
| }, |
| { |
| "epoch": 6.4523809523809526, |
| "grad_norm": 0.615770615958985, |
| "learning_rate": 7.453727783846876e-07, |
| "loss": 0.1439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1313585788011551, |
| "step": 4065, |
| "valid_targets_mean": 5325.8, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 6.4603174603174605, |
| "grad_norm": 0.4640004582080486, |
| "learning_rate": 7.241158802339065e-07, |
| "loss": 0.1406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14738494157791138, |
| "step": 4070, |
| "valid_targets_mean": 5742.9, |
| "valid_targets_min": 297 |
| }, |
| { |
| "epoch": 6.468253968253968, |
| "grad_norm": 0.44707812759358856, |
| "learning_rate": 7.031609016753016e-07, |
| "loss": 0.1372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1283096969127655, |
| "step": 4075, |
| "valid_targets_mean": 5941.6, |
| "valid_targets_min": 2715 |
| }, |
| { |
| "epoch": 6.476190476190476, |
| "grad_norm": 0.5025741831025621, |
| "learning_rate": 6.825081709282377e-07, |
| "loss": 0.1384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14924189448356628, |
| "step": 4080, |
| "valid_targets_mean": 5481.9, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 6.484126984126984, |
| "grad_norm": 0.4928322290987037, |
| "learning_rate": 6.62158011477958e-07, |
| "loss": 0.1391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14254453778266907, |
| "step": 4085, |
| "valid_targets_mean": 5396.4, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 6.492063492063492, |
| "grad_norm": 0.4463090392869717, |
| "learning_rate": 6.421107420705097e-07, |
| "loss": 0.139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1291046142578125, |
| "step": 4090, |
| "valid_targets_mean": 5304.8, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 6.5, |
| "grad_norm": 0.41940627052314144, |
| "learning_rate": 6.223666767077508e-07, |
| "loss": 0.1369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1368085891008377, |
| "step": 4095, |
| "valid_targets_mean": 5791.9, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 6.507936507936508, |
| "grad_norm": 0.38633976220944566, |
| "learning_rate": 6.029261246424267e-07, |
| "loss": 0.1254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11674937605857849, |
| "step": 4100, |
| "valid_targets_mean": 7173.1, |
| "valid_targets_min": 3321 |
| }, |
| { |
| "epoch": 6.515873015873016, |
| "grad_norm": 0.5710755866104514, |
| "learning_rate": 5.837893903733394e-07, |
| "loss": 0.1398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14703723788261414, |
| "step": 4105, |
| "valid_targets_mean": 4992.6, |
| "valid_targets_min": 251 |
| }, |
| { |
| "epoch": 6.523809523809524, |
| "grad_norm": 0.42790485901259206, |
| "learning_rate": 5.649567736405681e-07, |
| "loss": 0.1345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11689166724681854, |
| "step": 4110, |
| "valid_targets_mean": 5996.3, |
| "valid_targets_min": 3073 |
| }, |
| { |
| "epoch": 6.531746031746032, |
| "grad_norm": 0.3978542753238711, |
| "learning_rate": 5.464285694207672e-07, |
| "loss": 0.1299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12328889966011047, |
| "step": 4115, |
| "valid_targets_mean": 6366.9, |
| "valid_targets_min": 2921 |
| }, |
| { |
| "epoch": 6.5396825396825395, |
| "grad_norm": 0.4803261314786915, |
| "learning_rate": 5.282050679225714e-07, |
| "loss": 0.1332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13136357069015503, |
| "step": 4120, |
| "valid_targets_mean": 5456.8, |
| "valid_targets_min": 1746 |
| }, |
| { |
| "epoch": 6.5476190476190474, |
| "grad_norm": 0.3906973340150284, |
| "learning_rate": 5.102865545820245e-07, |
| "loss": 0.13, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12256291508674622, |
| "step": 4125, |
| "valid_targets_mean": 6359.6, |
| "valid_targets_min": 2305 |
| }, |
| { |
| "epoch": 6.555555555555555, |
| "grad_norm": 0.4059594097865994, |
| "learning_rate": 4.926733100581182e-07, |
| "loss": 0.1378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11908716708421707, |
| "step": 4130, |
| "valid_targets_mean": 6355.2, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 6.563492063492063, |
| "grad_norm": 0.5832130007483879, |
| "learning_rate": 4.7536561022840213e-07, |
| "loss": 0.1346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13830284774303436, |
| "step": 4135, |
| "valid_targets_mean": 4896.4, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 6.571428571428571, |
| "grad_norm": 0.4059800621113446, |
| "learning_rate": 4.5836372618464964e-07, |
| "loss": 0.1336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12423016875982285, |
| "step": 4140, |
| "valid_targets_mean": 6594.7, |
| "valid_targets_min": 3811 |
| }, |
| { |
| "epoch": 6.579365079365079, |
| "grad_norm": 0.4185374589094962, |
| "learning_rate": 4.416679242286215e-07, |
| "loss": 0.1279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13419991731643677, |
| "step": 4145, |
| "valid_targets_mean": 6087.1, |
| "valid_targets_min": 2433 |
| }, |
| { |
| "epoch": 6.587301587301587, |
| "grad_norm": 0.5103870835544566, |
| "learning_rate": 4.2527846586789547e-07, |
| "loss": 0.136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14000031352043152, |
| "step": 4150, |
| "valid_targets_mean": 4625.3, |
| "valid_targets_min": 221 |
| }, |
| { |
| "epoch": 6.595238095238095, |
| "grad_norm": 0.5765993905041488, |
| "learning_rate": 4.0919560781176317e-07, |
| "loss": 0.1312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13032563030719757, |
| "step": 4155, |
| "valid_targets_mean": 5195.4, |
| "valid_targets_min": 1443 |
| }, |
| { |
| "epoch": 6.603174603174603, |
| "grad_norm": 0.48593436180980204, |
| "learning_rate": 3.934196019672176e-07, |
| "loss": 0.1267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13097088038921356, |
| "step": 4160, |
| "valid_targets_mean": 4735.8, |
| "valid_targets_min": 1686 |
| }, |
| { |
| "epoch": 6.611111111111111, |
| "grad_norm": 0.4395609496182445, |
| "learning_rate": 3.779506954349965e-07, |
| "loss": 0.1357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12398695945739746, |
| "step": 4165, |
| "valid_targets_mean": 6392.1, |
| "valid_targets_min": 2819 |
| }, |
| { |
| "epoch": 6.619047619047619, |
| "grad_norm": 0.47600560032316025, |
| "learning_rate": 3.6278913050572076e-07, |
| "loss": 0.1377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1410660743713379, |
| "step": 4170, |
| "valid_targets_mean": 4714.9, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 6.6269841269841265, |
| "grad_norm": 0.4626328635010138, |
| "learning_rate": 3.4793514465610414e-07, |
| "loss": 0.1227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12245401740074158, |
| "step": 4175, |
| "valid_targets_mean": 5662.9, |
| "valid_targets_min": 1293 |
| }, |
| { |
| "epoch": 6.634920634920634, |
| "grad_norm": 0.4856477089680751, |
| "learning_rate": 3.3338897054521205e-07, |
| "loss": 0.1445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12981770932674408, |
| "step": 4180, |
| "valid_targets_mean": 6161.9, |
| "valid_targets_min": 1672 |
| }, |
| { |
| "epoch": 6.642857142857143, |
| "grad_norm": 0.4382225877662096, |
| "learning_rate": 3.191508360108464e-07, |
| "loss": 0.1265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12940582633018494, |
| "step": 4185, |
| "valid_targets_mean": 5541.3, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 6.650793650793651, |
| "grad_norm": 0.4467797690671947, |
| "learning_rate": 3.0522096406595536e-07, |
| "loss": 0.1249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12461797893047333, |
| "step": 4190, |
| "valid_targets_mean": 5350.9, |
| "valid_targets_min": 1531 |
| }, |
| { |
| "epoch": 6.658730158730159, |
| "grad_norm": 0.4315640371338101, |
| "learning_rate": 2.9159957289514926e-07, |
| "loss": 0.1307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1185673251748085, |
| "step": 4195, |
| "valid_targets_mean": 5560.6, |
| "valid_targets_min": 2700 |
| }, |
| { |
| "epoch": 6.666666666666667, |
| "grad_norm": 0.48404703695546003, |
| "learning_rate": 2.782868758512791e-07, |
| "loss": 0.1374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13700520992279053, |
| "step": 4200, |
| "valid_targets_mean": 5088.4, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 6.674603174603175, |
| "grad_norm": 0.4561326307439442, |
| "learning_rate": 2.6528308145210125e-07, |
| "loss": 0.1336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14443397521972656, |
| "step": 4205, |
| "valid_targets_mean": 5388.9, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 6.682539682539683, |
| "grad_norm": 0.4432184683642521, |
| "learning_rate": 2.525883933770046e-07, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13129255175590515, |
| "step": 4210, |
| "valid_targets_mean": 6560.8, |
| "valid_targets_min": 2872 |
| }, |
| { |
| "epoch": 6.690476190476191, |
| "grad_norm": 0.4428498025907347, |
| "learning_rate": 2.402030104638198e-07, |
| "loss": 0.1281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1193118616938591, |
| "step": 4215, |
| "valid_targets_mean": 5178.1, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 6.698412698412699, |
| "grad_norm": 0.4342898053436231, |
| "learning_rate": 2.2812712670571502e-07, |
| "loss": 0.1307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13040482997894287, |
| "step": 4220, |
| "valid_targets_mean": 5622.1, |
| "valid_targets_min": 2496 |
| }, |
| { |
| "epoch": 6.7063492063492065, |
| "grad_norm": 2.0764732196910196, |
| "learning_rate": 2.1636093124814738e-07, |
| "loss": 0.136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12159843742847443, |
| "step": 4225, |
| "valid_targets_mean": 5518.6, |
| "valid_targets_min": 1795 |
| }, |
| { |
| "epoch": 6.714285714285714, |
| "grad_norm": 0.4586433877189939, |
| "learning_rate": 2.0490460838589855e-07, |
| "loss": 0.1337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12682956457138062, |
| "step": 4230, |
| "valid_targets_mean": 4948.1, |
| "valid_targets_min": 1032 |
| }, |
| { |
| "epoch": 6.722222222222222, |
| "grad_norm": 0.47132990810816733, |
| "learning_rate": 1.9375833756019923e-07, |
| "loss": 0.1348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15487657487392426, |
| "step": 4235, |
| "valid_targets_mean": 4774.9, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 6.73015873015873, |
| "grad_norm": 0.4124840094163903, |
| "learning_rate": 1.8292229335590716e-07, |
| "loss": 0.1351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11652678996324539, |
| "step": 4240, |
| "valid_targets_mean": 6393.1, |
| "valid_targets_min": 3197 |
| }, |
| { |
| "epoch": 6.738095238095238, |
| "grad_norm": 0.4350958770760526, |
| "learning_rate": 1.7239664549878688e-07, |
| "loss": 0.1297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1278618425130844, |
| "step": 4245, |
| "valid_targets_mean": 5711.4, |
| "valid_targets_min": 307 |
| }, |
| { |
| "epoch": 6.746031746031746, |
| "grad_norm": 0.4380389060922931, |
| "learning_rate": 1.6218155885283192e-07, |
| "loss": 0.1333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1238991990685463, |
| "step": 4250, |
| "valid_targets_mean": 5243.3, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 6.753968253968254, |
| "grad_norm": 0.45207585431063574, |
| "learning_rate": 1.5227719341769364e-07, |
| "loss": 0.1406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12772828340530396, |
| "step": 4255, |
| "valid_targets_mean": 6135.6, |
| "valid_targets_min": 2455 |
| }, |
| { |
| "epoch": 6.761904761904762, |
| "grad_norm": 0.48236608264345426, |
| "learning_rate": 1.4268370432618306e-07, |
| "loss": 0.1464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14505012333393097, |
| "step": 4260, |
| "valid_targets_mean": 4687.0, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 6.76984126984127, |
| "grad_norm": 0.4233867675421516, |
| "learning_rate": 1.3340124184182178e-07, |
| "loss": 0.1289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12908919155597687, |
| "step": 4265, |
| "valid_targets_mean": 6025.6, |
| "valid_targets_min": 2257 |
| }, |
| { |
| "epoch": 6.777777777777778, |
| "grad_norm": 0.4877416792035469, |
| "learning_rate": 1.2442995135650393e-07, |
| "loss": 0.1296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15760302543640137, |
| "step": 4270, |
| "valid_targets_mean": 4828.7, |
| "valid_targets_min": 268 |
| }, |
| { |
| "epoch": 6.785714285714286, |
| "grad_norm": 0.6506490177567913, |
| "learning_rate": 1.1576997338821339e-07, |
| "loss": 0.1364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13028597831726074, |
| "step": 4275, |
| "valid_targets_mean": 5155.9, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 6.7936507936507935, |
| "grad_norm": 0.4477970591498348, |
| "learning_rate": 1.0742144357882567e-07, |
| "loss": 0.1401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1585049331188202, |
| "step": 4280, |
| "valid_targets_mean": 5534.2, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 6.801587301587301, |
| "grad_norm": 0.49507868999640176, |
| "learning_rate": 9.938449269197181e-08, |
| "loss": 0.1258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1410304307937622, |
| "step": 4285, |
| "valid_targets_mean": 4884.3, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 6.809523809523809, |
| "grad_norm": 0.4842993936056907, |
| "learning_rate": 9.165924661100889e-08, |
| "loss": 0.1347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12479911744594574, |
| "step": 4290, |
| "valid_targets_mean": 5132.9, |
| "valid_targets_min": 397 |
| }, |
| { |
| "epoch": 6.817460317460317, |
| "grad_norm": 0.43326494078340105, |
| "learning_rate": 8.424582633703493e-08, |
| "loss": 0.1291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13402575254440308, |
| "step": 4295, |
| "valid_targets_mean": 5267.1, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 6.825396825396825, |
| "grad_norm": 0.39800154553874223, |
| "learning_rate": 7.714434798699933e-08, |
| "loss": 0.1228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12014246731996536, |
| "step": 4300, |
| "valid_targets_mean": 6144.5, |
| "valid_targets_min": 2815 |
| }, |
| { |
| "epoch": 6.833333333333333, |
| "grad_norm": 0.42208852936776803, |
| "learning_rate": 7.035492279187538e-08, |
| "loss": 0.1331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12092911452054977, |
| "step": 4305, |
| "valid_targets_mean": 5618.4, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 6.841269841269841, |
| "grad_norm": 0.5061623759467122, |
| "learning_rate": 6.387765709493288e-08, |
| "loss": 0.1362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13144025206565857, |
| "step": 4310, |
| "valid_targets_mean": 5299.0, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 6.849206349206349, |
| "grad_norm": 0.4703474965866674, |
| "learning_rate": 5.7712652350061515e-08, |
| "loss": 0.1368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14938583970069885, |
| "step": 4315, |
| "valid_targets_mean": 4459.2, |
| "valid_targets_min": 229 |
| }, |
| { |
| "epoch": 6.857142857142857, |
| "grad_norm": 0.4544153706399285, |
| "learning_rate": 5.186000512018341e-08, |
| "loss": 0.1304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13210490345954895, |
| "step": 4320, |
| "valid_targets_mean": 5968.1, |
| "valid_targets_min": 1966 |
| }, |
| { |
| "epoch": 6.865079365079366, |
| "grad_norm": 0.3951693224390717, |
| "learning_rate": 4.631980707574535e-08, |
| "loss": 0.1222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10764377564191818, |
| "step": 4325, |
| "valid_targets_mean": 6102.2, |
| "valid_targets_min": 281 |
| }, |
| { |
| "epoch": 6.8730158730158735, |
| "grad_norm": 0.47764153403255666, |
| "learning_rate": 4.10921449932733e-08, |
| "loss": 0.1415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13427546620368958, |
| "step": 4330, |
| "valid_targets_mean": 4686.6, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 6.880952380952381, |
| "grad_norm": 0.4686718928282114, |
| "learning_rate": 3.61771007540268e-08, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12770965695381165, |
| "step": 4335, |
| "valid_targets_mean": 5458.8, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 6.888888888888889, |
| "grad_norm": 0.45215811836727576, |
| "learning_rate": 3.157475134270227e-08, |
| "loss": 0.1306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14995113015174866, |
| "step": 4340, |
| "valid_targets_mean": 5664.1, |
| "valid_targets_min": 3600 |
| }, |
| { |
| "epoch": 6.896825396825397, |
| "grad_norm": 0.49008507070012214, |
| "learning_rate": 2.728516884624277e-08, |
| "loss": 0.1288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13054564595222473, |
| "step": 4345, |
| "valid_targets_mean": 5089.6, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 6.904761904761905, |
| "grad_norm": 0.48404319287292985, |
| "learning_rate": 2.3308420452690106e-08, |
| "loss": 0.1448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13617941737174988, |
| "step": 4350, |
| "valid_targets_mean": 4722.2, |
| "valid_targets_min": 1597 |
| }, |
| { |
| "epoch": 6.912698412698413, |
| "grad_norm": 0.40638533094484175, |
| "learning_rate": 1.9644568450147837e-08, |
| "loss": 0.1317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14109522104263306, |
| "step": 4355, |
| "valid_targets_mean": 6445.0, |
| "valid_targets_min": 3553 |
| }, |
| { |
| "epoch": 6.920634920634921, |
| "grad_norm": 0.4629617085369057, |
| "learning_rate": 1.6293670225799864e-08, |
| "loss": 0.1253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1260548233985901, |
| "step": 4360, |
| "valid_targets_mean": 5373.1, |
| "valid_targets_min": 543 |
| }, |
| { |
| "epoch": 6.928571428571429, |
| "grad_norm": 0.45402888146937276, |
| "learning_rate": 1.3255778265013342e-08, |
| "loss": 0.1365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14494284987449646, |
| "step": 4365, |
| "valid_targets_mean": 5725.3, |
| "valid_targets_min": 1550 |
| }, |
| { |
| "epoch": 6.936507936507937, |
| "grad_norm": 0.4086709277572136, |
| "learning_rate": 1.0530940150512703e-08, |
| "loss": 0.1352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1179996132850647, |
| "step": 4370, |
| "valid_targets_mean": 5990.4, |
| "valid_targets_min": 361 |
| }, |
| { |
| "epoch": 6.944444444444445, |
| "grad_norm": 0.42662410297325026, |
| "learning_rate": 8.119198561638009e-09, |
| "loss": 0.1466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14371398091316223, |
| "step": 4375, |
| "valid_targets_mean": 5997.8, |
| "valid_targets_min": 3437 |
| }, |
| { |
| "epoch": 6.9523809523809526, |
| "grad_norm": 0.42639557312324744, |
| "learning_rate": 6.020591273674381e-09, |
| "loss": 0.1317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1339547336101532, |
| "step": 4380, |
| "valid_targets_mean": 6416.2, |
| "valid_targets_min": 609 |
| }, |
| { |
| "epoch": 6.9603174603174605, |
| "grad_norm": 0.4092765044556627, |
| "learning_rate": 4.2351511572635835e-09, |
| "loss": 0.1359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10867651551961899, |
| "step": 4385, |
| "valid_targets_mean": 6632.2, |
| "valid_targets_min": 1370 |
| }, |
| { |
| "epoch": 6.968253968253968, |
| "grad_norm": 0.4951156195990528, |
| "learning_rate": 2.7629061778866597e-09, |
| "loss": 0.1432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1670551598072052, |
| "step": 4390, |
| "valid_targets_mean": 5063.4, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 6.976190476190476, |
| "grad_norm": 0.5279789366650457, |
| "learning_rate": 1.603879395422059e-09, |
| "loss": 0.134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14463752508163452, |
| "step": 4395, |
| "valid_targets_mean": 4726.2, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 6.984126984126984, |
| "grad_norm": 0.43870727411718197, |
| "learning_rate": 7.580889637925914e-10, |
| "loss": 0.1397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14193710684776306, |
| "step": 4400, |
| "valid_targets_mean": 5203.9, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 6.992063492063492, |
| "grad_norm": 0.4604903629839532, |
| "learning_rate": 2.2554813067676705e-10, |
| "loss": 0.1268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1437646746635437, |
| "step": 4405, |
| "valid_targets_mean": 5522.9, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 7.0, |
| "grad_norm": 0.4923560486700678, |
| "learning_rate": 6.265237300073778e-12, |
| "loss": 0.1497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15846839547157288, |
| "step": 4410, |
| "valid_targets_mean": 5295.1, |
| "valid_targets_min": 1258 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15846839547157288, |
| "step": 4410, |
| "total_flos": 1765744004825088.0, |
| "train_loss": 0.17469855595608147, |
| "train_runtime": 27741.8701, |
| "train_samples_per_second": 2.541, |
| "train_steps_per_second": 0.159, |
| "valid_targets_mean": 5295.1, |
| "valid_targets_min": 1258 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4410, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1765744004825088.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|