| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4410, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.007936507936507936, |
| "grad_norm": 7.791894551319325, |
| "learning_rate": 3.6281179138322e-07, |
| "loss": 0.7972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3812609314918518, |
| "step": 5, |
| "valid_targets_mean": 2755.6, |
| "valid_targets_min": 1231 |
| }, |
| { |
| "epoch": 0.015873015873015872, |
| "grad_norm": 7.455912538367786, |
| "learning_rate": 8.163265306122449e-07, |
| "loss": 0.8212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37411224842071533, |
| "step": 10, |
| "valid_targets_mean": 3696.9, |
| "valid_targets_min": 1315 |
| }, |
| { |
| "epoch": 0.023809523809523808, |
| "grad_norm": 7.4947876547841865, |
| "learning_rate": 1.26984126984127e-06, |
| "loss": 0.798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37891465425491333, |
| "step": 15, |
| "valid_targets_mean": 3647.1, |
| "valid_targets_min": 1396 |
| }, |
| { |
| "epoch": 0.031746031746031744, |
| "grad_norm": 5.997591663796195, |
| "learning_rate": 1.723356009070295e-06, |
| "loss": 0.7689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33539754152297974, |
| "step": 20, |
| "valid_targets_mean": 2617.8, |
| "valid_targets_min": 1177 |
| }, |
| { |
| "epoch": 0.03968253968253968, |
| "grad_norm": 4.498581839487113, |
| "learning_rate": 2.17687074829932e-06, |
| "loss": 0.7181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38529515266418457, |
| "step": 25, |
| "valid_targets_mean": 3182.4, |
| "valid_targets_min": 2220 |
| }, |
| { |
| "epoch": 0.047619047619047616, |
| "grad_norm": 3.279401177139959, |
| "learning_rate": 2.6303854875283447e-06, |
| "loss": 0.6841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3477422297000885, |
| "step": 30, |
| "valid_targets_mean": 3296.5, |
| "valid_targets_min": 1629 |
| }, |
| { |
| "epoch": 0.05555555555555555, |
| "grad_norm": 2.65642172394517, |
| "learning_rate": 3.08390022675737e-06, |
| "loss": 0.697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3257293105125427, |
| "step": 35, |
| "valid_targets_mean": 3436.6, |
| "valid_targets_min": 1517 |
| }, |
| { |
| "epoch": 0.06349206349206349, |
| "grad_norm": 2.141011741114798, |
| "learning_rate": 3.537414965986395e-06, |
| "loss": 0.6551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3501768410205841, |
| "step": 40, |
| "valid_targets_mean": 3314.8, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 0.07142857142857142, |
| "grad_norm": 1.4253116818930238, |
| "learning_rate": 3.99092970521542e-06, |
| "loss": 0.6421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22955095767974854, |
| "step": 45, |
| "valid_targets_mean": 2430.1, |
| "valid_targets_min": 1407 |
| }, |
| { |
| "epoch": 0.07936507936507936, |
| "grad_norm": 1.144109550309547, |
| "learning_rate": 4.444444444444444e-06, |
| "loss": 0.6267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2753365933895111, |
| "step": 50, |
| "valid_targets_mean": 3324.9, |
| "valid_targets_min": 1255 |
| }, |
| { |
| "epoch": 0.0873015873015873, |
| "grad_norm": 1.0559927514309588, |
| "learning_rate": 4.897959183673469e-06, |
| "loss": 0.5787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3343765139579773, |
| "step": 55, |
| "valid_targets_mean": 3959.4, |
| "valid_targets_min": 1390 |
| }, |
| { |
| "epoch": 0.09523809523809523, |
| "grad_norm": 1.089174983738798, |
| "learning_rate": 5.3514739229024945e-06, |
| "loss": 0.5769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2921941876411438, |
| "step": 60, |
| "valid_targets_mean": 2628.2, |
| "valid_targets_min": 1050 |
| }, |
| { |
| "epoch": 0.10317460317460317, |
| "grad_norm": 0.9352039163105647, |
| "learning_rate": 5.80498866213152e-06, |
| "loss": 0.5802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31847676634788513, |
| "step": 65, |
| "valid_targets_mean": 5229.6, |
| "valid_targets_min": 2258 |
| }, |
| { |
| "epoch": 0.1111111111111111, |
| "grad_norm": 0.7821250269316058, |
| "learning_rate": 6.258503401360545e-06, |
| "loss": 0.5822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24337267875671387, |
| "step": 70, |
| "valid_targets_mean": 3637.1, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 0.11904761904761904, |
| "grad_norm": 0.8049140841034186, |
| "learning_rate": 6.71201814058957e-06, |
| "loss": 0.5711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31313028931617737, |
| "step": 75, |
| "valid_targets_mean": 3684.1, |
| "valid_targets_min": 1474 |
| }, |
| { |
| "epoch": 0.12698412698412698, |
| "grad_norm": 0.9345065106303573, |
| "learning_rate": 7.165532879818595e-06, |
| "loss": 0.5511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2718881070613861, |
| "step": 80, |
| "valid_targets_mean": 2535.2, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 0.1349206349206349, |
| "grad_norm": 0.7003907932134493, |
| "learning_rate": 7.61904761904762e-06, |
| "loss": 0.5241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26534807682037354, |
| "step": 85, |
| "valid_targets_mean": 4012.6, |
| "valid_targets_min": 2198 |
| }, |
| { |
| "epoch": 0.14285714285714285, |
| "grad_norm": 0.7511620568435198, |
| "learning_rate": 8.072562358276645e-06, |
| "loss": 0.5339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23427170515060425, |
| "step": 90, |
| "valid_targets_mean": 2802.2, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 0.15079365079365079, |
| "grad_norm": 0.8328109025616128, |
| "learning_rate": 8.52607709750567e-06, |
| "loss": 0.5245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2510078549385071, |
| "step": 95, |
| "valid_targets_mean": 2489.6, |
| "valid_targets_min": 1273 |
| }, |
| { |
| "epoch": 0.15873015873015872, |
| "grad_norm": 0.7816118772554373, |
| "learning_rate": 8.979591836734695e-06, |
| "loss": 0.4958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29513928294181824, |
| "step": 100, |
| "valid_targets_mean": 3522.4, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 0.16666666666666666, |
| "grad_norm": 0.7279446724813006, |
| "learning_rate": 9.43310657596372e-06, |
| "loss": 0.5014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23042386770248413, |
| "step": 105, |
| "valid_targets_mean": 3128.6, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 0.1746031746031746, |
| "grad_norm": 0.5890418553585118, |
| "learning_rate": 9.886621315192746e-06, |
| "loss": 0.4927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21733567118644714, |
| "step": 110, |
| "valid_targets_mean": 4134.9, |
| "valid_targets_min": 1335 |
| }, |
| { |
| "epoch": 0.18253968253968253, |
| "grad_norm": 0.7116158842930445, |
| "learning_rate": 1.034013605442177e-05, |
| "loss": 0.4823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22764775156974792, |
| "step": 115, |
| "valid_targets_mean": 4014.4, |
| "valid_targets_min": 1400 |
| }, |
| { |
| "epoch": 0.19047619047619047, |
| "grad_norm": 0.8008016401079758, |
| "learning_rate": 1.0793650793650794e-05, |
| "loss": 0.4857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24580729007720947, |
| "step": 120, |
| "valid_targets_mean": 2738.6, |
| "valid_targets_min": 838 |
| }, |
| { |
| "epoch": 0.1984126984126984, |
| "grad_norm": 0.6667752435108454, |
| "learning_rate": 1.124716553287982e-05, |
| "loss": 0.4606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22335901856422424, |
| "step": 125, |
| "valid_targets_mean": 5113.5, |
| "valid_targets_min": 1774 |
| }, |
| { |
| "epoch": 0.20634920634920634, |
| "grad_norm": 0.7810365614559169, |
| "learning_rate": 1.1700680272108845e-05, |
| "loss": 0.4855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30480098724365234, |
| "step": 130, |
| "valid_targets_mean": 4073.2, |
| "valid_targets_min": 1473 |
| }, |
| { |
| "epoch": 0.21428571428571427, |
| "grad_norm": 0.5971746973534208, |
| "learning_rate": 1.215419501133787e-05, |
| "loss": 0.4614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14763841032981873, |
| "step": 135, |
| "valid_targets_mean": 3988.2, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 0.2222222222222222, |
| "grad_norm": 0.6922843878731343, |
| "learning_rate": 1.2607709750566895e-05, |
| "loss": 0.4444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2036367654800415, |
| "step": 140, |
| "valid_targets_mean": 3281.9, |
| "valid_targets_min": 1672 |
| }, |
| { |
| "epoch": 0.23015873015873015, |
| "grad_norm": 0.6226231983750194, |
| "learning_rate": 1.3061224489795918e-05, |
| "loss": 0.4632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24707484245300293, |
| "step": 145, |
| "valid_targets_mean": 4809.4, |
| "valid_targets_min": 1577 |
| }, |
| { |
| "epoch": 0.23809523809523808, |
| "grad_norm": 0.8326186713780263, |
| "learning_rate": 1.3514739229024945e-05, |
| "loss": 0.4941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23414701223373413, |
| "step": 150, |
| "valid_targets_mean": 3326.1, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 0.24603174603174602, |
| "grad_norm": 0.6395050003229518, |
| "learning_rate": 1.3968253968253968e-05, |
| "loss": 0.444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22398585081100464, |
| "step": 155, |
| "valid_targets_mean": 3925.0, |
| "valid_targets_min": 486 |
| }, |
| { |
| "epoch": 0.25396825396825395, |
| "grad_norm": 0.9256622944985334, |
| "learning_rate": 1.4421768707482994e-05, |
| "loss": 0.4619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29537683725357056, |
| "step": 160, |
| "valid_targets_mean": 2947.2, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 0.2619047619047619, |
| "grad_norm": 0.7551814432848716, |
| "learning_rate": 1.4875283446712018e-05, |
| "loss": 0.463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23746734857559204, |
| "step": 165, |
| "valid_targets_mean": 3384.1, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 0.2698412698412698, |
| "grad_norm": 0.7006392151761067, |
| "learning_rate": 1.5328798185941044e-05, |
| "loss": 0.449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23496189713478088, |
| "step": 170, |
| "valid_targets_mean": 3901.6, |
| "valid_targets_min": 1496 |
| }, |
| { |
| "epoch": 0.2777777777777778, |
| "grad_norm": 0.6782345715181035, |
| "learning_rate": 1.578231292517007e-05, |
| "loss": 0.4643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2183074653148651, |
| "step": 175, |
| "valid_targets_mean": 3844.2, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 0.2857142857142857, |
| "grad_norm": 0.7454470024354803, |
| "learning_rate": 1.6235827664399097e-05, |
| "loss": 0.4341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22839799523353577, |
| "step": 180, |
| "valid_targets_mean": 3672.9, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 0.29365079365079366, |
| "grad_norm": 0.7104945798231723, |
| "learning_rate": 1.668934240362812e-05, |
| "loss": 0.4184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20457884669303894, |
| "step": 185, |
| "valid_targets_mean": 3345.2, |
| "valid_targets_min": 1448 |
| }, |
| { |
| "epoch": 0.30158730158730157, |
| "grad_norm": 0.8232451122305295, |
| "learning_rate": 1.7142857142857142e-05, |
| "loss": 0.4329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19103802740573883, |
| "step": 190, |
| "valid_targets_mean": 2470.0, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 0.30952380952380953, |
| "grad_norm": 0.7204209957946106, |
| "learning_rate": 1.759637188208617e-05, |
| "loss": 0.455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24723023176193237, |
| "step": 195, |
| "valid_targets_mean": 3233.0, |
| "valid_targets_min": 1414 |
| }, |
| { |
| "epoch": 0.31746031746031744, |
| "grad_norm": 0.7248505685281441, |
| "learning_rate": 1.8049886621315194e-05, |
| "loss": 0.4606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18277300894260406, |
| "step": 200, |
| "valid_targets_mean": 2704.4, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 0.3253968253968254, |
| "grad_norm": 0.8433557218499257, |
| "learning_rate": 1.8503401360544218e-05, |
| "loss": 0.4426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20108163356781006, |
| "step": 205, |
| "valid_targets_mean": 2836.4, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 0.3333333333333333, |
| "grad_norm": 0.7780860618594482, |
| "learning_rate": 1.8956916099773243e-05, |
| "loss": 0.4492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2229580283164978, |
| "step": 210, |
| "valid_targets_mean": 3097.6, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 0.3412698412698413, |
| "grad_norm": 0.7441717737312311, |
| "learning_rate": 1.941043083900227e-05, |
| "loss": 0.4214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16947849094867706, |
| "step": 215, |
| "valid_targets_mean": 2817.4, |
| "valid_targets_min": 1820 |
| }, |
| { |
| "epoch": 0.3492063492063492, |
| "grad_norm": 0.9092379058979357, |
| "learning_rate": 1.9863945578231295e-05, |
| "loss": 0.4468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2582654356956482, |
| "step": 220, |
| "valid_targets_mean": 2500.8, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 0.35714285714285715, |
| "grad_norm": 0.6589744304007081, |
| "learning_rate": 2.031746031746032e-05, |
| "loss": 0.4167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21442869305610657, |
| "step": 225, |
| "valid_targets_mean": 4276.1, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 0.36507936507936506, |
| "grad_norm": 0.6323891462731305, |
| "learning_rate": 2.0770975056689343e-05, |
| "loss": 0.4101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1991756558418274, |
| "step": 230, |
| "valid_targets_mean": 4364.2, |
| "valid_targets_min": 1985 |
| }, |
| { |
| "epoch": 0.373015873015873, |
| "grad_norm": 0.6300499913534073, |
| "learning_rate": 2.122448979591837e-05, |
| "loss": 0.4235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1824556291103363, |
| "step": 235, |
| "valid_targets_mean": 4333.2, |
| "valid_targets_min": 1767 |
| }, |
| { |
| "epoch": 0.38095238095238093, |
| "grad_norm": 0.7575279487592979, |
| "learning_rate": 2.1678004535147395e-05, |
| "loss": 0.4325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17709918320178986, |
| "step": 240, |
| "valid_targets_mean": 2336.2, |
| "valid_targets_min": 563 |
| }, |
| { |
| "epoch": 0.3888888888888889, |
| "grad_norm": 0.7262739017659442, |
| "learning_rate": 2.213151927437642e-05, |
| "loss": 0.4123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2349386066198349, |
| "step": 245, |
| "valid_targets_mean": 3695.9, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 0.3968253968253968, |
| "grad_norm": 0.6666197654683886, |
| "learning_rate": 2.2585034013605444e-05, |
| "loss": 0.4219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19883863627910614, |
| "step": 250, |
| "valid_targets_mean": 3917.5, |
| "valid_targets_min": 1650 |
| }, |
| { |
| "epoch": 0.40476190476190477, |
| "grad_norm": 0.8818322001559287, |
| "learning_rate": 2.3038548752834472e-05, |
| "loss": 0.4031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2325284481048584, |
| "step": 255, |
| "valid_targets_mean": 4317.1, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 0.4126984126984127, |
| "grad_norm": 0.8421416866948682, |
| "learning_rate": 2.3492063492063496e-05, |
| "loss": 0.4295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28885674476623535, |
| "step": 260, |
| "valid_targets_mean": 3573.9, |
| "valid_targets_min": 1326 |
| }, |
| { |
| "epoch": 0.42063492063492064, |
| "grad_norm": 0.5853157764437146, |
| "learning_rate": 2.394557823129252e-05, |
| "loss": 0.4161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15830400586128235, |
| "step": 265, |
| "valid_targets_mean": 3754.9, |
| "valid_targets_min": 1835 |
| }, |
| { |
| "epoch": 0.42857142857142855, |
| "grad_norm": 0.8503179082208167, |
| "learning_rate": 2.439909297052154e-05, |
| "loss": 0.3996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22213050723075867, |
| "step": 270, |
| "valid_targets_mean": 2988.8, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 0.4365079365079365, |
| "grad_norm": 0.7148417560197586, |
| "learning_rate": 2.4852607709750566e-05, |
| "loss": 0.4223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17101828753948212, |
| "step": 275, |
| "valid_targets_mean": 2654.6, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 0.4444444444444444, |
| "grad_norm": 0.7488294120655374, |
| "learning_rate": 2.5306122448979597e-05, |
| "loss": 0.4057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22752045094966888, |
| "step": 280, |
| "valid_targets_mean": 3658.4, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 0.4523809523809524, |
| "grad_norm": 0.819013125702064, |
| "learning_rate": 2.5759637188208618e-05, |
| "loss": 0.389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18698972463607788, |
| "step": 285, |
| "valid_targets_mean": 3620.4, |
| "valid_targets_min": 338 |
| }, |
| { |
| "epoch": 0.4603174603174603, |
| "grad_norm": 0.8764147766183873, |
| "learning_rate": 2.6213151927437642e-05, |
| "loss": 0.4258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2131589949131012, |
| "step": 290, |
| "valid_targets_mean": 2699.6, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 0.46825396825396826, |
| "grad_norm": 0.7879977167108214, |
| "learning_rate": 2.6666666666666667e-05, |
| "loss": 0.4163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1819707751274109, |
| "step": 295, |
| "valid_targets_mean": 2660.6, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 0.47619047619047616, |
| "grad_norm": 0.7627064380571622, |
| "learning_rate": 2.7120181405895694e-05, |
| "loss": 0.3933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2631428837776184, |
| "step": 300, |
| "valid_targets_mean": 4265.4, |
| "valid_targets_min": 1689 |
| }, |
| { |
| "epoch": 0.48412698412698413, |
| "grad_norm": 0.8689936550923171, |
| "learning_rate": 2.757369614512472e-05, |
| "loss": 0.396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1952773928642273, |
| "step": 305, |
| "valid_targets_mean": 3231.6, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 0.49206349206349204, |
| "grad_norm": 0.6751339015061344, |
| "learning_rate": 2.8027210884353743e-05, |
| "loss": 0.4131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20138613879680634, |
| "step": 310, |
| "valid_targets_mean": 3902.9, |
| "valid_targets_min": 1826 |
| }, |
| { |
| "epoch": 0.5, |
| "grad_norm": 0.8543806139476121, |
| "learning_rate": 2.8480725623582767e-05, |
| "loss": 0.4131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23939643800258636, |
| "step": 315, |
| "valid_targets_mean": 3292.4, |
| "valid_targets_min": 1588 |
| }, |
| { |
| "epoch": 0.5079365079365079, |
| "grad_norm": 0.7658147806021045, |
| "learning_rate": 2.893424036281179e-05, |
| "loss": 0.4181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23602905869483948, |
| "step": 320, |
| "valid_targets_mean": 4239.2, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 0.5158730158730159, |
| "grad_norm": 0.6595384619915944, |
| "learning_rate": 2.938775510204082e-05, |
| "loss": 0.383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23135556280612946, |
| "step": 325, |
| "valid_targets_mean": 4404.8, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 0.5238095238095238, |
| "grad_norm": 0.7133459488389239, |
| "learning_rate": 2.9841269841269844e-05, |
| "loss": 0.3921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19045504927635193, |
| "step": 330, |
| "valid_targets_mean": 3302.9, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 0.5317460317460317, |
| "grad_norm": 0.816501934646045, |
| "learning_rate": 3.0294784580498868e-05, |
| "loss": 0.3857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21776193380355835, |
| "step": 335, |
| "valid_targets_mean": 3168.0, |
| "valid_targets_min": 877 |
| }, |
| { |
| "epoch": 0.5396825396825397, |
| "grad_norm": 0.7547862179719467, |
| "learning_rate": 3.074829931972789e-05, |
| "loss": 0.3946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25766003131866455, |
| "step": 340, |
| "valid_targets_mean": 3334.1, |
| "valid_targets_min": 1054 |
| }, |
| { |
| "epoch": 0.5476190476190477, |
| "grad_norm": 0.7456441513111814, |
| "learning_rate": 3.1201814058956924e-05, |
| "loss": 0.3904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2486940622329712, |
| "step": 345, |
| "valid_targets_mean": 4429.5, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 0.5555555555555556, |
| "grad_norm": 0.7657984461471989, |
| "learning_rate": 3.1655328798185945e-05, |
| "loss": 0.3947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2721412479877472, |
| "step": 350, |
| "valid_targets_mean": 4107.6, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 0.5634920634920635, |
| "grad_norm": 0.7508109310293009, |
| "learning_rate": 3.2108843537414965e-05, |
| "loss": 0.4011, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2144778072834015, |
| "step": 355, |
| "valid_targets_mean": 3111.6, |
| "valid_targets_min": 1302 |
| }, |
| { |
| "epoch": 0.5714285714285714, |
| "grad_norm": 0.7203641872399225, |
| "learning_rate": 3.256235827664399e-05, |
| "loss": 0.4204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1992923766374588, |
| "step": 360, |
| "valid_targets_mean": 3283.1, |
| "valid_targets_min": 955 |
| }, |
| { |
| "epoch": 0.5793650793650794, |
| "grad_norm": 0.8767754163538739, |
| "learning_rate": 3.3015873015873014e-05, |
| "loss": 0.3836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18871556222438812, |
| "step": 365, |
| "valid_targets_mean": 2312.6, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 0.5873015873015873, |
| "grad_norm": 0.7936761727417533, |
| "learning_rate": 3.346938775510204e-05, |
| "loss": 0.4144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2474576234817505, |
| "step": 370, |
| "valid_targets_mean": 3684.5, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 0.5952380952380952, |
| "grad_norm": 0.7531283113396905, |
| "learning_rate": 3.392290249433107e-05, |
| "loss": 0.4006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2062309980392456, |
| "step": 375, |
| "valid_targets_mean": 3048.8, |
| "valid_targets_min": 1440 |
| }, |
| { |
| "epoch": 0.6031746031746031, |
| "grad_norm": 0.75475705688863, |
| "learning_rate": 3.437641723356009e-05, |
| "loss": 0.3928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1992933750152588, |
| "step": 380, |
| "valid_targets_mean": 3318.6, |
| "valid_targets_min": 1709 |
| }, |
| { |
| "epoch": 0.6111111111111112, |
| "grad_norm": 0.6780236377117146, |
| "learning_rate": 3.482993197278912e-05, |
| "loss": 0.3817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2662087678909302, |
| "step": 385, |
| "valid_targets_mean": 4945.2, |
| "valid_targets_min": 2317 |
| }, |
| { |
| "epoch": 0.6190476190476191, |
| "grad_norm": 0.7877440224609804, |
| "learning_rate": 3.5283446712018146e-05, |
| "loss": 0.3818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17678651213645935, |
| "step": 390, |
| "valid_targets_mean": 3275.4, |
| "valid_targets_min": 1605 |
| }, |
| { |
| "epoch": 0.626984126984127, |
| "grad_norm": 0.7191554661780377, |
| "learning_rate": 3.573696145124717e-05, |
| "loss": 0.3738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25680381059646606, |
| "step": 395, |
| "valid_targets_mean": 4801.4, |
| "valid_targets_min": 2557 |
| }, |
| { |
| "epoch": 0.6349206349206349, |
| "grad_norm": 0.7021848250259723, |
| "learning_rate": 3.6190476190476195e-05, |
| "loss": 0.3862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.181675523519516, |
| "step": 400, |
| "valid_targets_mean": 3404.2, |
| "valid_targets_min": 1675 |
| }, |
| { |
| "epoch": 0.6428571428571429, |
| "grad_norm": 0.7099201322215687, |
| "learning_rate": 3.6643990929705216e-05, |
| "loss": 0.3986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1909167766571045, |
| "step": 405, |
| "valid_targets_mean": 3180.8, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 0.6507936507936508, |
| "grad_norm": 0.6475933862451292, |
| "learning_rate": 3.7097505668934243e-05, |
| "loss": 0.3621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15484705567359924, |
| "step": 410, |
| "valid_targets_mean": 3154.2, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 0.6587301587301587, |
| "grad_norm": 0.7601788500031307, |
| "learning_rate": 3.755102040816327e-05, |
| "loss": 0.3862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19706499576568604, |
| "step": 415, |
| "valid_targets_mean": 3226.2, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 0.6666666666666666, |
| "grad_norm": 0.7989603824606386, |
| "learning_rate": 3.800453514739229e-05, |
| "loss": 0.3795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20341980457305908, |
| "step": 420, |
| "valid_targets_mean": 2154.1, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 0.6746031746031746, |
| "grad_norm": 0.8589861103070494, |
| "learning_rate": 3.845804988662132e-05, |
| "loss": 0.4057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2528594732284546, |
| "step": 425, |
| "valid_targets_mean": 3353.6, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 0.6825396825396826, |
| "grad_norm": 0.6923698776091382, |
| "learning_rate": 3.891156462585034e-05, |
| "loss": 0.3722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22147980332374573, |
| "step": 430, |
| "valid_targets_mean": 4294.6, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 0.6904761904761905, |
| "grad_norm": 0.6835864581969211, |
| "learning_rate": 3.936507936507937e-05, |
| "loss": 0.3824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19371160864830017, |
| "step": 435, |
| "valid_targets_mean": 3578.5, |
| "valid_targets_min": 1759 |
| }, |
| { |
| "epoch": 0.6984126984126984, |
| "grad_norm": 0.6628481402738557, |
| "learning_rate": 3.9818594104308396e-05, |
| "loss": 0.3852, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1930302232503891, |
| "step": 440, |
| "valid_targets_mean": 3477.0, |
| "valid_targets_min": 1703 |
| }, |
| { |
| "epoch": 0.7063492063492064, |
| "grad_norm": 0.6502431105225167, |
| "learning_rate": 3.999994361288785e-05, |
| "loss": 0.378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16785907745361328, |
| "step": 445, |
| "valid_targets_mean": 3585.5, |
| "valid_targets_min": 1717 |
| }, |
| { |
| "epoch": 0.7142857142857143, |
| "grad_norm": 0.7344445982650616, |
| "learning_rate": 3.9999599026131644e-05, |
| "loss": 0.4005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26353609561920166, |
| "step": 450, |
| "valid_targets_mean": 3787.4, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 0.7222222222222222, |
| "grad_norm": 0.7393938445809128, |
| "learning_rate": 3.999894118418342e-05, |
| "loss": 0.3823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2211625725030899, |
| "step": 455, |
| "valid_targets_mean": 2948.5, |
| "valid_targets_min": 1663 |
| }, |
| { |
| "epoch": 0.7301587301587301, |
| "grad_norm": 0.6960634624059825, |
| "learning_rate": 3.999797009734697e-05, |
| "loss": 0.3951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21404457092285156, |
| "step": 460, |
| "valid_targets_mean": 3528.6, |
| "valid_targets_min": 1449 |
| }, |
| { |
| "epoch": 0.7380952380952381, |
| "grad_norm": 0.7184877621518291, |
| "learning_rate": 3.999668578083253e-05, |
| "loss": 0.3612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20007619261741638, |
| "step": 465, |
| "valid_targets_mean": 4320.4, |
| "valid_targets_min": 1497 |
| }, |
| { |
| "epoch": 0.746031746031746, |
| "grad_norm": 0.5728045234335117, |
| "learning_rate": 3.9995088254756434e-05, |
| "loss": 0.3815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16080446541309357, |
| "step": 470, |
| "valid_targets_mean": 4607.4, |
| "valid_targets_min": 1481 |
| }, |
| { |
| "epoch": 0.753968253968254, |
| "grad_norm": 0.6475372333254459, |
| "learning_rate": 3.999317754414084e-05, |
| "loss": 0.3492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24191340804100037, |
| "step": 475, |
| "valid_targets_mean": 4953.6, |
| "valid_targets_min": 586 |
| }, |
| { |
| "epoch": 0.7619047619047619, |
| "grad_norm": 0.6843058759524845, |
| "learning_rate": 3.999095367891337e-05, |
| "loss": 0.3727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1674070954322815, |
| "step": 480, |
| "valid_targets_mean": 3345.8, |
| "valid_targets_min": 1521 |
| }, |
| { |
| "epoch": 0.7698412698412699, |
| "grad_norm": 0.7811323772346972, |
| "learning_rate": 3.9988416693906563e-05, |
| "loss": 0.3567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17297232151031494, |
| "step": 485, |
| "valid_targets_mean": 2783.2, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 0.7777777777777778, |
| "grad_norm": 0.6346318209661107, |
| "learning_rate": 3.9985566628857425e-05, |
| "loss": 0.3618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2082044929265976, |
| "step": 490, |
| "valid_targets_mean": 3855.1, |
| "valid_targets_min": 2018 |
| }, |
| { |
| "epoch": 0.7857142857142857, |
| "grad_norm": 0.636191038245321, |
| "learning_rate": 3.998240352840672e-05, |
| "loss": 0.3734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16644376516342163, |
| "step": 495, |
| "valid_targets_mean": 3555.9, |
| "valid_targets_min": 1613 |
| }, |
| { |
| "epoch": 0.7936507936507936, |
| "grad_norm": 0.7677265538591346, |
| "learning_rate": 3.997892744209833e-05, |
| "loss": 0.382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19620782136917114, |
| "step": 500, |
| "valid_targets_mean": 3067.5, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 0.8015873015873016, |
| "grad_norm": 0.6946489087789731, |
| "learning_rate": 3.997513842437845e-05, |
| "loss": 0.3817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1887287199497223, |
| "step": 505, |
| "valid_targets_mean": 3885.8, |
| "valid_targets_min": 1515 |
| }, |
| { |
| "epoch": 0.8095238095238095, |
| "grad_norm": 0.6017170952436831, |
| "learning_rate": 3.997103653459475e-05, |
| "loss": 0.3623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1097162514925003, |
| "step": 510, |
| "valid_targets_mean": 2377.0, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 0.8174603174603174, |
| "grad_norm": 0.8117871434459484, |
| "learning_rate": 3.996662183699541e-05, |
| "loss": 0.3789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2122984677553177, |
| "step": 515, |
| "valid_targets_mean": 2203.6, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 0.8253968253968254, |
| "grad_norm": 1.099868973186974, |
| "learning_rate": 3.996189440072818e-05, |
| "loss": 0.3733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2121431827545166, |
| "step": 520, |
| "valid_targets_mean": 1926.2, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 0.8333333333333334, |
| "grad_norm": 0.7894079145469358, |
| "learning_rate": 3.9956854299839246e-05, |
| "loss": 0.3726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19006070494651794, |
| "step": 525, |
| "valid_targets_mean": 2125.8, |
| "valid_targets_min": 1140 |
| }, |
| { |
| "epoch": 0.8412698412698413, |
| "grad_norm": 0.5713509671754762, |
| "learning_rate": 3.9951501613272076e-05, |
| "loss": 0.3877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13354474306106567, |
| "step": 530, |
| "valid_targets_mean": 3074.2, |
| "valid_targets_min": 1520 |
| }, |
| { |
| "epoch": 0.8492063492063492, |
| "grad_norm": 0.6881625716625266, |
| "learning_rate": 3.994583642486618e-05, |
| "loss": 0.3482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1768343448638916, |
| "step": 535, |
| "valid_targets_mean": 3562.4, |
| "valid_targets_min": 2059 |
| }, |
| { |
| "epoch": 0.8571428571428571, |
| "grad_norm": 0.899503970041781, |
| "learning_rate": 3.993985882335584e-05, |
| "loss": 0.3879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21532076597213745, |
| "step": 540, |
| "valid_targets_mean": 2230.4, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 0.8650793650793651, |
| "grad_norm": 0.7723136033497726, |
| "learning_rate": 3.993356890236866e-05, |
| "loss": 0.3727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16664713621139526, |
| "step": 545, |
| "valid_targets_mean": 3265.4, |
| "valid_targets_min": 1553 |
| }, |
| { |
| "epoch": 0.873015873015873, |
| "grad_norm": 0.6301346388180525, |
| "learning_rate": 3.992696676042414e-05, |
| "loss": 0.3704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10019686818122864, |
| "step": 550, |
| "valid_targets_mean": 2215.4, |
| "valid_targets_min": 1273 |
| }, |
| { |
| "epoch": 0.8809523809523809, |
| "grad_norm": 0.6543508925534741, |
| "learning_rate": 3.992005250093211e-05, |
| "loss": 0.3598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17179307341575623, |
| "step": 555, |
| "valid_targets_mean": 3047.4, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 0.8888888888888888, |
| "grad_norm": 0.8123556394552758, |
| "learning_rate": 3.991282623219113e-05, |
| "loss": 0.3666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1461830735206604, |
| "step": 560, |
| "valid_targets_mean": 2082.2, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 0.8968253968253969, |
| "grad_norm": 0.7331475325077027, |
| "learning_rate": 3.9905288067386776e-05, |
| "loss": 0.3681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19923052191734314, |
| "step": 565, |
| "valid_targets_mean": 3274.1, |
| "valid_targets_min": 1872 |
| }, |
| { |
| "epoch": 0.9047619047619048, |
| "grad_norm": 0.7153118596407079, |
| "learning_rate": 3.989743812458987e-05, |
| "loss": 0.3826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14115799963474274, |
| "step": 570, |
| "valid_targets_mean": 2320.8, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 0.9126984126984127, |
| "grad_norm": 0.7016335318916914, |
| "learning_rate": 3.9889276526754664e-05, |
| "loss": 0.3382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16912700235843658, |
| "step": 575, |
| "valid_targets_mean": 2482.8, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 0.9206349206349206, |
| "grad_norm": 0.7194115163831962, |
| "learning_rate": 3.988080340171685e-05, |
| "loss": 0.3746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13386040925979614, |
| "step": 580, |
| "valid_targets_mean": 2249.6, |
| "valid_targets_min": 1316 |
| }, |
| { |
| "epoch": 0.9285714285714286, |
| "grad_norm": 0.6158476314889361, |
| "learning_rate": 3.987201888219161e-05, |
| "loss": 0.3363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1599443256855011, |
| "step": 585, |
| "valid_targets_mean": 3076.1, |
| "valid_targets_min": 1577 |
| }, |
| { |
| "epoch": 0.9365079365079365, |
| "grad_norm": 0.6585146139697904, |
| "learning_rate": 3.986292310577153e-05, |
| "loss": 0.3422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14659200608730316, |
| "step": 590, |
| "valid_targets_mean": 3358.4, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 0.9444444444444444, |
| "grad_norm": 0.6835718384960962, |
| "learning_rate": 3.9853516214924416e-05, |
| "loss": 0.3721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13478732109069824, |
| "step": 595, |
| "valid_targets_mean": 2055.1, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 0.9523809523809523, |
| "grad_norm": 0.6959839449645118, |
| "learning_rate": 3.9843798356991096e-05, |
| "loss": 0.3685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.176021009683609, |
| "step": 600, |
| "valid_targets_mean": 3608.4, |
| "valid_targets_min": 1354 |
| }, |
| { |
| "epoch": 0.9603174603174603, |
| "grad_norm": 0.6388041844606942, |
| "learning_rate": 3.9833769684183104e-05, |
| "loss": 0.354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1868162751197815, |
| "step": 605, |
| "valid_targets_mean": 4381.1, |
| "valid_targets_min": 1644 |
| }, |
| { |
| "epoch": 0.9682539682539683, |
| "grad_norm": 0.589355661451599, |
| "learning_rate": 3.982343035358026e-05, |
| "loss": 0.3485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1337076723575592, |
| "step": 610, |
| "valid_targets_mean": 4026.0, |
| "valid_targets_min": 1246 |
| }, |
| { |
| "epoch": 0.9761904761904762, |
| "grad_norm": 0.7138102765349207, |
| "learning_rate": 3.981278052712827e-05, |
| "loss": 0.3765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21860548853874207, |
| "step": 615, |
| "valid_targets_mean": 3400.8, |
| "valid_targets_min": 1221 |
| }, |
| { |
| "epoch": 0.9841269841269841, |
| "grad_norm": 0.7189437980532786, |
| "learning_rate": 3.9801820371636157e-05, |
| "loss": 0.3613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14498873054981232, |
| "step": 620, |
| "valid_targets_mean": 2650.0, |
| "valid_targets_min": 948 |
| }, |
| { |
| "epoch": 0.9920634920634921, |
| "grad_norm": 0.7615356151418823, |
| "learning_rate": 3.979055005877364e-05, |
| "loss": 0.3481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15953488647937775, |
| "step": 625, |
| "valid_targets_mean": 2240.5, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 1.0, |
| "grad_norm": 0.6621991671174888, |
| "learning_rate": 3.977896976506845e-05, |
| "loss": 0.3623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1603941172361374, |
| "step": 630, |
| "valid_targets_mean": 3363.9, |
| "valid_targets_min": 1638 |
| }, |
| { |
| "epoch": 1.007936507936508, |
| "grad_norm": 0.6550331659262137, |
| "learning_rate": 3.976707967190358e-05, |
| "loss": 0.3327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17896458506584167, |
| "step": 635, |
| "valid_targets_mean": 4749.9, |
| "valid_targets_min": 1178 |
| }, |
| { |
| "epoch": 1.0158730158730158, |
| "grad_norm": 1.4617398692123404, |
| "learning_rate": 3.9754879965514456e-05, |
| "loss": 0.3293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17083466053009033, |
| "step": 640, |
| "valid_targets_mean": 2990.1, |
| "valid_targets_min": 1347 |
| }, |
| { |
| "epoch": 1.0238095238095237, |
| "grad_norm": 0.6853201850501975, |
| "learning_rate": 3.9742370836985956e-05, |
| "loss": 0.3462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18801261484622955, |
| "step": 645, |
| "valid_targets_mean": 3202.0, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 1.0317460317460316, |
| "grad_norm": 0.7335116899022144, |
| "learning_rate": 3.972955248224949e-05, |
| "loss": 0.3272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14001566171646118, |
| "step": 650, |
| "valid_targets_mean": 2526.6, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 1.0396825396825398, |
| "grad_norm": 0.7803286501692405, |
| "learning_rate": 3.971642510207989e-05, |
| "loss": 0.3406, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11908479779958725, |
| "step": 655, |
| "valid_targets_mean": 2010.4, |
| "valid_targets_min": 834 |
| }, |
| { |
| "epoch": 1.0476190476190477, |
| "grad_norm": 0.669641003705267, |
| "learning_rate": 3.9702988902092274e-05, |
| "loss": 0.3404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1486767828464508, |
| "step": 660, |
| "valid_targets_mean": 3876.1, |
| "valid_targets_min": 1169 |
| }, |
| { |
| "epoch": 1.0555555555555556, |
| "grad_norm": 0.7374591920294192, |
| "learning_rate": 3.968924409273884e-05, |
| "loss": 0.3361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1979072391986847, |
| "step": 665, |
| "valid_targets_mean": 3748.1, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 1.0634920634920635, |
| "grad_norm": 0.7083687479977528, |
| "learning_rate": 3.9675190889305545e-05, |
| "loss": 0.3417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19211263954639435, |
| "step": 670, |
| "valid_targets_mean": 4064.2, |
| "valid_targets_min": 1686 |
| }, |
| { |
| "epoch": 1.0714285714285714, |
| "grad_norm": 0.8099558494020401, |
| "learning_rate": 3.966082951190874e-05, |
| "loss": 0.3503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15523111820220947, |
| "step": 675, |
| "valid_targets_mean": 2294.0, |
| "valid_targets_min": 1479 |
| }, |
| { |
| "epoch": 1.0793650793650793, |
| "grad_norm": 0.8193510612362526, |
| "learning_rate": 3.9646160185491756e-05, |
| "loss": 0.339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16692380607128143, |
| "step": 680, |
| "valid_targets_mean": 2352.2, |
| "valid_targets_min": 1492 |
| }, |
| { |
| "epoch": 1.0873015873015872, |
| "grad_norm": 0.6631812506670042, |
| "learning_rate": 3.963118313982131e-05, |
| "loss": 0.3291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16724464297294617, |
| "step": 685, |
| "valid_targets_mean": 3532.9, |
| "valid_targets_min": 1559 |
| }, |
| { |
| "epoch": 1.0952380952380953, |
| "grad_norm": 0.6330184363082058, |
| "learning_rate": 3.961589860948399e-05, |
| "loss": 0.3341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13762444257736206, |
| "step": 690, |
| "valid_targets_mean": 3628.2, |
| "valid_targets_min": 1599 |
| }, |
| { |
| "epoch": 1.1031746031746033, |
| "grad_norm": 0.7395137202968401, |
| "learning_rate": 3.960030683388251e-05, |
| "loss": 0.3298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1789383590221405, |
| "step": 695, |
| "valid_targets_mean": 2894.2, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 1.1111111111111112, |
| "grad_norm": 0.7567445910162289, |
| "learning_rate": 3.9584408057232e-05, |
| "loss": 0.3277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13180208206176758, |
| "step": 700, |
| "valid_targets_mean": 2321.5, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 1.119047619047619, |
| "grad_norm": 0.7029746538069985, |
| "learning_rate": 3.956820252855618e-05, |
| "loss": 0.3371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23373830318450928, |
| "step": 705, |
| "valid_targets_mean": 3848.2, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 1.126984126984127, |
| "grad_norm": 0.8217697460107479, |
| "learning_rate": 3.955169050168343e-05, |
| "loss": 0.3336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11867678910493851, |
| "step": 710, |
| "valid_targets_mean": 1995.0, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 1.1349206349206349, |
| "grad_norm": 0.6237928838837601, |
| "learning_rate": 3.953487223524283e-05, |
| "loss": 0.3413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20738816261291504, |
| "step": 715, |
| "valid_targets_mean": 4893.6, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 1.1428571428571428, |
| "grad_norm": 0.6340353953231894, |
| "learning_rate": 3.951774799266014e-05, |
| "loss": 0.3248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17009267210960388, |
| "step": 720, |
| "valid_targets_mean": 3876.5, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 1.1507936507936507, |
| "grad_norm": 0.7509419852778023, |
| "learning_rate": 3.950031804215364e-05, |
| "loss": 0.3542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22996996343135834, |
| "step": 725, |
| "valid_targets_mean": 4188.8, |
| "valid_targets_min": 1473 |
| }, |
| { |
| "epoch": 1.1587301587301586, |
| "grad_norm": 0.6070513438056959, |
| "learning_rate": 3.948258265672991e-05, |
| "loss": 0.3218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12374967336654663, |
| "step": 730, |
| "valid_targets_mean": 3161.9, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 1.1666666666666667, |
| "grad_norm": 0.8005848521113644, |
| "learning_rate": 3.946454211417961e-05, |
| "loss": 0.34, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19525708258152008, |
| "step": 735, |
| "valid_targets_mean": 2452.2, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 1.1746031746031746, |
| "grad_norm": 0.7223216527088103, |
| "learning_rate": 3.944619669707309e-05, |
| "loss": 0.3259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19071514904499054, |
| "step": 740, |
| "valid_targets_mean": 2636.9, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 1.1825396825396826, |
| "grad_norm": 0.769530384992589, |
| "learning_rate": 3.9427546692755946e-05, |
| "loss": 0.3479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15291930735111237, |
| "step": 745, |
| "valid_targets_mean": 1790.5, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 1.1904761904761905, |
| "grad_norm": 0.8609161127919669, |
| "learning_rate": 3.9408592393344596e-05, |
| "loss": 0.3333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18366797268390656, |
| "step": 750, |
| "valid_targets_mean": 2313.8, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 1.1984126984126984, |
| "grad_norm": 0.7460458484078427, |
| "learning_rate": 3.9389334095721606e-05, |
| "loss": 0.3435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18691663444042206, |
| "step": 755, |
| "valid_targets_mean": 2993.1, |
| "valid_targets_min": 1669 |
| }, |
| { |
| "epoch": 1.2063492063492063, |
| "grad_norm": 0.6569460078100842, |
| "learning_rate": 3.936977210153113e-05, |
| "loss": 0.3446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1891995668411255, |
| "step": 760, |
| "valid_targets_mean": 4634.4, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 1.2142857142857142, |
| "grad_norm": 0.8065057390599204, |
| "learning_rate": 3.93499067171741e-05, |
| "loss": 0.321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16406933963298798, |
| "step": 765, |
| "valid_targets_mean": 2047.8, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 1.2222222222222223, |
| "grad_norm": 0.6735826463574247, |
| "learning_rate": 3.932973825380351e-05, |
| "loss": 0.3341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1321011185646057, |
| "step": 770, |
| "valid_targets_mean": 3697.6, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 1.2301587301587302, |
| "grad_norm": 0.6532987965485518, |
| "learning_rate": 3.9309267027319485e-05, |
| "loss": 0.3284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20019066333770752, |
| "step": 775, |
| "valid_targets_mean": 5117.1, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 1.2380952380952381, |
| "grad_norm": 0.6721008291547677, |
| "learning_rate": 3.928849335836435e-05, |
| "loss": 0.3174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16830293834209442, |
| "step": 780, |
| "valid_targets_mean": 3834.2, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 1.246031746031746, |
| "grad_norm": 0.672719770061112, |
| "learning_rate": 3.926741757231761e-05, |
| "loss": 0.3179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14843882620334625, |
| "step": 785, |
| "valid_targets_mean": 2557.2, |
| "valid_targets_min": 1395 |
| }, |
| { |
| "epoch": 1.253968253968254, |
| "grad_norm": 0.6540553828853359, |
| "learning_rate": 3.924603999929086e-05, |
| "loss": 0.3359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2036338448524475, |
| "step": 790, |
| "valid_targets_mean": 4443.6, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 1.2619047619047619, |
| "grad_norm": 0.6995738559163635, |
| "learning_rate": 3.9224360974122584e-05, |
| "loss": 0.3559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15793496370315552, |
| "step": 795, |
| "valid_targets_mean": 2658.4, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 1.2698412698412698, |
| "grad_norm": 0.6963704328628288, |
| "learning_rate": 3.920238083637297e-05, |
| "loss": 0.322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15149086713790894, |
| "step": 800, |
| "valid_targets_mean": 2722.5, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 1.2777777777777777, |
| "grad_norm": 0.5568936443457445, |
| "learning_rate": 3.9180099930318524e-05, |
| "loss": 0.3243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1571732759475708, |
| "step": 805, |
| "valid_targets_mean": 4953.6, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 1.2857142857142856, |
| "grad_norm": 0.7021372758165298, |
| "learning_rate": 3.915751860494672e-05, |
| "loss": 0.3446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1892794370651245, |
| "step": 810, |
| "valid_targets_mean": 3306.2, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 1.2936507936507937, |
| "grad_norm": 0.7165579981094458, |
| "learning_rate": 3.913463721395051e-05, |
| "loss": 0.3397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1962992250919342, |
| "step": 815, |
| "valid_targets_mean": 3322.0, |
| "valid_targets_min": 1297 |
| }, |
| { |
| "epoch": 1.3015873015873016, |
| "grad_norm": 0.6672225363936888, |
| "learning_rate": 3.911145611572282e-05, |
| "loss": 0.3336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13479071855545044, |
| "step": 820, |
| "valid_targets_mean": 2435.1, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 1.3095238095238095, |
| "grad_norm": 0.6373647212783545, |
| "learning_rate": 3.908797567335089e-05, |
| "loss": 0.3476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14948585629463196, |
| "step": 825, |
| "valid_targets_mean": 2808.1, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 1.3174603174603174, |
| "grad_norm": 1.153607480771756, |
| "learning_rate": 3.906419625461062e-05, |
| "loss": 0.3336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14141523838043213, |
| "step": 830, |
| "valid_targets_mean": 1876.9, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 1.3253968253968254, |
| "grad_norm": 0.6466191823091932, |
| "learning_rate": 3.90401182319608e-05, |
| "loss": 0.3174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16680654883384705, |
| "step": 835, |
| "valid_targets_mean": 3402.9, |
| "valid_targets_min": 1345 |
| }, |
| { |
| "epoch": 1.3333333333333333, |
| "grad_norm": 0.762601991381067, |
| "learning_rate": 3.9015741982537265e-05, |
| "loss": 0.3367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18606701493263245, |
| "step": 840, |
| "valid_targets_mean": 3056.8, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 1.3412698412698414, |
| "grad_norm": 0.5962344088673996, |
| "learning_rate": 3.899106788814701e-05, |
| "loss": 0.3194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1680346578359604, |
| "step": 845, |
| "valid_targets_mean": 3557.2, |
| "valid_targets_min": 1508 |
| }, |
| { |
| "epoch": 1.3492063492063493, |
| "grad_norm": 0.6079281739641783, |
| "learning_rate": 3.896609633526219e-05, |
| "loss": 0.304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18283489346504211, |
| "step": 850, |
| "valid_targets_mean": 4741.0, |
| "valid_targets_min": 2597 |
| }, |
| { |
| "epoch": 1.3571428571428572, |
| "grad_norm": 0.6433520532374093, |
| "learning_rate": 3.894082771501407e-05, |
| "loss": 0.3142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.224579855799675, |
| "step": 855, |
| "valid_targets_mean": 5688.9, |
| "valid_targets_min": 2441 |
| }, |
| { |
| "epoch": 1.3650793650793651, |
| "grad_norm": 0.6236488281351981, |
| "learning_rate": 3.891526242318692e-05, |
| "loss": 0.3213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12770557403564453, |
| "step": 860, |
| "valid_targets_mean": 2938.4, |
| "valid_targets_min": 1391 |
| }, |
| { |
| "epoch": 1.373015873015873, |
| "grad_norm": 0.6758191068090547, |
| "learning_rate": 3.8889400860211785e-05, |
| "loss": 0.3291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1711861491203308, |
| "step": 865, |
| "valid_targets_mean": 4322.4, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 1.380952380952381, |
| "grad_norm": 0.7829861176740196, |
| "learning_rate": 3.886324343116023e-05, |
| "loss": 0.3326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14786922931671143, |
| "step": 870, |
| "valid_targets_mean": 2398.6, |
| "valid_targets_min": 1527 |
| }, |
| { |
| "epoch": 1.3888888888888888, |
| "grad_norm": 0.6137417239069314, |
| "learning_rate": 3.883679054573799e-05, |
| "loss": 0.3142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12261499464511871, |
| "step": 875, |
| "valid_targets_mean": 3248.4, |
| "valid_targets_min": 1341 |
| }, |
| { |
| "epoch": 1.3968253968253967, |
| "grad_norm": 0.7275067900304849, |
| "learning_rate": 3.881004261827856e-05, |
| "loss": 0.3274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13986937701702118, |
| "step": 880, |
| "valid_targets_mean": 2470.4, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 1.4047619047619047, |
| "grad_norm": 0.573567853532649, |
| "learning_rate": 3.878300006773669e-05, |
| "loss": 0.3188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11593329906463623, |
| "step": 885, |
| "valid_targets_mean": 3373.0, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 1.4126984126984126, |
| "grad_norm": 0.6421889204633251, |
| "learning_rate": 3.875566331768184e-05, |
| "loss": 0.327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16899876296520233, |
| "step": 890, |
| "valid_targets_mean": 3735.2, |
| "valid_targets_min": 1422 |
| }, |
| { |
| "epoch": 1.4206349206349207, |
| "grad_norm": 0.636113488826798, |
| "learning_rate": 3.872803279629155e-05, |
| "loss": 0.3247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18453936278820038, |
| "step": 895, |
| "valid_targets_mean": 4604.8, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 1.4285714285714286, |
| "grad_norm": 0.8348881833927589, |
| "learning_rate": 3.8700108936344705e-05, |
| "loss": 0.3218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15507002174854279, |
| "step": 900, |
| "valid_targets_mean": 4224.5, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 1.4365079365079365, |
| "grad_norm": 0.6263889168583548, |
| "learning_rate": 3.867189217521477e-05, |
| "loss": 0.329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17729918658733368, |
| "step": 905, |
| "valid_targets_mean": 4577.2, |
| "valid_targets_min": 1831 |
| }, |
| { |
| "epoch": 1.4444444444444444, |
| "grad_norm": 0.6333671939834843, |
| "learning_rate": 3.864338295486297e-05, |
| "loss": 0.3216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.230592280626297, |
| "step": 910, |
| "valid_targets_mean": 4192.1, |
| "valid_targets_min": 1671 |
| }, |
| { |
| "epoch": 1.4523809523809523, |
| "grad_norm": 0.7922900343139502, |
| "learning_rate": 3.8614581721831316e-05, |
| "loss": 0.3297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1534234583377838, |
| "step": 915, |
| "valid_targets_mean": 2057.8, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 1.4603174603174602, |
| "grad_norm": 0.6383017464464749, |
| "learning_rate": 3.858548892723563e-05, |
| "loss": 0.3535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13009271025657654, |
| "step": 920, |
| "valid_targets_mean": 3326.5, |
| "valid_targets_min": 1077 |
| }, |
| { |
| "epoch": 1.4682539682539684, |
| "grad_norm": 0.651551125180835, |
| "learning_rate": 3.855610502675851e-05, |
| "loss": 0.3351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22951310873031616, |
| "step": 925, |
| "valid_targets_mean": 4700.6, |
| "valid_targets_min": 1678 |
| }, |
| { |
| "epoch": 1.4761904761904763, |
| "grad_norm": 0.6753131034311983, |
| "learning_rate": 3.852643048064215e-05, |
| "loss": 0.3219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15419398248195648, |
| "step": 930, |
| "valid_targets_mean": 3162.8, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 1.4841269841269842, |
| "grad_norm": 0.6537814645059444, |
| "learning_rate": 3.8496465753681145e-05, |
| "loss": 0.2999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15850700438022614, |
| "step": 935, |
| "valid_targets_mean": 3159.0, |
| "valid_targets_min": 1387 |
| }, |
| { |
| "epoch": 1.492063492063492, |
| "grad_norm": 0.6873845352603423, |
| "learning_rate": 3.846621131521522e-05, |
| "loss": 0.3314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22871655225753784, |
| "step": 940, |
| "valid_targets_mean": 3588.6, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 1.5, |
| "grad_norm": 0.5815861421834687, |
| "learning_rate": 3.843566763912187e-05, |
| "loss": 0.3205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1536579430103302, |
| "step": 945, |
| "valid_targets_mean": 4438.8, |
| "valid_targets_min": 1272 |
| }, |
| { |
| "epoch": 1.507936507936508, |
| "grad_norm": 0.6185343070978655, |
| "learning_rate": 3.840483520380896e-05, |
| "loss": 0.3296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11785129457712173, |
| "step": 950, |
| "valid_targets_mean": 3136.1, |
| "valid_targets_min": 1054 |
| }, |
| { |
| "epoch": 1.5158730158730158, |
| "grad_norm": 0.7109509570702359, |
| "learning_rate": 3.837371449220717e-05, |
| "loss": 0.3296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18690654635429382, |
| "step": 955, |
| "valid_targets_mean": 3742.0, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 1.5238095238095237, |
| "grad_norm": 0.7752023546341235, |
| "learning_rate": 3.834230599176251e-05, |
| "loss": 0.3319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1134377121925354, |
| "step": 960, |
| "valid_targets_mean": 1666.9, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 1.5317460317460316, |
| "grad_norm": 0.642223551798259, |
| "learning_rate": 3.831061019442864e-05, |
| "loss": 0.3356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1406305432319641, |
| "step": 965, |
| "valid_targets_mean": 3459.5, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 1.5396825396825395, |
| "grad_norm": 0.7389463906485425, |
| "learning_rate": 3.827862759665916e-05, |
| "loss": 0.3307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17435957491397858, |
| "step": 970, |
| "valid_targets_mean": 2838.5, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 1.5476190476190477, |
| "grad_norm": 0.9324752016602136, |
| "learning_rate": 3.8246358699399853e-05, |
| "loss": 0.327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16448692977428436, |
| "step": 975, |
| "valid_targets_mean": 2016.4, |
| "valid_targets_min": 1003 |
| }, |
| { |
| "epoch": 1.5555555555555556, |
| "grad_norm": 0.7164291842449987, |
| "learning_rate": 3.8213804008080824e-05, |
| "loss": 0.3441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21906238794326782, |
| "step": 980, |
| "valid_targets_mean": 4072.2, |
| "valid_targets_min": 1473 |
| }, |
| { |
| "epoch": 1.5634920634920635, |
| "grad_norm": 0.6920532471489735, |
| "learning_rate": 3.818096403260862e-05, |
| "loss": 0.339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18423213064670563, |
| "step": 985, |
| "valid_targets_mean": 3113.2, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 1.5714285714285714, |
| "grad_norm": 0.5959713542415751, |
| "learning_rate": 3.8147839287358185e-05, |
| "loss": 0.3235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15230652689933777, |
| "step": 990, |
| "valid_targets_mean": 3757.6, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 1.5793650793650795, |
| "grad_norm": 0.823279374199861, |
| "learning_rate": 3.8114430291164836e-05, |
| "loss": 0.3091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13656845688819885, |
| "step": 995, |
| "valid_targets_mean": 1662.8, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 1.5873015873015874, |
| "grad_norm": 0.6873357420736661, |
| "learning_rate": 3.808073756731615e-05, |
| "loss": 0.318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15334893763065338, |
| "step": 1000, |
| "valid_targets_mean": 3311.2, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 1.5952380952380953, |
| "grad_norm": 0.6484825809948287, |
| "learning_rate": 3.8046761643543734e-05, |
| "loss": 0.3121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1463339626789093, |
| "step": 1005, |
| "valid_targets_mean": 4150.1, |
| "valid_targets_min": 1798 |
| }, |
| { |
| "epoch": 1.6031746031746033, |
| "grad_norm": 0.6817054528039794, |
| "learning_rate": 3.8012503052014996e-05, |
| "loss": 0.3656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17801718413829803, |
| "step": 1010, |
| "valid_targets_mean": 3748.4, |
| "valid_targets_min": 1955 |
| }, |
| { |
| "epoch": 1.6111111111111112, |
| "grad_norm": 0.7872906055674049, |
| "learning_rate": 3.797796232932476e-05, |
| "loss": 0.3287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1268722265958786, |
| "step": 1015, |
| "valid_targets_mean": 2023.8, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 1.619047619047619, |
| "grad_norm": 0.651529600042665, |
| "learning_rate": 3.794314001648692e-05, |
| "loss": 0.3167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14170636236667633, |
| "step": 1020, |
| "valid_targets_mean": 2843.0, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 1.626984126984127, |
| "grad_norm": 0.6171435300769704, |
| "learning_rate": 3.7908036658925926e-05, |
| "loss": 0.3223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16796676814556122, |
| "step": 1025, |
| "valid_targets_mean": 2937.6, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 1.6349206349206349, |
| "grad_norm": 0.7476071653963485, |
| "learning_rate": 3.787265280646825e-05, |
| "loss": 0.3161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16783180832862854, |
| "step": 1030, |
| "valid_targets_mean": 2927.6, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 1.6428571428571428, |
| "grad_norm": 0.6644484494281356, |
| "learning_rate": 3.7836989013333776e-05, |
| "loss": 0.3194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13871848583221436, |
| "step": 1035, |
| "valid_targets_mean": 3492.8, |
| "valid_targets_min": 1748 |
| }, |
| { |
| "epoch": 1.6507936507936507, |
| "grad_norm": 0.5725806618836755, |
| "learning_rate": 3.780104583812712e-05, |
| "loss": 0.3175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16656331717967987, |
| "step": 1040, |
| "valid_targets_mean": 4105.2, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 1.6587301587301586, |
| "grad_norm": 0.7354883976199714, |
| "learning_rate": 3.7764823843828883e-05, |
| "loss": 0.3321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18832966685295105, |
| "step": 1045, |
| "valid_targets_mean": 3323.4, |
| "valid_targets_min": 1571 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.6548011282202095, |
| "learning_rate": 3.7728323597786834e-05, |
| "loss": 0.3087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11662226915359497, |
| "step": 1050, |
| "valid_targets_mean": 2727.0, |
| "valid_targets_min": 1221 |
| }, |
| { |
| "epoch": 1.6746031746031746, |
| "grad_norm": 0.7662281834478178, |
| "learning_rate": 3.7691545671707007e-05, |
| "loss": 0.3448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16389185190200806, |
| "step": 1055, |
| "valid_targets_mean": 2433.9, |
| "valid_targets_min": 1068 |
| }, |
| { |
| "epoch": 1.6825396825396826, |
| "grad_norm": 0.6191057387381401, |
| "learning_rate": 3.765449064164477e-05, |
| "loss": 0.339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09424316883087158, |
| "step": 1060, |
| "valid_targets_mean": 2522.8, |
| "valid_targets_min": 1517 |
| }, |
| { |
| "epoch": 1.6904761904761905, |
| "grad_norm": 0.7089163950388633, |
| "learning_rate": 3.7617159087995784e-05, |
| "loss": 0.3028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16477319598197937, |
| "step": 1065, |
| "valid_targets_mean": 4247.1, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 1.6984126984126984, |
| "grad_norm": 0.7336010684393983, |
| "learning_rate": 3.757955159548693e-05, |
| "loss": 0.3324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1567060947418213, |
| "step": 1070, |
| "valid_targets_mean": 2002.9, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 1.7063492063492065, |
| "grad_norm": 0.5551974094945166, |
| "learning_rate": 3.754166875316713e-05, |
| "loss": 0.3024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18975624442100525, |
| "step": 1075, |
| "valid_targets_mean": 5140.1, |
| "valid_targets_min": 1990 |
| }, |
| { |
| "epoch": 1.7142857142857144, |
| "grad_norm": 0.7790486862381991, |
| "learning_rate": 3.750351115439812e-05, |
| "loss": 0.3302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16643652319908142, |
| "step": 1080, |
| "valid_targets_mean": 3622.6, |
| "valid_targets_min": 1729 |
| }, |
| { |
| "epoch": 1.7222222222222223, |
| "grad_norm": 0.6895583697751339, |
| "learning_rate": 3.746507939684519e-05, |
| "loss": 0.3126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1543181836605072, |
| "step": 1085, |
| "valid_targets_mean": 2840.0, |
| "valid_targets_min": 1084 |
| }, |
| { |
| "epoch": 1.7301587301587302, |
| "grad_norm": 0.6649886180118483, |
| "learning_rate": 3.742637408246779e-05, |
| "loss": 0.3039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20172613859176636, |
| "step": 1090, |
| "valid_targets_mean": 4078.4, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 1.7380952380952381, |
| "grad_norm": 0.6986475804737025, |
| "learning_rate": 3.73873958175101e-05, |
| "loss": 0.3242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1479484736919403, |
| "step": 1095, |
| "valid_targets_mean": 3294.2, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 1.746031746031746, |
| "grad_norm": 0.7108510865696669, |
| "learning_rate": 3.734814521249156e-05, |
| "loss": 0.3307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1519460678100586, |
| "step": 1100, |
| "valid_targets_mean": 3030.0, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 1.753968253968254, |
| "grad_norm": 0.780130184905361, |
| "learning_rate": 3.7308622882197294e-05, |
| "loss": 0.3102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11438941955566406, |
| "step": 1105, |
| "valid_targets_mean": 2342.4, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 1.7619047619047619, |
| "grad_norm": 0.6919296705990884, |
| "learning_rate": 3.7268829445668456e-05, |
| "loss": 0.3304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1509092152118683, |
| "step": 1110, |
| "valid_targets_mean": 2715.0, |
| "valid_targets_min": 1656 |
| }, |
| { |
| "epoch": 1.7698412698412698, |
| "grad_norm": 0.7095337197458086, |
| "learning_rate": 3.722876552619257e-05, |
| "loss": 0.3329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1642485111951828, |
| "step": 1115, |
| "valid_targets_mean": 3003.0, |
| "valid_targets_min": 1832 |
| }, |
| { |
| "epoch": 1.7777777777777777, |
| "grad_norm": 0.6623605599103729, |
| "learning_rate": 3.718843175129378e-05, |
| "loss": 0.3133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1656493842601776, |
| "step": 1120, |
| "valid_targets_mean": 3344.5, |
| "valid_targets_min": 1639 |
| }, |
| { |
| "epoch": 1.7857142857142856, |
| "grad_norm": 0.6509353975185467, |
| "learning_rate": 3.7147828752722944e-05, |
| "loss": 0.3037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16948366165161133, |
| "step": 1125, |
| "valid_targets_mean": 3909.0, |
| "valid_targets_min": 2076 |
| }, |
| { |
| "epoch": 1.7936507936507935, |
| "grad_norm": 0.7055857265594317, |
| "learning_rate": 3.7106957166447834e-05, |
| "loss": 0.3001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.182726189494133, |
| "step": 1130, |
| "valid_targets_mean": 3147.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 1.8015873015873016, |
| "grad_norm": 0.5821370256541043, |
| "learning_rate": 3.7065817632643115e-05, |
| "loss": 0.3083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20441317558288574, |
| "step": 1135, |
| "valid_targets_mean": 6269.5, |
| "valid_targets_min": 2700 |
| }, |
| { |
| "epoch": 1.8095238095238095, |
| "grad_norm": 0.6271222096362784, |
| "learning_rate": 3.7024410795680326e-05, |
| "loss": 0.3065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14290623366832733, |
| "step": 1140, |
| "valid_targets_mean": 3049.8, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 1.8174603174603174, |
| "grad_norm": 0.5742957360318593, |
| "learning_rate": 3.698273730411782e-05, |
| "loss": 0.3181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1737782061100006, |
| "step": 1145, |
| "valid_targets_mean": 4881.1, |
| "valid_targets_min": 1050 |
| }, |
| { |
| "epoch": 1.8253968253968254, |
| "grad_norm": 0.7237896853510777, |
| "learning_rate": 3.694079781069053e-05, |
| "loss": 0.3124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1605367660522461, |
| "step": 1150, |
| "valid_targets_mean": 2798.1, |
| "valid_targets_min": 1461 |
| }, |
| { |
| "epoch": 1.8333333333333335, |
| "grad_norm": 0.7796561546026146, |
| "learning_rate": 3.6898592972299875e-05, |
| "loss": 0.3177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14959201216697693, |
| "step": 1155, |
| "valid_targets_mean": 2855.1, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 1.8412698412698414, |
| "grad_norm": 0.7814814222422569, |
| "learning_rate": 3.6856123450003306e-05, |
| "loss": 0.3331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18412166833877563, |
| "step": 1160, |
| "valid_targets_mean": 3015.8, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 1.8492063492063493, |
| "grad_norm": 0.6571893565564805, |
| "learning_rate": 3.68133899090041e-05, |
| "loss": 0.3197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12655168771743774, |
| "step": 1165, |
| "valid_targets_mean": 2925.4, |
| "valid_targets_min": 1490 |
| }, |
| { |
| "epoch": 1.8571428571428572, |
| "grad_norm": 0.5625971515672297, |
| "learning_rate": 3.677039301864085e-05, |
| "loss": 0.3281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15519466996192932, |
| "step": 1170, |
| "valid_targets_mean": 3959.8, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 1.8650793650793651, |
| "grad_norm": 0.7022395536958516, |
| "learning_rate": 3.672713345237701e-05, |
| "loss": 0.3228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12823298573493958, |
| "step": 1175, |
| "valid_targets_mean": 2513.6, |
| "valid_targets_min": 1325 |
| }, |
| { |
| "epoch": 1.873015873015873, |
| "grad_norm": 0.7382776756172028, |
| "learning_rate": 3.6683611887790356e-05, |
| "loss": 0.3195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2348577082157135, |
| "step": 1180, |
| "valid_targets_mean": 3610.5, |
| "valid_targets_min": 1258 |
| }, |
| { |
| "epoch": 1.880952380952381, |
| "grad_norm": 0.6379811831724779, |
| "learning_rate": 3.663982900656236e-05, |
| "loss": 0.3279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1788225919008255, |
| "step": 1185, |
| "valid_targets_mean": 3843.0, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 1.8888888888888888, |
| "grad_norm": 0.6677114190374929, |
| "learning_rate": 3.6595785494467516e-05, |
| "loss": 0.3084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1895446628332138, |
| "step": 1190, |
| "valid_targets_mean": 4057.9, |
| "valid_targets_min": 493 |
| }, |
| { |
| "epoch": 1.8968253968253967, |
| "grad_norm": 0.554324996485495, |
| "learning_rate": 3.655148204136259e-05, |
| "loss": 0.2951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1370246708393097, |
| "step": 1195, |
| "valid_targets_mean": 4461.0, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 1.9047619047619047, |
| "grad_norm": 0.5714890741512307, |
| "learning_rate": 3.650691934117584e-05, |
| "loss": 0.3243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1589963287115097, |
| "step": 1200, |
| "valid_targets_mean": 4565.9, |
| "valid_targets_min": 1407 |
| }, |
| { |
| "epoch": 1.9126984126984126, |
| "grad_norm": 0.7448282050971057, |
| "learning_rate": 3.646209809189611e-05, |
| "loss": 0.3131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20559057593345642, |
| "step": 1205, |
| "valid_targets_mean": 3693.9, |
| "valid_targets_min": 1229 |
| }, |
| { |
| "epoch": 1.9206349206349205, |
| "grad_norm": 0.6320209854193637, |
| "learning_rate": 3.641701899556192e-05, |
| "loss": 0.3229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24096056818962097, |
| "step": 1210, |
| "valid_targets_mean": 5899.9, |
| "valid_targets_min": 1722 |
| }, |
| { |
| "epoch": 1.9285714285714286, |
| "grad_norm": 0.5359385368169469, |
| "learning_rate": 3.63716827582505e-05, |
| "loss": 0.295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11727620661258698, |
| "step": 1215, |
| "valid_targets_mean": 2772.8, |
| "valid_targets_min": 1515 |
| }, |
| { |
| "epoch": 1.9365079365079365, |
| "grad_norm": 0.643091990151274, |
| "learning_rate": 3.632609009006665e-05, |
| "loss": 0.301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13127782940864563, |
| "step": 1220, |
| "valid_targets_mean": 3445.0, |
| "valid_targets_min": 1638 |
| }, |
| { |
| "epoch": 1.9444444444444444, |
| "grad_norm": 0.7242904191833993, |
| "learning_rate": 3.62802417051317e-05, |
| "loss": 0.3301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19884291291236877, |
| "step": 1225, |
| "valid_targets_mean": 3024.6, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 1.9523809523809523, |
| "grad_norm": 0.7142658889462979, |
| "learning_rate": 3.6234138321572274e-05, |
| "loss": 0.3239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16410435736179352, |
| "step": 1230, |
| "valid_targets_mean": 2792.0, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 1.9603174603174605, |
| "grad_norm": 0.7622407534270608, |
| "learning_rate": 3.6187780661509074e-05, |
| "loss": 0.3223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13600055873394012, |
| "step": 1235, |
| "valid_targets_mean": 2606.2, |
| "valid_targets_min": 1292 |
| }, |
| { |
| "epoch": 1.9682539682539684, |
| "grad_norm": 2.0519892124143264, |
| "learning_rate": 3.6141169451045526e-05, |
| "loss": 0.3312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22042493522167206, |
| "step": 1240, |
| "valid_targets_mean": 3888.2, |
| "valid_targets_min": 1648 |
| }, |
| { |
| "epoch": 1.9761904761904763, |
| "grad_norm": 0.661985430252956, |
| "learning_rate": 3.609430542025646e-05, |
| "loss": 0.339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17805568873882294, |
| "step": 1245, |
| "valid_targets_mean": 3606.0, |
| "valid_targets_min": 463 |
| }, |
| { |
| "epoch": 1.9841269841269842, |
| "grad_norm": 0.6677192065899155, |
| "learning_rate": 3.604718930317664e-05, |
| "loss": 0.3106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11548539996147156, |
| "step": 1250, |
| "valid_targets_mean": 2009.4, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 1.992063492063492, |
| "grad_norm": 0.6535363195362384, |
| "learning_rate": 3.5999821837789275e-05, |
| "loss": 0.3162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13011835515499115, |
| "step": 1255, |
| "valid_targets_mean": 3151.8, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 2.0, |
| "grad_norm": 0.6667531440533361, |
| "learning_rate": 3.595220376601447e-05, |
| "loss": 0.3012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19327494502067566, |
| "step": 1260, |
| "valid_targets_mean": 3476.6, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 2.007936507936508, |
| "grad_norm": 0.6583520262553467, |
| "learning_rate": 3.590433583369758e-05, |
| "loss": 0.271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11713065207004547, |
| "step": 1265, |
| "valid_targets_mean": 3390.6, |
| "valid_targets_min": 319 |
| }, |
| { |
| "epoch": 2.015873015873016, |
| "grad_norm": 0.6184665053818716, |
| "learning_rate": 3.5856218790597554e-05, |
| "loss": 0.3059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1123209297657013, |
| "step": 1270, |
| "valid_targets_mean": 3809.2, |
| "valid_targets_min": 1431 |
| }, |
| { |
| "epoch": 2.0238095238095237, |
| "grad_norm": 0.7493002816181802, |
| "learning_rate": 3.580785339037519e-05, |
| "loss": 0.2729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16529607772827148, |
| "step": 1275, |
| "valid_targets_mean": 3118.0, |
| "valid_targets_min": 1336 |
| }, |
| { |
| "epoch": 2.0317460317460316, |
| "grad_norm": 0.7741262247536087, |
| "learning_rate": 3.57592403905813e-05, |
| "loss": 0.2949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12097487598657608, |
| "step": 1280, |
| "valid_targets_mean": 2530.2, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 2.0396825396825395, |
| "grad_norm": 0.6230151198360837, |
| "learning_rate": 3.571038055264489e-05, |
| "loss": 0.2749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14992347359657288, |
| "step": 1285, |
| "valid_targets_mean": 5069.0, |
| "valid_targets_min": 2124 |
| }, |
| { |
| "epoch": 2.0476190476190474, |
| "grad_norm": 0.810562148405268, |
| "learning_rate": 3.566127464186119e-05, |
| "loss": 0.2824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21131475269794464, |
| "step": 1290, |
| "valid_targets_mean": 3328.2, |
| "valid_targets_min": 538 |
| }, |
| { |
| "epoch": 2.0555555555555554, |
| "grad_norm": 0.5476942649122561, |
| "learning_rate": 3.56119234273797e-05, |
| "loss": 0.2904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13968425989151, |
| "step": 1295, |
| "valid_targets_mean": 5129.4, |
| "valid_targets_min": 1461 |
| }, |
| { |
| "epoch": 2.0634920634920633, |
| "grad_norm": 0.5657998227607735, |
| "learning_rate": 3.5562327682192134e-05, |
| "loss": 0.2853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20042595267295837, |
| "step": 1300, |
| "valid_targets_mean": 5548.2, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 2.0714285714285716, |
| "grad_norm": 0.6072758802013452, |
| "learning_rate": 3.5512488183120286e-05, |
| "loss": 0.2769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1297391653060913, |
| "step": 1305, |
| "valid_targets_mean": 3396.8, |
| "valid_targets_min": 1489 |
| }, |
| { |
| "epoch": 2.0793650793650795, |
| "grad_norm": 0.6816298909752555, |
| "learning_rate": 3.54624057108039e-05, |
| "loss": 0.2941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14064955711364746, |
| "step": 1310, |
| "valid_targets_mean": 3406.9, |
| "valid_targets_min": 961 |
| }, |
| { |
| "epoch": 2.0873015873015874, |
| "grad_norm": 0.6703325281786866, |
| "learning_rate": 3.5412081049688444e-05, |
| "loss": 0.2794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1433454304933548, |
| "step": 1315, |
| "valid_targets_mean": 3164.2, |
| "valid_targets_min": 1504 |
| }, |
| { |
| "epoch": 2.0952380952380953, |
| "grad_norm": 0.6835358753375542, |
| "learning_rate": 3.5361514988012774e-05, |
| "loss": 0.2715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09970133751630783, |
| "step": 1320, |
| "valid_targets_mean": 2335.0, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 2.1031746031746033, |
| "grad_norm": 0.6326834094504827, |
| "learning_rate": 3.5310708317796844e-05, |
| "loss": 0.2664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1121712401509285, |
| "step": 1325, |
| "valid_targets_mean": 2643.4, |
| "valid_targets_min": 1202 |
| }, |
| { |
| "epoch": 2.111111111111111, |
| "grad_norm": 3.950868272026065, |
| "learning_rate": 3.5259661834829266e-05, |
| "loss": 0.2953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14811912178993225, |
| "step": 1330, |
| "valid_targets_mean": 3642.4, |
| "valid_targets_min": 1865 |
| }, |
| { |
| "epoch": 2.119047619047619, |
| "grad_norm": 0.6816657238059641, |
| "learning_rate": 3.5208376338654866e-05, |
| "loss": 0.2839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1544703096151352, |
| "step": 1335, |
| "valid_targets_mean": 3581.6, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 2.126984126984127, |
| "grad_norm": 0.6047101996393489, |
| "learning_rate": 3.515685263256214e-05, |
| "loss": 0.2924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12545567750930786, |
| "step": 1340, |
| "valid_targets_mean": 3086.5, |
| "valid_targets_min": 1125 |
| }, |
| { |
| "epoch": 2.134920634920635, |
| "grad_norm": 0.7668214060032036, |
| "learning_rate": 3.51050915235707e-05, |
| "loss": 0.2899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15387457609176636, |
| "step": 1345, |
| "valid_targets_mean": 2922.4, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 2.142857142857143, |
| "grad_norm": 0.6341428031092777, |
| "learning_rate": 3.5053093822418596e-05, |
| "loss": 0.2836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18130765855312347, |
| "step": 1350, |
| "valid_targets_mean": 4195.0, |
| "valid_targets_min": 955 |
| }, |
| { |
| "epoch": 2.1507936507936507, |
| "grad_norm": 0.6248047434099063, |
| "learning_rate": 3.500086034354966e-05, |
| "loss": 0.275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1647244542837143, |
| "step": 1355, |
| "valid_targets_mean": 4345.2, |
| "valid_targets_min": 1896 |
| }, |
| { |
| "epoch": 2.1587301587301586, |
| "grad_norm": 0.6747528154705348, |
| "learning_rate": 3.494839190510071e-05, |
| "loss": 0.2805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12260128557682037, |
| "step": 1360, |
| "valid_targets_mean": 2796.8, |
| "valid_targets_min": 1616 |
| }, |
| { |
| "epoch": 2.1666666666666665, |
| "grad_norm": 0.7118102595286983, |
| "learning_rate": 3.489568932888877e-05, |
| "loss": 0.2783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16787979006767273, |
| "step": 1365, |
| "valid_targets_mean": 2947.5, |
| "valid_targets_min": 1622 |
| }, |
| { |
| "epoch": 2.1746031746031744, |
| "grad_norm": 0.6385054350831572, |
| "learning_rate": 3.484275344039815e-05, |
| "loss": 0.2816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14596769213676453, |
| "step": 1370, |
| "valid_targets_mean": 3821.0, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 2.1825396825396823, |
| "grad_norm": 0.7154596844294332, |
| "learning_rate": 3.478958506876759e-05, |
| "loss": 0.2905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1572347730398178, |
| "step": 1375, |
| "valid_targets_mean": 3031.8, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 2.1904761904761907, |
| "grad_norm": 0.6664826932154091, |
| "learning_rate": 3.47361850467772e-05, |
| "loss": 0.2788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14033150672912598, |
| "step": 1380, |
| "valid_targets_mean": 3299.4, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 2.1984126984126986, |
| "grad_norm": 0.6285119796929689, |
| "learning_rate": 3.468255421083546e-05, |
| "loss": 0.2888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15819507837295532, |
| "step": 1385, |
| "valid_targets_mean": 3849.9, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 2.2063492063492065, |
| "grad_norm": 0.7275694931249483, |
| "learning_rate": 3.46286934009661e-05, |
| "loss": 0.293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13317999243736267, |
| "step": 1390, |
| "valid_targets_mean": 2756.9, |
| "valid_targets_min": 1007 |
| }, |
| { |
| "epoch": 2.2142857142857144, |
| "grad_norm": 0.6358951472501403, |
| "learning_rate": 3.457460346079495e-05, |
| "loss": 0.2843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13068701326847076, |
| "step": 1395, |
| "valid_targets_mean": 3634.2, |
| "valid_targets_min": 1807 |
| }, |
| { |
| "epoch": 2.2222222222222223, |
| "grad_norm": 2.0139879928616233, |
| "learning_rate": 3.452028523753673e-05, |
| "loss": 0.2887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1745387613773346, |
| "step": 1400, |
| "valid_targets_mean": 3817.2, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 2.2301587301587302, |
| "grad_norm": 0.6465986757489767, |
| "learning_rate": 3.446573958198176e-05, |
| "loss": 0.2781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14092761278152466, |
| "step": 1405, |
| "valid_targets_mean": 3375.8, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 2.238095238095238, |
| "grad_norm": 0.7747629398813702, |
| "learning_rate": 3.4410967348482666e-05, |
| "loss": 0.2753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10323482751846313, |
| "step": 1410, |
| "valid_targets_mean": 1944.0, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 2.246031746031746, |
| "grad_norm": 0.597350797307689, |
| "learning_rate": 3.435596939494098e-05, |
| "loss": 0.2805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10818013548851013, |
| "step": 1415, |
| "valid_targets_mean": 3180.1, |
| "valid_targets_min": 1579 |
| }, |
| { |
| "epoch": 2.253968253968254, |
| "grad_norm": 0.6699385734099821, |
| "learning_rate": 3.430074658279369e-05, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1064271479845047, |
| "step": 1420, |
| "valid_targets_mean": 2770.2, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 2.261904761904762, |
| "grad_norm": 0.75576808503992, |
| "learning_rate": 3.424529977699977e-05, |
| "loss": 0.2752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14628705382347107, |
| "step": 1425, |
| "valid_targets_mean": 2557.9, |
| "valid_targets_min": 1104 |
| }, |
| { |
| "epoch": 2.2698412698412698, |
| "grad_norm": 0.6025560694996105, |
| "learning_rate": 3.418962984602661e-05, |
| "loss": 0.2921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11078731715679169, |
| "step": 1430, |
| "valid_targets_mean": 2991.8, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 2.2777777777777777, |
| "grad_norm": 0.7739932318724013, |
| "learning_rate": 3.413373766183646e-05, |
| "loss": 0.2928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12117686867713928, |
| "step": 1435, |
| "valid_targets_mean": 1849.1, |
| "valid_targets_min": 586 |
| }, |
| { |
| "epoch": 2.2857142857142856, |
| "grad_norm": 0.6235979138790416, |
| "learning_rate": 3.40776240998727e-05, |
| "loss": 0.2802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1533014178276062, |
| "step": 1440, |
| "valid_targets_mean": 4757.4, |
| "valid_targets_min": 1467 |
| }, |
| { |
| "epoch": 2.2936507936507935, |
| "grad_norm": 0.745768264262844, |
| "learning_rate": 3.4021290039046184e-05, |
| "loss": 0.2874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1377353072166443, |
| "step": 1445, |
| "valid_targets_mean": 2300.9, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 2.3015873015873014, |
| "grad_norm": 0.6254453190255295, |
| "learning_rate": 3.396473636172146e-05, |
| "loss": 0.2906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12696042656898499, |
| "step": 1450, |
| "valid_targets_mean": 3798.0, |
| "valid_targets_min": 1759 |
| }, |
| { |
| "epoch": 2.3095238095238093, |
| "grad_norm": 0.6457999463573912, |
| "learning_rate": 3.390796395370294e-05, |
| "loss": 0.2747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14060063660144806, |
| "step": 1455, |
| "valid_targets_mean": 3829.0, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 2.317460317460317, |
| "grad_norm": 0.746423663933539, |
| "learning_rate": 3.385097370422102e-05, |
| "loss": 0.3019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1291799396276474, |
| "step": 1460, |
| "valid_targets_mean": 2310.8, |
| "valid_targets_min": 1472 |
| }, |
| { |
| "epoch": 2.3253968253968256, |
| "grad_norm": 0.6768216692086332, |
| "learning_rate": 3.3793766505918185e-05, |
| "loss": 0.2998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1252336949110031, |
| "step": 1465, |
| "valid_targets_mean": 2343.1, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 2.3333333333333335, |
| "grad_norm": 0.8554015943268323, |
| "learning_rate": 3.3736343254834994e-05, |
| "loss": 0.2773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14149311184883118, |
| "step": 1470, |
| "valid_targets_mean": 3089.0, |
| "valid_targets_min": 1826 |
| }, |
| { |
| "epoch": 2.3412698412698414, |
| "grad_norm": 0.5699352738058534, |
| "learning_rate": 3.3678704850396045e-05, |
| "loss": 0.2713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1736626923084259, |
| "step": 1475, |
| "valid_targets_mean": 5070.6, |
| "valid_targets_min": 1119 |
| }, |
| { |
| "epoch": 2.3492063492063493, |
| "grad_norm": 0.678427343004129, |
| "learning_rate": 3.362085219539592e-05, |
| "loss": 0.2705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17105717957019806, |
| "step": 1480, |
| "valid_targets_mean": 3659.2, |
| "valid_targets_min": 1391 |
| }, |
| { |
| "epoch": 2.357142857142857, |
| "grad_norm": 0.6478379778271129, |
| "learning_rate": 3.3562786195985025e-05, |
| "loss": 0.289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13324151933193207, |
| "step": 1485, |
| "valid_targets_mean": 3253.6, |
| "valid_targets_min": 356 |
| }, |
| { |
| "epoch": 2.365079365079365, |
| "grad_norm": 0.676700032911331, |
| "learning_rate": 3.350450776165535e-05, |
| "loss": 0.2684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11475967615842819, |
| "step": 1490, |
| "valid_targets_mean": 2737.2, |
| "valid_targets_min": 1414 |
| }, |
| { |
| "epoch": 2.373015873015873, |
| "grad_norm": 0.7360708037445938, |
| "learning_rate": 3.344601780522634e-05, |
| "loss": 0.2815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12047970294952393, |
| "step": 1495, |
| "valid_targets_mean": 2303.1, |
| "valid_targets_min": 986 |
| }, |
| { |
| "epoch": 2.380952380952381, |
| "grad_norm": 0.7144328682757947, |
| "learning_rate": 3.3387317242830466e-05, |
| "loss": 0.2959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11342642456293106, |
| "step": 1500, |
| "valid_targets_mean": 2235.1, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 2.388888888888889, |
| "grad_norm": 0.6778072852737712, |
| "learning_rate": 3.332840699389897e-05, |
| "loss": 0.275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11429885029792786, |
| "step": 1505, |
| "valid_targets_mean": 4177.8, |
| "valid_targets_min": 1508 |
| }, |
| { |
| "epoch": 2.3968253968253967, |
| "grad_norm": 0.6602113352709741, |
| "learning_rate": 3.32692879811474e-05, |
| "loss": 0.2733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09258200228214264, |
| "step": 1510, |
| "valid_targets_mean": 2555.5, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 2.4047619047619047, |
| "grad_norm": 0.7944569505936786, |
| "learning_rate": 3.320996113056123e-05, |
| "loss": 0.2994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14962106943130493, |
| "step": 1515, |
| "valid_targets_mean": 2968.1, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 2.4126984126984126, |
| "grad_norm": 0.7895832341518009, |
| "learning_rate": 3.315042737138128e-05, |
| "loss": 0.2997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.128577321767807, |
| "step": 1520, |
| "valid_targets_mean": 2297.6, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 2.4206349206349205, |
| "grad_norm": 0.6113596264456261, |
| "learning_rate": 3.309068763608919e-05, |
| "loss": 0.2916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14215974509716034, |
| "step": 1525, |
| "valid_targets_mean": 4635.9, |
| "valid_targets_min": 1311 |
| }, |
| { |
| "epoch": 2.4285714285714284, |
| "grad_norm": 0.7606294131509589, |
| "learning_rate": 3.303074286039285e-05, |
| "loss": 0.2913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15265774726867676, |
| "step": 1530, |
| "valid_targets_mean": 3241.4, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 2.4365079365079367, |
| "grad_norm": 0.6597348036859395, |
| "learning_rate": 3.2970593983211694e-05, |
| "loss": 0.291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16022004187107086, |
| "step": 1535, |
| "valid_targets_mean": 4045.4, |
| "valid_targets_min": 1319 |
| }, |
| { |
| "epoch": 2.4444444444444446, |
| "grad_norm": 0.6418418930113634, |
| "learning_rate": 3.2910241946661993e-05, |
| "loss": 0.2827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1274852603673935, |
| "step": 1540, |
| "valid_targets_mean": 3660.1, |
| "valid_targets_min": 1576 |
| }, |
| { |
| "epoch": 2.4523809523809526, |
| "grad_norm": 0.5596752424003796, |
| "learning_rate": 3.2849687696042165e-05, |
| "loss": 0.2811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12781956791877747, |
| "step": 1545, |
| "valid_targets_mean": 3888.6, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 2.4603174603174605, |
| "grad_norm": 0.6298774595726288, |
| "learning_rate": 3.2788932179817886e-05, |
| "loss": 0.2806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12249404937028885, |
| "step": 1550, |
| "valid_targets_mean": 3024.8, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 2.4682539682539684, |
| "grad_norm": 0.8294293286080818, |
| "learning_rate": 3.2727976349607276e-05, |
| "loss": 0.2869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16689524054527283, |
| "step": 1555, |
| "valid_targets_mean": 3518.5, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 2.4761904761904763, |
| "grad_norm": 0.8170059407606398, |
| "learning_rate": 3.266682116016599e-05, |
| "loss": 0.2865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15669232606887817, |
| "step": 1560, |
| "valid_targets_mean": 2421.6, |
| "valid_targets_min": 1520 |
| }, |
| { |
| "epoch": 2.484126984126984, |
| "grad_norm": 0.6500010061538937, |
| "learning_rate": 3.260546756937227e-05, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10150349140167236, |
| "step": 1565, |
| "valid_targets_mean": 2195.6, |
| "valid_targets_min": 1602 |
| }, |
| { |
| "epoch": 2.492063492063492, |
| "grad_norm": 0.8474876828092535, |
| "learning_rate": 3.254391653821192e-05, |
| "loss": 0.2723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16686615347862244, |
| "step": 1570, |
| "valid_targets_mean": 2120.5, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 2.5, |
| "grad_norm": 0.6084457929463493, |
| "learning_rate": 3.248216903076328e-05, |
| "loss": 0.286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11863277852535248, |
| "step": 1575, |
| "valid_targets_mean": 3777.1, |
| "valid_targets_min": 1557 |
| }, |
| { |
| "epoch": 2.507936507936508, |
| "grad_norm": 0.6549666435127953, |
| "learning_rate": 3.24202260141821e-05, |
| "loss": 0.282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1478644460439682, |
| "step": 1580, |
| "valid_targets_mean": 3566.9, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 2.515873015873016, |
| "grad_norm": 0.7084095804077182, |
| "learning_rate": 3.235808845868641e-05, |
| "loss": 0.2744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13560350239276886, |
| "step": 1585, |
| "valid_targets_mean": 3083.1, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 2.5238095238095237, |
| "grad_norm": 0.7283622693375735, |
| "learning_rate": 3.229575733754132e-05, |
| "loss": 0.285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13665327429771423, |
| "step": 1590, |
| "valid_targets_mean": 3873.9, |
| "valid_targets_min": 1988 |
| }, |
| { |
| "epoch": 2.5317460317460316, |
| "grad_norm": 0.7813924734763139, |
| "learning_rate": 3.2233233627043765e-05, |
| "loss": 0.2997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18560901284217834, |
| "step": 1595, |
| "valid_targets_mean": 3023.4, |
| "valid_targets_min": 1717 |
| }, |
| { |
| "epoch": 2.5396825396825395, |
| "grad_norm": 0.7724895632284718, |
| "learning_rate": 3.217051830650722e-05, |
| "loss": 0.2882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13543711602687836, |
| "step": 1600, |
| "valid_targets_mean": 2324.1, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 2.5476190476190474, |
| "grad_norm": 0.631251167859757, |
| "learning_rate": 3.210761235824639e-05, |
| "loss": 0.284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19025763869285583, |
| "step": 1605, |
| "valid_targets_mean": 4070.1, |
| "valid_targets_min": 1186 |
| }, |
| { |
| "epoch": 2.5555555555555554, |
| "grad_norm": 0.6693047102178958, |
| "learning_rate": 3.204451676756175e-05, |
| "loss": 0.272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13068076968193054, |
| "step": 1610, |
| "valid_targets_mean": 2703.6, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 2.5634920634920633, |
| "grad_norm": 0.6793425587783933, |
| "learning_rate": 3.198123252272419e-05, |
| "loss": 0.3072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15108279883861542, |
| "step": 1615, |
| "valid_targets_mean": 3861.0, |
| "valid_targets_min": 2115 |
| }, |
| { |
| "epoch": 2.571428571428571, |
| "grad_norm": 0.7533398118442075, |
| "learning_rate": 3.1917760614959505e-05, |
| "loss": 0.279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17746326327323914, |
| "step": 1620, |
| "valid_targets_mean": 3869.5, |
| "valid_targets_min": 2101 |
| }, |
| { |
| "epoch": 2.5793650793650795, |
| "grad_norm": 0.6401603357735229, |
| "learning_rate": 3.1854102038432856e-05, |
| "loss": 0.2779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0972735583782196, |
| "step": 1625, |
| "valid_targets_mean": 2536.4, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 2.5873015873015874, |
| "grad_norm": 0.6534800131136479, |
| "learning_rate": 3.17902577902332e-05, |
| "loss": 0.2885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1368650197982788, |
| "step": 1630, |
| "valid_targets_mean": 3628.0, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 2.5952380952380953, |
| "grad_norm": 0.6723421200741301, |
| "learning_rate": 3.172622887035771e-05, |
| "loss": 0.303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16636143624782562, |
| "step": 1635, |
| "valid_targets_mean": 3449.6, |
| "valid_targets_min": 1366 |
| }, |
| { |
| "epoch": 2.6031746031746033, |
| "grad_norm": 0.6086043667473161, |
| "learning_rate": 3.1662016281696073e-05, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1077192947268486, |
| "step": 1640, |
| "valid_targets_mean": 3127.9, |
| "valid_targets_min": 1693 |
| }, |
| { |
| "epoch": 2.611111111111111, |
| "grad_norm": 0.5976415874014748, |
| "learning_rate": 3.15976210300148e-05, |
| "loss": 0.277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08958538621664047, |
| "step": 1645, |
| "valid_targets_mean": 2533.8, |
| "valid_targets_min": 1440 |
| }, |
| { |
| "epoch": 2.619047619047619, |
| "grad_norm": 0.7581524318153838, |
| "learning_rate": 3.153304412394143e-05, |
| "loss": 0.2873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1573348343372345, |
| "step": 1650, |
| "valid_targets_mean": 2123.6, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 2.626984126984127, |
| "grad_norm": 0.754404491585718, |
| "learning_rate": 3.146828657494883e-05, |
| "loss": 0.2899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14607343077659607, |
| "step": 1655, |
| "valid_targets_mean": 2874.5, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 2.634920634920635, |
| "grad_norm": 0.7776622806557849, |
| "learning_rate": 3.140334939733924e-05, |
| "loss": 0.283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15422557294368744, |
| "step": 1660, |
| "valid_targets_mean": 2812.4, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 2.642857142857143, |
| "grad_norm": 0.7851829681510233, |
| "learning_rate": 3.1338233608228455e-05, |
| "loss": 0.2923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17594920098781586, |
| "step": 1665, |
| "valid_targets_mean": 4304.4, |
| "valid_targets_min": 1584 |
| }, |
| { |
| "epoch": 2.6507936507936507, |
| "grad_norm": 0.6186866548868446, |
| "learning_rate": 3.127294022752988e-05, |
| "loss": 0.2907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12931489944458008, |
| "step": 1670, |
| "valid_targets_mean": 4241.0, |
| "valid_targets_min": 1549 |
| }, |
| { |
| "epoch": 2.6587301587301586, |
| "grad_norm": 0.6404478009955566, |
| "learning_rate": 3.120747027793854e-05, |
| "loss": 0.2824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1313716024160385, |
| "step": 1675, |
| "valid_targets_mean": 3436.2, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 2.6666666666666665, |
| "grad_norm": 0.6424760221978681, |
| "learning_rate": 3.114182478491509e-05, |
| "loss": 0.2965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14358645677566528, |
| "step": 1680, |
| "valid_targets_mean": 3566.9, |
| "valid_targets_min": 1824 |
| }, |
| { |
| "epoch": 2.674603174603175, |
| "grad_norm": 0.6212608954505446, |
| "learning_rate": 3.107600477666969e-05, |
| "loss": 0.2689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11525902152061462, |
| "step": 1685, |
| "valid_targets_mean": 4901.4, |
| "valid_targets_min": 1684 |
| }, |
| { |
| "epoch": 2.682539682539683, |
| "grad_norm": 0.7373215482236564, |
| "learning_rate": 3.1010011284146004e-05, |
| "loss": 0.2748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15655554831027985, |
| "step": 1690, |
| "valid_targets_mean": 2539.5, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 2.6904761904761907, |
| "grad_norm": 0.7711994151976389, |
| "learning_rate": 3.0943845341004944e-05, |
| "loss": 0.2856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15932291746139526, |
| "step": 1695, |
| "valid_targets_mean": 2453.8, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.6984126984126986, |
| "grad_norm": 0.5832119782072631, |
| "learning_rate": 3.087750798360856e-05, |
| "loss": 0.296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09954415261745453, |
| "step": 1700, |
| "valid_targets_mean": 3089.4, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 2.7063492063492065, |
| "grad_norm": 0.6507828484721623, |
| "learning_rate": 3.0811000251003774e-05, |
| "loss": 0.276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15949490666389465, |
| "step": 1705, |
| "valid_targets_mean": 3973.5, |
| "valid_targets_min": 1863 |
| }, |
| { |
| "epoch": 2.7142857142857144, |
| "grad_norm": 0.647286678324319, |
| "learning_rate": 3.074432318490608e-05, |
| "loss": 0.2749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16663986444473267, |
| "step": 1710, |
| "valid_targets_mean": 3909.6, |
| "valid_targets_min": 1870 |
| }, |
| { |
| "epoch": 2.7222222222222223, |
| "grad_norm": 0.5662716434730383, |
| "learning_rate": 3.067747782968328e-05, |
| "loss": 0.2761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12369729578495026, |
| "step": 1715, |
| "valid_targets_mean": 4857.1, |
| "valid_targets_min": 2173 |
| }, |
| { |
| "epoch": 2.7301587301587302, |
| "grad_norm": 0.6836298091917609, |
| "learning_rate": 3.0610465232339096e-05, |
| "loss": 0.2844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11899368464946747, |
| "step": 1720, |
| "valid_targets_mean": 3117.0, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 2.738095238095238, |
| "grad_norm": 0.611020228050993, |
| "learning_rate": 3.054328644249677e-05, |
| "loss": 0.2876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11934395879507065, |
| "step": 1725, |
| "valid_targets_mean": 2926.1, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 2.746031746031746, |
| "grad_norm": 0.7971191409966951, |
| "learning_rate": 3.047594251238265e-05, |
| "loss": 0.3046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18401601910591125, |
| "step": 1730, |
| "valid_targets_mean": 3678.5, |
| "valid_targets_min": 1815 |
| }, |
| { |
| "epoch": 2.753968253968254, |
| "grad_norm": 0.6824521691463085, |
| "learning_rate": 3.0408434496809643e-05, |
| "loss": 0.31, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14168040454387665, |
| "step": 1735, |
| "valid_targets_mean": 2618.5, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 2.761904761904762, |
| "grad_norm": 0.7071997600045877, |
| "learning_rate": 3.034076345316079e-05, |
| "loss": 0.2696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13625219464302063, |
| "step": 1740, |
| "valid_targets_mean": 3389.4, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 2.7698412698412698, |
| "grad_norm": 0.6570185747900452, |
| "learning_rate": 3.0272930441372628e-05, |
| "loss": 0.2825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12578660249710083, |
| "step": 1745, |
| "valid_targets_mean": 3387.0, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 2.7777777777777777, |
| "grad_norm": 0.5756355415915643, |
| "learning_rate": 3.02049365239186e-05, |
| "loss": 0.2599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13883277773857117, |
| "step": 1750, |
| "valid_targets_mean": 4081.4, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 2.7857142857142856, |
| "grad_norm": 0.6741636937753623, |
| "learning_rate": 3.0136782765792455e-05, |
| "loss": 0.2806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14945513010025024, |
| "step": 1755, |
| "valid_targets_mean": 3490.8, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 2.7936507936507935, |
| "grad_norm": 0.6285050348403557, |
| "learning_rate": 3.0068470234491517e-05, |
| "loss": 0.2742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16284587979316711, |
| "step": 1760, |
| "valid_targets_mean": 4642.1, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 2.8015873015873014, |
| "grad_norm": 0.6692873837736333, |
| "learning_rate": 3.0000000000000004e-05, |
| "loss": 0.2913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11234371364116669, |
| "step": 1765, |
| "valid_targets_mean": 3148.2, |
| "valid_targets_min": 532 |
| }, |
| { |
| "epoch": 2.8095238095238093, |
| "grad_norm": 0.6308462732358487, |
| "learning_rate": 2.993137313477223e-05, |
| "loss": 0.291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09374731779098511, |
| "step": 1770, |
| "valid_targets_mean": 2508.5, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 2.817460317460317, |
| "grad_norm": 0.7007377433335262, |
| "learning_rate": 2.9862590713715837e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1225220113992691, |
| "step": 1775, |
| "valid_targets_mean": 2797.4, |
| "valid_targets_min": 932 |
| }, |
| { |
| "epoch": 2.825396825396825, |
| "grad_norm": 0.6598142297768089, |
| "learning_rate": 2.9793653814174957e-05, |
| "loss": 0.2974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13078439235687256, |
| "step": 1780, |
| "valid_targets_mean": 3160.2, |
| "valid_targets_min": 1406 |
| }, |
| { |
| "epoch": 2.8333333333333335, |
| "grad_norm": 0.6341362087786145, |
| "learning_rate": 2.9724563515913317e-05, |
| "loss": 0.2834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08914564549922943, |
| "step": 1785, |
| "valid_targets_mean": 2214.0, |
| "valid_targets_min": 486 |
| }, |
| { |
| "epoch": 2.8412698412698414, |
| "grad_norm": 0.7609575143650333, |
| "learning_rate": 2.9655320901097348e-05, |
| "loss": 0.28, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15402570366859436, |
| "step": 1790, |
| "valid_targets_mean": 2849.5, |
| "valid_targets_min": 1404 |
| }, |
| { |
| "epoch": 2.8492063492063493, |
| "grad_norm": 0.6657562541253584, |
| "learning_rate": 2.9585927054279224e-05, |
| "loss": 0.2685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.143843412399292, |
| "step": 1795, |
| "valid_targets_mean": 3437.2, |
| "valid_targets_min": 1651 |
| }, |
| { |
| "epoch": 2.857142857142857, |
| "grad_norm": 0.6799877740404671, |
| "learning_rate": 2.951638306237988e-05, |
| "loss": 0.2786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15773284435272217, |
| "step": 1800, |
| "valid_targets_mean": 2877.4, |
| "valid_targets_min": 1139 |
| }, |
| { |
| "epoch": 2.865079365079365, |
| "grad_norm": 0.6865473240955069, |
| "learning_rate": 2.9446690014671976e-05, |
| "loss": 0.2808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1253039836883545, |
| "step": 1805, |
| "valid_targets_mean": 2390.0, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 2.873015873015873, |
| "grad_norm": 0.6534863995749159, |
| "learning_rate": 2.937684900276285e-05, |
| "loss": 0.2725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11391299962997437, |
| "step": 1810, |
| "valid_targets_mean": 2806.4, |
| "valid_targets_min": 1592 |
| }, |
| { |
| "epoch": 2.880952380952381, |
| "grad_norm": 0.7567889432998731, |
| "learning_rate": 2.9306861120577416e-05, |
| "loss": 0.2573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11856131255626678, |
| "step": 1815, |
| "valid_targets_mean": 2440.9, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 2.888888888888889, |
| "grad_norm": 0.6635665729697707, |
| "learning_rate": 2.923672746434103e-05, |
| "loss": 0.2906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11890023946762085, |
| "step": 1820, |
| "valid_targets_mean": 3114.4, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 2.8968253968253967, |
| "grad_norm": 0.7898960244652132, |
| "learning_rate": 2.9166449132562303e-05, |
| "loss": 0.2921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2273479551076889, |
| "step": 1825, |
| "valid_targets_mean": 3445.4, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 2.9047619047619047, |
| "grad_norm": 0.6221253005823774, |
| "learning_rate": 2.9096027226015927e-05, |
| "loss": 0.2698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16060924530029297, |
| "step": 1830, |
| "valid_targets_mean": 3911.6, |
| "valid_targets_min": 1618 |
| }, |
| { |
| "epoch": 2.9126984126984126, |
| "grad_norm": 0.6890919052022301, |
| "learning_rate": 2.9025462847725405e-05, |
| "loss": 0.3028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15114042162895203, |
| "step": 1835, |
| "valid_targets_mean": 3334.8, |
| "valid_targets_min": 1413 |
| }, |
| { |
| "epoch": 2.9206349206349205, |
| "grad_norm": 0.7151703994390879, |
| "learning_rate": 2.8954757102945798e-05, |
| "loss": 0.2743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.164110004901886, |
| "step": 1840, |
| "valid_targets_mean": 3427.1, |
| "valid_targets_min": 1160 |
| }, |
| { |
| "epoch": 2.928571428571429, |
| "grad_norm": 0.6725713608557474, |
| "learning_rate": 2.888391109914638e-05, |
| "loss": 0.2785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17118103802204132, |
| "step": 1845, |
| "valid_targets_mean": 4161.8, |
| "valid_targets_min": 1537 |
| }, |
| { |
| "epoch": 2.9365079365079367, |
| "grad_norm": 0.6210771507140483, |
| "learning_rate": 2.8812925945993333e-05, |
| "loss": 0.2856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10453899949789047, |
| "step": 1850, |
| "valid_targets_mean": 3119.2, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 2.9444444444444446, |
| "grad_norm": 0.6584848576192016, |
| "learning_rate": 2.8741802755332332e-05, |
| "loss": 0.288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15300224721431732, |
| "step": 1855, |
| "valid_targets_mean": 3997.0, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 2.9523809523809526, |
| "grad_norm": 0.603729636604423, |
| "learning_rate": 2.8670542641171155e-05, |
| "loss": 0.2735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16688242554664612, |
| "step": 1860, |
| "valid_targets_mean": 3805.8, |
| "valid_targets_min": 1368 |
| }, |
| { |
| "epoch": 2.9603174603174605, |
| "grad_norm": 0.6685639760048532, |
| "learning_rate": 2.859914671966221e-05, |
| "loss": 0.283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15483403205871582, |
| "step": 1865, |
| "valid_targets_mean": 3771.5, |
| "valid_targets_min": 2012 |
| }, |
| { |
| "epoch": 2.9682539682539684, |
| "grad_norm": 0.7257652525758371, |
| "learning_rate": 2.8527616109085082e-05, |
| "loss": 0.2695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11175280809402466, |
| "step": 1870, |
| "valid_targets_mean": 2321.2, |
| "valid_targets_min": 1040 |
| }, |
| { |
| "epoch": 2.9761904761904763, |
| "grad_norm": 0.764225120374443, |
| "learning_rate": 2.8455951929828977e-05, |
| "loss": 0.2918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16258296370506287, |
| "step": 1875, |
| "valid_targets_mean": 2744.0, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 2.984126984126984, |
| "grad_norm": 0.7040782057209479, |
| "learning_rate": 2.8384155304375223e-05, |
| "loss": 0.2815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2076944261789322, |
| "step": 1880, |
| "valid_targets_mean": 4440.1, |
| "valid_targets_min": 1859 |
| }, |
| { |
| "epoch": 2.992063492063492, |
| "grad_norm": 0.5526066260270843, |
| "learning_rate": 2.8312227357279646e-05, |
| "loss": 0.2772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1588117629289627, |
| "step": 1885, |
| "valid_targets_mean": 4321.2, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 3.0, |
| "grad_norm": 0.7083973280267318, |
| "learning_rate": 2.8240169215154977e-05, |
| "loss": 0.2818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11426911503076553, |
| "step": 1890, |
| "valid_targets_mean": 2519.1, |
| "valid_targets_min": 1488 |
| }, |
| { |
| "epoch": 3.007936507936508, |
| "grad_norm": 0.6902028100549552, |
| "learning_rate": 2.8167982006653196e-05, |
| "loss": 0.2705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12100070714950562, |
| "step": 1895, |
| "valid_targets_mean": 2715.6, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 3.015873015873016, |
| "grad_norm": 0.7498148150106853, |
| "learning_rate": 2.8095666862447876e-05, |
| "loss": 0.2509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15154170989990234, |
| "step": 1900, |
| "valid_targets_mean": 3611.8, |
| "valid_targets_min": 1506 |
| }, |
| { |
| "epoch": 3.0238095238095237, |
| "grad_norm": 0.6616656629988206, |
| "learning_rate": 2.8023224915216442e-05, |
| "loss": 0.2499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1271711140871048, |
| "step": 1905, |
| "valid_targets_mean": 3507.9, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 3.0317460317460316, |
| "grad_norm": 0.7116856168102649, |
| "learning_rate": 2.795065729962244e-05, |
| "loss": 0.254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08189952373504639, |
| "step": 1910, |
| "valid_targets_mean": 2039.9, |
| "valid_targets_min": 1125 |
| }, |
| { |
| "epoch": 3.0396825396825395, |
| "grad_norm": 0.6876408809777227, |
| "learning_rate": 2.7877965152297785e-05, |
| "loss": 0.2422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10088761150836945, |
| "step": 1915, |
| "valid_targets_mean": 2376.2, |
| "valid_targets_min": 1454 |
| }, |
| { |
| "epoch": 3.0476190476190474, |
| "grad_norm": 0.6942636265425131, |
| "learning_rate": 2.780514961182492e-05, |
| "loss": 0.2539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1270643174648285, |
| "step": 1920, |
| "valid_targets_mean": 3030.1, |
| "valid_targets_min": 1496 |
| }, |
| { |
| "epoch": 3.0555555555555554, |
| "grad_norm": 0.6047340947825474, |
| "learning_rate": 2.773221181871903e-05, |
| "loss": 0.2416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1178026869893074, |
| "step": 1925, |
| "valid_targets_mean": 4042.6, |
| "valid_targets_min": 1537 |
| }, |
| { |
| "epoch": 3.0634920634920633, |
| "grad_norm": 0.6821898699763301, |
| "learning_rate": 2.765915291541013e-05, |
| "loss": 0.2527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13922007381916046, |
| "step": 1930, |
| "valid_targets_mean": 3912.5, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 3.0714285714285716, |
| "grad_norm": 0.6551781793298332, |
| "learning_rate": 2.7585974046225206e-05, |
| "loss": 0.2585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14014190435409546, |
| "step": 1935, |
| "valid_targets_mean": 3799.6, |
| "valid_targets_min": 1019 |
| }, |
| { |
| "epoch": 3.0793650793650795, |
| "grad_norm": 0.7821365657217646, |
| "learning_rate": 2.751267635737027e-05, |
| "loss": 0.2404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1164986789226532, |
| "step": 1940, |
| "valid_targets_mean": 2321.2, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 3.0873015873015874, |
| "grad_norm": 0.6698276676313706, |
| "learning_rate": 2.7439260996912423e-05, |
| "loss": 0.246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11518267542123795, |
| "step": 1945, |
| "valid_targets_mean": 3101.5, |
| "valid_targets_min": 1563 |
| }, |
| { |
| "epoch": 3.0952380952380953, |
| "grad_norm": 0.7281910335267264, |
| "learning_rate": 2.7365729114761862e-05, |
| "loss": 0.277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1856643557548523, |
| "step": 1950, |
| "valid_targets_mean": 3758.4, |
| "valid_targets_min": 1446 |
| }, |
| { |
| "epoch": 3.1031746031746033, |
| "grad_norm": 0.8454083755018548, |
| "learning_rate": 2.729208186265386e-05, |
| "loss": 0.2565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17740434408187866, |
| "step": 1955, |
| "valid_targets_mean": 3700.9, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 3.111111111111111, |
| "grad_norm": 0.8235684513843857, |
| "learning_rate": 2.721832039413077e-05, |
| "loss": 0.2555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12159430235624313, |
| "step": 1960, |
| "valid_targets_mean": 2358.2, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 3.119047619047619, |
| "grad_norm": 0.7603822952932935, |
| "learning_rate": 2.7144445864523887e-05, |
| "loss": 0.2471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11871971189975739, |
| "step": 1965, |
| "valid_targets_mean": 2330.9, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 3.126984126984127, |
| "grad_norm": 0.5890854643098785, |
| "learning_rate": 2.7070459430935407e-05, |
| "loss": 0.244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11397400498390198, |
| "step": 1970, |
| "valid_targets_mean": 3696.4, |
| "valid_targets_min": 1454 |
| }, |
| { |
| "epoch": 3.134920634920635, |
| "grad_norm": 0.6251976447943539, |
| "learning_rate": 2.69963622522203e-05, |
| "loss": 0.2494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10502277314662933, |
| "step": 1975, |
| "valid_targets_mean": 3759.9, |
| "valid_targets_min": 2157 |
| }, |
| { |
| "epoch": 3.142857142857143, |
| "grad_norm": 0.723522815940443, |
| "learning_rate": 2.6922155488968117e-05, |
| "loss": 0.2437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10363540053367615, |
| "step": 1980, |
| "valid_targets_mean": 2637.6, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 3.1507936507936507, |
| "grad_norm": 0.890979704609736, |
| "learning_rate": 2.684784030348486e-05, |
| "loss": 0.2656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13063833117485046, |
| "step": 1985, |
| "valid_targets_mean": 2054.8, |
| "valid_targets_min": 1050 |
| }, |
| { |
| "epoch": 3.1587301587301586, |
| "grad_norm": 0.7071717645076813, |
| "learning_rate": 2.6773417859774755e-05, |
| "loss": 0.2544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11484183371067047, |
| "step": 1990, |
| "valid_targets_mean": 3003.2, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 3.1666666666666665, |
| "grad_norm": 0.7255166589054973, |
| "learning_rate": 2.669888932352201e-05, |
| "loss": 0.2502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10529197752475739, |
| "step": 1995, |
| "valid_targets_mean": 2306.5, |
| "valid_targets_min": 1230 |
| }, |
| { |
| "epoch": 3.1746031746031744, |
| "grad_norm": 0.7002772175531771, |
| "learning_rate": 2.662425586207259e-05, |
| "loss": 0.2665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12117639183998108, |
| "step": 2000, |
| "valid_targets_mean": 3534.6, |
| "valid_targets_min": 1424 |
| }, |
| { |
| "epoch": 3.1825396825396823, |
| "grad_norm": 0.646490577280726, |
| "learning_rate": 2.6549518644415876e-05, |
| "loss": 0.2467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09091825038194656, |
| "step": 2005, |
| "valid_targets_mean": 2662.6, |
| "valid_targets_min": 1489 |
| }, |
| { |
| "epoch": 3.1904761904761907, |
| "grad_norm": 0.6342896994103852, |
| "learning_rate": 2.6474678841166426e-05, |
| "loss": 0.2604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1556168496608734, |
| "step": 2010, |
| "valid_targets_mean": 4756.2, |
| "valid_targets_min": 1659 |
| }, |
| { |
| "epoch": 3.1984126984126986, |
| "grad_norm": 0.6522004622714066, |
| "learning_rate": 2.639973762454558e-05, |
| "loss": 0.2518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12138301134109497, |
| "step": 2015, |
| "valid_targets_mean": 3672.4, |
| "valid_targets_min": 1612 |
| }, |
| { |
| "epoch": 3.2063492063492065, |
| "grad_norm": 0.7782670981533159, |
| "learning_rate": 2.6324696168363134e-05, |
| "loss": 0.2527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1658809781074524, |
| "step": 2020, |
| "valid_targets_mean": 3090.1, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 3.2142857142857144, |
| "grad_norm": 0.6622860830034212, |
| "learning_rate": 2.624955564799894e-05, |
| "loss": 0.2479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1196448802947998, |
| "step": 2025, |
| "valid_targets_mean": 3399.8, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 3.2222222222222223, |
| "grad_norm": 0.693901810628061, |
| "learning_rate": 2.617431724038451e-05, |
| "loss": 0.2486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10215766727924347, |
| "step": 2030, |
| "valid_targets_mean": 2399.5, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 3.2301587301587302, |
| "grad_norm": 0.5671979640230917, |
| "learning_rate": 2.609898212398455e-05, |
| "loss": 0.2482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16594891250133514, |
| "step": 2035, |
| "valid_targets_mean": 5821.9, |
| "valid_targets_min": 1505 |
| }, |
| { |
| "epoch": 3.238095238095238, |
| "grad_norm": 0.6974681739689081, |
| "learning_rate": 2.6023551478778535e-05, |
| "loss": 0.2549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11858563125133514, |
| "step": 2040, |
| "valid_targets_mean": 2829.8, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 3.246031746031746, |
| "grad_norm": 0.6882592331713957, |
| "learning_rate": 2.5948026486242225e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10707972943782806, |
| "step": 2045, |
| "valid_targets_mean": 3013.4, |
| "valid_targets_min": 1161 |
| }, |
| { |
| "epoch": 3.253968253968254, |
| "grad_norm": 0.6051374206215899, |
| "learning_rate": 2.5872408329329136e-05, |
| "loss": 0.2594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14780555665493011, |
| "step": 2050, |
| "valid_targets_mean": 6003.6, |
| "valid_targets_min": 2869 |
| }, |
| { |
| "epoch": 3.261904761904762, |
| "grad_norm": 0.8178419818692619, |
| "learning_rate": 2.5796698192452016e-05, |
| "loss": 0.2524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13839825987815857, |
| "step": 2055, |
| "valid_targets_mean": 3007.5, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 3.2698412698412698, |
| "grad_norm": 0.610892128183204, |
| "learning_rate": 2.572089726146432e-05, |
| "loss": 0.2501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.131939098238945, |
| "step": 2060, |
| "valid_targets_mean": 4979.1, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 3.2777777777777777, |
| "grad_norm": 0.5925456999380748, |
| "learning_rate": 2.564500672364162e-05, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08675329387187958, |
| "step": 2065, |
| "valid_targets_mean": 3128.8, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 3.2857142857142856, |
| "grad_norm": 0.7101170401554764, |
| "learning_rate": 2.556902776766298e-05, |
| "loss": 0.2546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11017313599586487, |
| "step": 2070, |
| "valid_targets_mean": 2635.2, |
| "valid_targets_min": 1656 |
| }, |
| { |
| "epoch": 3.2936507936507935, |
| "grad_norm": 0.6737500763312219, |
| "learning_rate": 2.5492961583592397e-05, |
| "loss": 0.2512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11181756108999252, |
| "step": 2075, |
| "valid_targets_mean": 2606.4, |
| "valid_targets_min": 1535 |
| }, |
| { |
| "epoch": 3.3015873015873014, |
| "grad_norm": 0.7396901842301878, |
| "learning_rate": 2.5416809362860107e-05, |
| "loss": 0.2524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13949820399284363, |
| "step": 2080, |
| "valid_targets_mean": 3067.6, |
| "valid_targets_min": 1132 |
| }, |
| { |
| "epoch": 3.3095238095238093, |
| "grad_norm": 0.6498890292466925, |
| "learning_rate": 2.5340572298243946e-05, |
| "loss": 0.253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10242730379104614, |
| "step": 2085, |
| "valid_targets_mean": 2982.5, |
| "valid_targets_min": 1488 |
| }, |
| { |
| "epoch": 3.317460317460317, |
| "grad_norm": 0.7574837036969985, |
| "learning_rate": 2.5264251583850677e-05, |
| "loss": 0.2603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1579362004995346, |
| "step": 2090, |
| "valid_targets_mean": 3493.5, |
| "valid_targets_min": 1290 |
| }, |
| { |
| "epoch": 3.3253968253968256, |
| "grad_norm": 0.5407051448256301, |
| "learning_rate": 2.518784841509726e-05, |
| "loss": 0.2513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11689899861812592, |
| "step": 2095, |
| "valid_targets_mean": 4560.6, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 3.3333333333333335, |
| "grad_norm": 0.6970226932960573, |
| "learning_rate": 2.511136398869216e-05, |
| "loss": 0.2449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13105079531669617, |
| "step": 2100, |
| "valid_targets_mean": 3603.1, |
| "valid_targets_min": 331 |
| }, |
| { |
| "epoch": 3.3412698412698414, |
| "grad_norm": 0.7186804216812557, |
| "learning_rate": 2.503479950261658e-05, |
| "loss": 0.2502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13403379917144775, |
| "step": 2105, |
| "valid_targets_mean": 2903.1, |
| "valid_targets_min": 1096 |
| }, |
| { |
| "epoch": 3.3492063492063493, |
| "grad_norm": 0.6455942984531485, |
| "learning_rate": 2.4958156156105693e-05, |
| "loss": 0.239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10922306776046753, |
| "step": 2110, |
| "valid_targets_mean": 3211.5, |
| "valid_targets_min": 2118 |
| }, |
| { |
| "epoch": 3.357142857142857, |
| "grad_norm": 0.6571243872308732, |
| "learning_rate": 2.4881435149629892e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13601714372634888, |
| "step": 2115, |
| "valid_targets_mean": 3930.4, |
| "valid_targets_min": 1427 |
| }, |
| { |
| "epoch": 3.365079365079365, |
| "grad_norm": 0.6585273608503487, |
| "learning_rate": 2.4804637684875937e-05, |
| "loss": 0.2536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10247397422790527, |
| "step": 2120, |
| "valid_targets_mean": 2421.5, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 3.373015873015873, |
| "grad_norm": 0.62544048579586, |
| "learning_rate": 2.4727764964728177e-05, |
| "loss": 0.2455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16413845121860504, |
| "step": 2125, |
| "valid_targets_mean": 4857.9, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 3.380952380952381, |
| "grad_norm": 0.6792630869673345, |
| "learning_rate": 2.4650818193249693e-05, |
| "loss": 0.243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12296905368566513, |
| "step": 2130, |
| "valid_targets_mean": 3710.6, |
| "valid_targets_min": 1830 |
| }, |
| { |
| "epoch": 3.388888888888889, |
| "grad_norm": 0.6779730353915933, |
| "learning_rate": 2.4573798575663425e-05, |
| "loss": 0.2672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11248013377189636, |
| "step": 2135, |
| "valid_targets_mean": 2979.5, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 3.3968253968253967, |
| "grad_norm": 0.9098770112161331, |
| "learning_rate": 2.4496707318333323e-05, |
| "loss": 0.2643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12486522644758224, |
| "step": 2140, |
| "valid_targets_mean": 1802.4, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 3.4047619047619047, |
| "grad_norm": 0.7636101057011379, |
| "learning_rate": 2.441954562874541e-05, |
| "loss": 0.2766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.125074565410614, |
| "step": 2145, |
| "valid_targets_mean": 2825.0, |
| "valid_targets_min": 1558 |
| }, |
| { |
| "epoch": 3.4126984126984126, |
| "grad_norm": 0.6467450666633284, |
| "learning_rate": 2.434231471548893e-05, |
| "loss": 0.2551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08474473655223846, |
| "step": 2150, |
| "valid_targets_mean": 3010.1, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.4206349206349205, |
| "grad_norm": 0.6917977015493815, |
| "learning_rate": 2.4265015788237348e-05, |
| "loss": 0.2498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1237451583147049, |
| "step": 2155, |
| "valid_targets_mean": 2535.2, |
| "valid_targets_min": 1103 |
| }, |
| { |
| "epoch": 3.4285714285714284, |
| "grad_norm": 0.7739173113165484, |
| "learning_rate": 2.4187650057729465e-05, |
| "loss": 0.2567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13617797195911407, |
| "step": 2160, |
| "valid_targets_mean": 2652.1, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 3.4365079365079367, |
| "grad_norm": 0.6831983748541813, |
| "learning_rate": 2.4110218735750403e-05, |
| "loss": 0.2572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12043888866901398, |
| "step": 2165, |
| "valid_targets_mean": 3557.0, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 3.4444444444444446, |
| "grad_norm": 0.6052935127475482, |
| "learning_rate": 2.4032723035112667e-05, |
| "loss": 0.2385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10145443677902222, |
| "step": 2170, |
| "valid_targets_mean": 4060.8, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 3.4523809523809526, |
| "grad_norm": 0.7675317267799375, |
| "learning_rate": 2.3955164169637124e-05, |
| "loss": 0.2541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08529975265264511, |
| "step": 2175, |
| "valid_targets_mean": 1873.2, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 3.4603174603174605, |
| "grad_norm": 0.6683938001153137, |
| "learning_rate": 2.387754335413398e-05, |
| "loss": 0.2592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10772879421710968, |
| "step": 2180, |
| "valid_targets_mean": 3114.6, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 3.4682539682539684, |
| "grad_norm": 0.6735296084441879, |
| "learning_rate": 2.3799861804383807e-05, |
| "loss": 0.2579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13499006628990173, |
| "step": 2185, |
| "valid_targets_mean": 3644.8, |
| "valid_targets_min": 1400 |
| }, |
| { |
| "epoch": 3.4761904761904763, |
| "grad_norm": 0.6831817897125874, |
| "learning_rate": 2.3722120737118414e-05, |
| "loss": 0.2635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07938480377197266, |
| "step": 2190, |
| "valid_targets_mean": 1924.0, |
| "valid_targets_min": 1054 |
| }, |
| { |
| "epoch": 3.484126984126984, |
| "grad_norm": 0.6737327071370827, |
| "learning_rate": 2.3644321370001868e-05, |
| "loss": 0.2562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1572818160057068, |
| "step": 2195, |
| "valid_targets_mean": 2819.1, |
| "valid_targets_min": 1142 |
| }, |
| { |
| "epoch": 3.492063492063492, |
| "grad_norm": 0.6691135799512201, |
| "learning_rate": 2.3566464921611393e-05, |
| "loss": 0.2378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11640235781669617, |
| "step": 2200, |
| "valid_targets_mean": 2922.6, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 3.5, |
| "grad_norm": 0.6587392719241073, |
| "learning_rate": 2.348855261141827e-05, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10942356288433075, |
| "step": 2205, |
| "valid_targets_mean": 3722.4, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 3.507936507936508, |
| "grad_norm": 0.750713040033646, |
| "learning_rate": 2.341058565976874e-05, |
| "loss": 0.2549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13870318233966827, |
| "step": 2210, |
| "valid_targets_mean": 2861.6, |
| "valid_targets_min": 1779 |
| }, |
| { |
| "epoch": 3.515873015873016, |
| "grad_norm": 0.7491380731832215, |
| "learning_rate": 2.3332565287864918e-05, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14582455158233643, |
| "step": 2215, |
| "valid_targets_mean": 2783.4, |
| "valid_targets_min": 1314 |
| }, |
| { |
| "epoch": 3.5238095238095237, |
| "grad_norm": 0.6351357539271595, |
| "learning_rate": 2.325449271774563e-05, |
| "loss": 0.251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11707961559295654, |
| "step": 2220, |
| "valid_targets_mean": 3604.9, |
| "valid_targets_min": 1073 |
| }, |
| { |
| "epoch": 3.5317460317460316, |
| "grad_norm": 0.8231068256271177, |
| "learning_rate": 2.3176369172267286e-05, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19035357236862183, |
| "step": 2225, |
| "valid_targets_mean": 3547.5, |
| "valid_targets_min": 1823 |
| }, |
| { |
| "epoch": 3.5396825396825395, |
| "grad_norm": 0.6637559646990401, |
| "learning_rate": 2.3098195875084732e-05, |
| "loss": 0.2798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19387897849082947, |
| "step": 2230, |
| "valid_targets_mean": 4797.4, |
| "valid_targets_min": 1702 |
| }, |
| { |
| "epoch": 3.5476190476190474, |
| "grad_norm": 0.5840086031255308, |
| "learning_rate": 2.301997405063208e-05, |
| "loss": 0.2491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13106292486190796, |
| "step": 2235, |
| "valid_targets_mean": 4836.0, |
| "valid_targets_min": 2196 |
| }, |
| { |
| "epoch": 3.5555555555555554, |
| "grad_norm": 0.6883285297059432, |
| "learning_rate": 2.2941704924103535e-05, |
| "loss": 0.2409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0974530503153801, |
| "step": 2240, |
| "valid_targets_mean": 2712.2, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 3.5634920634920633, |
| "grad_norm": 0.6118340955483631, |
| "learning_rate": 2.2863389721434165e-05, |
| "loss": 0.2658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13404448330402374, |
| "step": 2245, |
| "valid_targets_mean": 3707.8, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 3.571428571428571, |
| "grad_norm": 0.6823518338026194, |
| "learning_rate": 2.2785029669280775e-05, |
| "loss": 0.2675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09207911789417267, |
| "step": 2250, |
| "valid_targets_mean": 2036.5, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 3.5793650793650795, |
| "grad_norm": 0.722255561298478, |
| "learning_rate": 2.2706625995002626e-05, |
| "loss": 0.2507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11790738254785538, |
| "step": 2255, |
| "valid_targets_mean": 2746.2, |
| "valid_targets_min": 1230 |
| }, |
| { |
| "epoch": 3.5873015873015874, |
| "grad_norm": 0.6732026842214269, |
| "learning_rate": 2.262817992664224e-05, |
| "loss": 0.249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14672116935253143, |
| "step": 2260, |
| "valid_targets_mean": 4038.0, |
| "valid_targets_min": 1675 |
| }, |
| { |
| "epoch": 3.5952380952380953, |
| "grad_norm": 0.781949743871262, |
| "learning_rate": 2.2549692692906158e-05, |
| "loss": 0.2714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13185100257396698, |
| "step": 2265, |
| "valid_targets_mean": 2627.5, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 3.6031746031746033, |
| "grad_norm": 0.7262791657638447, |
| "learning_rate": 2.24711655231457e-05, |
| "loss": 0.251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20940609276294708, |
| "step": 2270, |
| "valid_targets_mean": 5433.1, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 3.611111111111111, |
| "grad_norm": 0.784848270932435, |
| "learning_rate": 2.2392599647337724e-05, |
| "loss": 0.2514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12663155794143677, |
| "step": 2275, |
| "valid_targets_mean": 2872.4, |
| "valid_targets_min": 1406 |
| }, |
| { |
| "epoch": 3.619047619047619, |
| "grad_norm": 0.6453755291298704, |
| "learning_rate": 2.23139962960653e-05, |
| "loss": 0.2567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16382941603660583, |
| "step": 2280, |
| "valid_targets_mean": 5086.6, |
| "valid_targets_min": 1625 |
| }, |
| { |
| "epoch": 3.626984126984127, |
| "grad_norm": 0.6243214368704214, |
| "learning_rate": 2.2235356700498528e-05, |
| "loss": 0.2574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09489156305789948, |
| "step": 2285, |
| "valid_targets_mean": 2987.9, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 3.634920634920635, |
| "grad_norm": 0.728831644905216, |
| "learning_rate": 2.2156682092375175e-05, |
| "loss": 0.2584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12532003223896027, |
| "step": 2290, |
| "valid_targets_mean": 3108.4, |
| "valid_targets_min": 1380 |
| }, |
| { |
| "epoch": 3.642857142857143, |
| "grad_norm": 0.6766396276223146, |
| "learning_rate": 2.2077973703981423e-05, |
| "loss": 0.2417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10541743785142899, |
| "step": 2295, |
| "valid_targets_mean": 3278.2, |
| "valid_targets_min": 1427 |
| }, |
| { |
| "epoch": 3.6507936507936507, |
| "grad_norm": 0.728273106075939, |
| "learning_rate": 2.1999232768132552e-05, |
| "loss": 0.2585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13243606686592102, |
| "step": 2300, |
| "valid_targets_mean": 3081.8, |
| "valid_targets_min": 1017 |
| }, |
| { |
| "epoch": 3.6587301587301586, |
| "grad_norm": 0.6367194277051416, |
| "learning_rate": 2.1920460518153637e-05, |
| "loss": 0.2666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14943772554397583, |
| "step": 2305, |
| "valid_targets_mean": 3977.2, |
| "valid_targets_min": 1438 |
| }, |
| { |
| "epoch": 3.6666666666666665, |
| "grad_norm": 0.6636887290598896, |
| "learning_rate": 2.1841658187860232e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14413931965827942, |
| "step": 2310, |
| "valid_targets_mean": 3984.5, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 3.674603174603175, |
| "grad_norm": 0.6924824608448896, |
| "learning_rate": 2.176282701153904e-05, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10788863897323608, |
| "step": 2315, |
| "valid_targets_mean": 3827.2, |
| "valid_targets_min": 1204 |
| }, |
| { |
| "epoch": 3.682539682539683, |
| "grad_norm": 0.7500867165407975, |
| "learning_rate": 2.1683968223928572e-05, |
| "loss": 0.2665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11223761737346649, |
| "step": 2320, |
| "valid_targets_mean": 2388.6, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 3.6904761904761907, |
| "grad_norm": 0.6150664924768718, |
| "learning_rate": 2.1605083060199835e-05, |
| "loss": 0.2489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13505640625953674, |
| "step": 2325, |
| "valid_targets_mean": 3697.6, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 3.6984126984126986, |
| "grad_norm": 0.7555466609315117, |
| "learning_rate": 2.152617275593694e-05, |
| "loss": 0.2676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1521606296300888, |
| "step": 2330, |
| "valid_targets_mean": 3023.5, |
| "valid_targets_min": 1520 |
| }, |
| { |
| "epoch": 3.7063492063492065, |
| "grad_norm": 0.7029257644513573, |
| "learning_rate": 2.144723854711781e-05, |
| "loss": 0.2497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16023379564285278, |
| "step": 2335, |
| "valid_targets_mean": 3591.4, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 3.7142857142857144, |
| "grad_norm": 0.6918176391496552, |
| "learning_rate": 2.1368281670094766e-05, |
| "loss": 0.2624, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13360567390918732, |
| "step": 2340, |
| "valid_targets_mean": 3050.0, |
| "valid_targets_min": 1247 |
| }, |
| { |
| "epoch": 3.7222222222222223, |
| "grad_norm": 0.6428044957155385, |
| "learning_rate": 2.1289303361575175e-05, |
| "loss": 0.2627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11518841981887817, |
| "step": 2345, |
| "valid_targets_mean": 3680.9, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 3.7301587301587302, |
| "grad_norm": 0.6973754385222307, |
| "learning_rate": 2.121030485860211e-05, |
| "loss": 0.2625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1621910184621811, |
| "step": 2350, |
| "valid_targets_mean": 3594.0, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 3.738095238095238, |
| "grad_norm": 0.7349289761819597, |
| "learning_rate": 2.113128739853493e-05, |
| "loss": 0.2507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13967764377593994, |
| "step": 2355, |
| "valid_targets_mean": 3569.4, |
| "valid_targets_min": 1369 |
| }, |
| { |
| "epoch": 3.746031746031746, |
| "grad_norm": 0.7522020159710882, |
| "learning_rate": 2.1052252219029944e-05, |
| "loss": 0.2382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12228189408779144, |
| "step": 2360, |
| "valid_targets_mean": 2334.9, |
| "valid_targets_min": 1448 |
| }, |
| { |
| "epoch": 3.753968253968254, |
| "grad_norm": 0.5729484428634234, |
| "learning_rate": 2.0973200558020967e-05, |
| "loss": 0.2483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09384536743164062, |
| "step": 2365, |
| "valid_targets_mean": 3340.4, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 3.761904761904762, |
| "grad_norm": 0.6492714046787679, |
| "learning_rate": 2.0894133653700005e-05, |
| "loss": 0.2555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12654618918895721, |
| "step": 2370, |
| "valid_targets_mean": 3602.9, |
| "valid_targets_min": 1014 |
| }, |
| { |
| "epoch": 3.7698412698412698, |
| "grad_norm": 0.697904697849088, |
| "learning_rate": 2.0815052744497795e-05, |
| "loss": 0.2592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14032703638076782, |
| "step": 2375, |
| "valid_targets_mean": 3229.0, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 3.7777777777777777, |
| "grad_norm": 0.7308391868980172, |
| "learning_rate": 2.0735959069064434e-05, |
| "loss": 0.252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12916788458824158, |
| "step": 2380, |
| "valid_targets_mean": 2837.2, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 3.7857142857142856, |
| "grad_norm": 0.691499175418863, |
| "learning_rate": 2.065685386624999e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1294250339269638, |
| "step": 2385, |
| "valid_targets_mean": 3112.2, |
| "valid_targets_min": 1521 |
| }, |
| { |
| "epoch": 3.7936507936507935, |
| "grad_norm": 0.5969033546170376, |
| "learning_rate": 2.0577738375085076e-05, |
| "loss": 0.2543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09190475195646286, |
| "step": 2390, |
| "valid_targets_mean": 2841.9, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 3.8015873015873014, |
| "grad_norm": 0.7220359693489179, |
| "learning_rate": 2.0498613834761462e-05, |
| "loss": 0.2582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16056948900222778, |
| "step": 2395, |
| "valid_targets_mean": 3376.4, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 3.8095238095238093, |
| "grad_norm": 1.2099115424108589, |
| "learning_rate": 2.041948148461264e-05, |
| "loss": 0.2578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13240090012550354, |
| "step": 2400, |
| "valid_targets_mean": 3901.5, |
| "valid_targets_min": 1065 |
| }, |
| { |
| "epoch": 3.817460317460317, |
| "grad_norm": 0.7893114301162967, |
| "learning_rate": 2.0340342564094436e-05, |
| "loss": 0.2661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1543714702129364, |
| "step": 2405, |
| "valid_targets_mean": 2780.1, |
| "valid_targets_min": 1198 |
| }, |
| { |
| "epoch": 3.825396825396825, |
| "grad_norm": 0.6632506580999861, |
| "learning_rate": 2.0261198312765597e-05, |
| "loss": 0.2585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12213265150785446, |
| "step": 2410, |
| "valid_targets_mean": 3707.4, |
| "valid_targets_min": 1452 |
| }, |
| { |
| "epoch": 3.8333333333333335, |
| "grad_norm": 0.5666934298053149, |
| "learning_rate": 2.0182049970268355e-05, |
| "loss": 0.2366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11713714152574539, |
| "step": 2415, |
| "valid_targets_mean": 4613.4, |
| "valid_targets_min": 1868 |
| }, |
| { |
| "epoch": 3.8412698412698414, |
| "grad_norm": 0.7113706519827881, |
| "learning_rate": 2.010289877630902e-05, |
| "loss": 0.2485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12731067836284637, |
| "step": 2420, |
| "valid_targets_mean": 4011.0, |
| "valid_targets_min": 1569 |
| }, |
| { |
| "epoch": 3.8492063492063493, |
| "grad_norm": 0.5910058190767906, |
| "learning_rate": 2.002374597063858e-05, |
| "loss": 0.2641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0885014608502388, |
| "step": 2425, |
| "valid_targets_mean": 3732.4, |
| "valid_targets_min": 1372 |
| }, |
| { |
| "epoch": 3.857142857142857, |
| "grad_norm": 0.613181664922125, |
| "learning_rate": 1.9944592793033255e-05, |
| "loss": 0.2436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1397075355052948, |
| "step": 2430, |
| "valid_targets_mean": 3596.5, |
| "valid_targets_min": 1614 |
| }, |
| { |
| "epoch": 3.865079365079365, |
| "grad_norm": 0.7433760742723559, |
| "learning_rate": 1.9865440483275086e-05, |
| "loss": 0.2515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11835931986570358, |
| "step": 2435, |
| "valid_targets_mean": 3025.0, |
| "valid_targets_min": 1014 |
| }, |
| { |
| "epoch": 3.873015873015873, |
| "grad_norm": 0.6605685240194553, |
| "learning_rate": 1.978629028113254e-05, |
| "loss": 0.2338, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10053889453411102, |
| "step": 2440, |
| "valid_targets_mean": 2641.2, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 3.880952380952381, |
| "grad_norm": 0.7119660876197761, |
| "learning_rate": 1.9707143426341058e-05, |
| "loss": 0.2419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13378119468688965, |
| "step": 2445, |
| "valid_targets_mean": 3406.1, |
| "valid_targets_min": 1708 |
| }, |
| { |
| "epoch": 3.888888888888889, |
| "grad_norm": 0.671693312370587, |
| "learning_rate": 1.962800115858364e-05, |
| "loss": 0.2636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17709845304489136, |
| "step": 2450, |
| "valid_targets_mean": 4737.1, |
| "valid_targets_min": 1773 |
| }, |
| { |
| "epoch": 3.8968253968253967, |
| "grad_norm": 0.5187002193324203, |
| "learning_rate": 1.9548864717471472e-05, |
| "loss": 0.2555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.114749014377594, |
| "step": 2455, |
| "valid_targets_mean": 5417.0, |
| "valid_targets_min": 2435 |
| }, |
| { |
| "epoch": 3.9047619047619047, |
| "grad_norm": 0.5690598952425717, |
| "learning_rate": 1.9469735342524454e-05, |
| "loss": 0.253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1283632516860962, |
| "step": 2460, |
| "valid_targets_mean": 4894.6, |
| "valid_targets_min": 1517 |
| }, |
| { |
| "epoch": 3.9126984126984126, |
| "grad_norm": 0.8811218156014363, |
| "learning_rate": 1.939061427315179e-05, |
| "loss": 0.2607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14203287661075592, |
| "step": 2465, |
| "valid_targets_mean": 1957.8, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 3.9206349206349205, |
| "grad_norm": 0.7300566426187972, |
| "learning_rate": 1.931150274863265e-05, |
| "loss": 0.238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15685239434242249, |
| "step": 2470, |
| "valid_targets_mean": 3397.5, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 3.928571428571429, |
| "grad_norm": 0.6643843278715006, |
| "learning_rate": 1.9232402008096643e-05, |
| "loss": 0.267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1505836546421051, |
| "step": 2475, |
| "valid_targets_mean": 3670.0, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 3.9365079365079367, |
| "grad_norm": 0.7251725567833401, |
| "learning_rate": 1.9153313290504495e-05, |
| "loss": 0.2622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14810281991958618, |
| "step": 2480, |
| "valid_targets_mean": 3935.0, |
| "valid_targets_min": 1705 |
| }, |
| { |
| "epoch": 3.9444444444444446, |
| "grad_norm": 0.6456264170608652, |
| "learning_rate": 1.9074237834628623e-05, |
| "loss": 0.2561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12540534138679504, |
| "step": 2485, |
| "valid_targets_mean": 3541.1, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 3.9523809523809526, |
| "grad_norm": 0.8356018356170182, |
| "learning_rate": 1.8995176879033698e-05, |
| "loss": 0.2592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1368331015110016, |
| "step": 2490, |
| "valid_targets_mean": 2445.4, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 3.9603174603174605, |
| "grad_norm": 0.6288308457322553, |
| "learning_rate": 1.89161316620573e-05, |
| "loss": 0.2369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14380553364753723, |
| "step": 2495, |
| "valid_targets_mean": 4345.1, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 3.9682539682539684, |
| "grad_norm": 0.6579847446205861, |
| "learning_rate": 1.8837103421790486e-05, |
| "loss": 0.2431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07781261205673218, |
| "step": 2500, |
| "valid_targets_mean": 2298.8, |
| "valid_targets_min": 586 |
| }, |
| { |
| "epoch": 3.9761904761904763, |
| "grad_norm": 0.7093298174783987, |
| "learning_rate": 1.8758093396058386e-05, |
| "loss": 0.2521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1043231263756752, |
| "step": 2505, |
| "valid_targets_mean": 2240.4, |
| "valid_targets_min": 1245 |
| }, |
| { |
| "epoch": 3.984126984126984, |
| "grad_norm": 0.7566876521088187, |
| "learning_rate": 1.8679102822400874e-05, |
| "loss": 0.2514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10809953510761261, |
| "step": 2510, |
| "valid_targets_mean": 2235.2, |
| "valid_targets_min": 373 |
| }, |
| { |
| "epoch": 3.992063492063492, |
| "grad_norm": 0.6429354432180481, |
| "learning_rate": 1.8600132938053098e-05, |
| "loss": 0.254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1338648647069931, |
| "step": 2515, |
| "valid_targets_mean": 4055.4, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 4.0, |
| "grad_norm": 0.7125286840342117, |
| "learning_rate": 1.8521184979926177e-05, |
| "loss": 0.2634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10315399616956711, |
| "step": 2520, |
| "valid_targets_mean": 2988.1, |
| "valid_targets_min": 1423 |
| }, |
| { |
| "epoch": 4.007936507936508, |
| "grad_norm": 0.5876567034131157, |
| "learning_rate": 1.8442260184587804e-05, |
| "loss": 0.2273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1037619337439537, |
| "step": 2525, |
| "valid_targets_mean": 3516.1, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 4.015873015873016, |
| "grad_norm": 0.6765268923330178, |
| "learning_rate": 1.8363359788242842e-05, |
| "loss": 0.2322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09999796748161316, |
| "step": 2530, |
| "valid_targets_mean": 3009.6, |
| "valid_targets_min": 1258 |
| }, |
| { |
| "epoch": 4.023809523809524, |
| "grad_norm": 0.843564874643514, |
| "learning_rate": 1.8284485026714013e-05, |
| "loss": 0.2576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1326655000448227, |
| "step": 2535, |
| "valid_targets_mean": 2664.0, |
| "valid_targets_min": 1373 |
| }, |
| { |
| "epoch": 4.031746031746032, |
| "grad_norm": 0.7819775900849527, |
| "learning_rate": 1.8205637135422525e-05, |
| "loss": 0.2322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12343311309814453, |
| "step": 2540, |
| "valid_targets_mean": 2378.2, |
| "valid_targets_min": 1514 |
| }, |
| { |
| "epoch": 4.0396825396825395, |
| "grad_norm": 0.6399638759318811, |
| "learning_rate": 1.8126817349368697e-05, |
| "loss": 0.2244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12565383315086365, |
| "step": 2545, |
| "valid_targets_mean": 4908.5, |
| "valid_targets_min": 1814 |
| }, |
| { |
| "epoch": 4.0476190476190474, |
| "grad_norm": 0.7019507639956757, |
| "learning_rate": 1.8048026903112632e-05, |
| "loss": 0.2346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13092780113220215, |
| "step": 2550, |
| "valid_targets_mean": 3983.9, |
| "valid_targets_min": 1711 |
| }, |
| { |
| "epoch": 4.055555555555555, |
| "grad_norm": 0.6288446075374055, |
| "learning_rate": 1.7969267030754903e-05, |
| "loss": 0.2372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11063070595264435, |
| "step": 2555, |
| "valid_targets_mean": 3873.1, |
| "valid_targets_min": 1824 |
| }, |
| { |
| "epoch": 4.063492063492063, |
| "grad_norm": 0.6811814187899629, |
| "learning_rate": 1.7890538965917184e-05, |
| "loss": 0.2329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11278326064348221, |
| "step": 2560, |
| "valid_targets_mean": 3182.5, |
| "valid_targets_min": 866 |
| }, |
| { |
| "epoch": 4.071428571428571, |
| "grad_norm": 0.7348752847522607, |
| "learning_rate": 1.7811843941722952e-05, |
| "loss": 0.2189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14403583109378815, |
| "step": 2565, |
| "valid_targets_mean": 3754.9, |
| "valid_targets_min": 1404 |
| }, |
| { |
| "epoch": 4.079365079365079, |
| "grad_norm": 0.6911463348956305, |
| "learning_rate": 1.7733183190778174e-05, |
| "loss": 0.2326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17022690176963806, |
| "step": 2570, |
| "valid_targets_mean": 4647.0, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 4.087301587301587, |
| "grad_norm": 0.7780248768456252, |
| "learning_rate": 1.7654557945151968e-05, |
| "loss": 0.2092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0747632160782814, |
| "step": 2575, |
| "valid_targets_mean": 2295.0, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 4.095238095238095, |
| "grad_norm": 0.6940182721758144, |
| "learning_rate": 1.7575969436357352e-05, |
| "loss": 0.237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1094612330198288, |
| "step": 2580, |
| "valid_targets_mean": 3678.9, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 4.103174603174603, |
| "grad_norm": 0.5643874374030184, |
| "learning_rate": 1.7497418895331934e-05, |
| "loss": 0.214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10210039466619492, |
| "step": 2585, |
| "valid_targets_mean": 4622.6, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 4.111111111111111, |
| "grad_norm": 0.7297769226717193, |
| "learning_rate": 1.7418907552418597e-05, |
| "loss": 0.2414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1272350400686264, |
| "step": 2590, |
| "valid_targets_mean": 3948.5, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 4.119047619047619, |
| "grad_norm": 0.8006581395181448, |
| "learning_rate": 1.7340436637346315e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12104944884777069, |
| "step": 2595, |
| "valid_targets_mean": 2991.2, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 4.1269841269841265, |
| "grad_norm": 0.6613137801764501, |
| "learning_rate": 1.726200737921079e-05, |
| "loss": 0.2238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06504228711128235, |
| "step": 2600, |
| "valid_targets_mean": 2492.5, |
| "valid_targets_min": 1140 |
| }, |
| { |
| "epoch": 4.134920634920635, |
| "grad_norm": 0.7387136949916735, |
| "learning_rate": 1.718362100645527e-05, |
| "loss": 0.2349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12065084278583527, |
| "step": 2605, |
| "valid_targets_mean": 2898.9, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 4.142857142857143, |
| "grad_norm": 0.7090937396787783, |
| "learning_rate": 1.710527874685129e-05, |
| "loss": 0.2234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11025974899530411, |
| "step": 2610, |
| "valid_targets_mean": 2430.9, |
| "valid_targets_min": 1056 |
| }, |
| { |
| "epoch": 4.150793650793651, |
| "grad_norm": 0.722190758689241, |
| "learning_rate": 1.702698182747942e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10215307772159576, |
| "step": 2615, |
| "valid_targets_mean": 2964.1, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 4.158730158730159, |
| "grad_norm": 0.7144776057022394, |
| "learning_rate": 1.6948731474710075e-05, |
| "loss": 0.2393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12342202663421631, |
| "step": 2620, |
| "valid_targets_mean": 3819.5, |
| "valid_targets_min": 1317 |
| }, |
| { |
| "epoch": 4.166666666666667, |
| "grad_norm": 0.7492914431944917, |
| "learning_rate": 1.68705289141843e-05, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13639488816261292, |
| "step": 2625, |
| "valid_targets_mean": 3750.9, |
| "valid_targets_min": 1330 |
| }, |
| { |
| "epoch": 4.174603174603175, |
| "grad_norm": 0.7401208722013239, |
| "learning_rate": 1.679237537079454e-05, |
| "loss": 0.233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1440812647342682, |
| "step": 2630, |
| "valid_targets_mean": 3458.8, |
| "valid_targets_min": 1229 |
| }, |
| { |
| "epoch": 4.182539682539683, |
| "grad_norm": 0.6025773710893592, |
| "learning_rate": 1.6714272068665526e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08263147622346878, |
| "step": 2635, |
| "valid_targets_mean": 3376.2, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 4.190476190476191, |
| "grad_norm": 0.596963688362553, |
| "learning_rate": 1.663622023113501e-05, |
| "loss": 0.2259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09171557426452637, |
| "step": 2640, |
| "valid_targets_mean": 4571.8, |
| "valid_targets_min": 2009 |
| }, |
| { |
| "epoch": 4.198412698412699, |
| "grad_norm": 0.7542922003219502, |
| "learning_rate": 1.655822108073467e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12120301276445389, |
| "step": 2645, |
| "valid_targets_mean": 3426.8, |
| "valid_targets_min": 1327 |
| }, |
| { |
| "epoch": 4.2063492063492065, |
| "grad_norm": 0.794127406475235, |
| "learning_rate": 1.648027583917095e-05, |
| "loss": 0.2352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13536590337753296, |
| "step": 2650, |
| "valid_targets_mean": 3598.9, |
| "valid_targets_min": 1506 |
| }, |
| { |
| "epoch": 4.214285714285714, |
| "grad_norm": 0.7449195658686859, |
| "learning_rate": 1.640238572730591e-05, |
| "loss": 0.2179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10461185872554779, |
| "step": 2655, |
| "valid_targets_mean": 3327.4, |
| "valid_targets_min": 1331 |
| }, |
| { |
| "epoch": 4.222222222222222, |
| "grad_norm": 0.6732836280628659, |
| "learning_rate": 1.632455196513809e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12440332025289536, |
| "step": 2660, |
| "valid_targets_mean": 3556.0, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 4.23015873015873, |
| "grad_norm": 0.7638215074334139, |
| "learning_rate": 1.624677577178345e-05, |
| "loss": 0.2368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15293553471565247, |
| "step": 2665, |
| "valid_targets_mean": 3222.5, |
| "valid_targets_min": 1203 |
| }, |
| { |
| "epoch": 4.238095238095238, |
| "grad_norm": 0.6453140298046666, |
| "learning_rate": 1.616905836545624e-05, |
| "loss": 0.2309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11287044733762741, |
| "step": 2670, |
| "valid_targets_mean": 4032.5, |
| "valid_targets_min": 1499 |
| }, |
| { |
| "epoch": 4.246031746031746, |
| "grad_norm": 0.9229381005829962, |
| "learning_rate": 1.6091400963449894e-05, |
| "loss": 0.2405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18993867933750153, |
| "step": 2675, |
| "valid_targets_mean": 3324.4, |
| "valid_targets_min": 332 |
| }, |
| { |
| "epoch": 4.253968253968254, |
| "grad_norm": 0.7863010352864319, |
| "learning_rate": 1.6013804782118043e-05, |
| "loss": 0.2313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1106230691075325, |
| "step": 2680, |
| "valid_targets_mean": 2505.0, |
| "valid_targets_min": 318 |
| }, |
| { |
| "epoch": 4.261904761904762, |
| "grad_norm": 0.7694376524205275, |
| "learning_rate": 1.5936271036855372e-05, |
| "loss": 0.2151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08633385598659515, |
| "step": 2685, |
| "valid_targets_mean": 2414.8, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 4.26984126984127, |
| "grad_norm": 0.6357694871639326, |
| "learning_rate": 1.585880094207864e-05, |
| "loss": 0.2329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12916597723960876, |
| "step": 2690, |
| "valid_targets_mean": 4749.9, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 4.277777777777778, |
| "grad_norm": 0.838277956659092, |
| "learning_rate": 1.5781395711207664e-05, |
| "loss": 0.2297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11889150738716125, |
| "step": 2695, |
| "valid_targets_mean": 2379.8, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 4.285714285714286, |
| "grad_norm": 0.6591004793230493, |
| "learning_rate": 1.5704056556646255e-05, |
| "loss": 0.223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10079076886177063, |
| "step": 2700, |
| "valid_targets_mean": 3413.8, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 4.2936507936507935, |
| "grad_norm": 0.6543704431835511, |
| "learning_rate": 1.562678468976329e-05, |
| "loss": 0.26, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10609576106071472, |
| "step": 2705, |
| "valid_targets_mean": 3200.8, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 4.301587301587301, |
| "grad_norm": 0.7687796568069265, |
| "learning_rate": 1.5549581320873715e-05, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10676814615726471, |
| "step": 2710, |
| "valid_targets_mean": 3095.1, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 4.309523809523809, |
| "grad_norm": 0.6932002931278404, |
| "learning_rate": 1.5472447659219573e-05, |
| "loss": 0.2417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13282454013824463, |
| "step": 2715, |
| "valid_targets_mean": 3701.2, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 4.317460317460317, |
| "grad_norm": 0.5902369291201127, |
| "learning_rate": 1.5395384912951096e-05, |
| "loss": 0.2368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12770837545394897, |
| "step": 2720, |
| "valid_targets_mean": 5372.8, |
| "valid_targets_min": 1753 |
| }, |
| { |
| "epoch": 4.325396825396825, |
| "grad_norm": 0.6748449023035938, |
| "learning_rate": 1.531839428910774e-05, |
| "loss": 0.246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.120603047311306, |
| "step": 2725, |
| "valid_targets_mean": 3591.1, |
| "valid_targets_min": 2100 |
| }, |
| { |
| "epoch": 4.333333333333333, |
| "grad_norm": 0.5987121324615388, |
| "learning_rate": 1.5241476993599318e-05, |
| "loss": 0.2236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11681363731622696, |
| "step": 2730, |
| "valid_targets_mean": 5095.5, |
| "valid_targets_min": 1581 |
| }, |
| { |
| "epoch": 4.341269841269841, |
| "grad_norm": 0.7159427225817645, |
| "learning_rate": 1.5164634231187106e-05, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14144907891750336, |
| "step": 2735, |
| "valid_targets_mean": 3225.6, |
| "valid_targets_min": 1473 |
| }, |
| { |
| "epoch": 4.349206349206349, |
| "grad_norm": 0.6611954382275911, |
| "learning_rate": 1.5087867205464933e-05, |
| "loss": 0.2238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09750405699014664, |
| "step": 2740, |
| "valid_targets_mean": 3417.1, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 4.357142857142857, |
| "grad_norm": 0.7263798618780849, |
| "learning_rate": 1.5011177118840376e-05, |
| "loss": 0.228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12625962495803833, |
| "step": 2745, |
| "valid_targets_mean": 3994.0, |
| "valid_targets_min": 1406 |
| }, |
| { |
| "epoch": 4.365079365079365, |
| "grad_norm": 0.7933122878926689, |
| "learning_rate": 1.4934565172515917e-05, |
| "loss": 0.2305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0890585258603096, |
| "step": 2750, |
| "valid_targets_mean": 2174.6, |
| "valid_targets_min": 1007 |
| }, |
| { |
| "epoch": 4.3730158730158735, |
| "grad_norm": 0.7213075598879185, |
| "learning_rate": 1.4858032566470107e-05, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17482303082942963, |
| "step": 2755, |
| "valid_targets_mean": 5093.8, |
| "valid_targets_min": 1293 |
| }, |
| { |
| "epoch": 4.380952380952381, |
| "grad_norm": 0.8248529406403541, |
| "learning_rate": 1.4781580499438794e-05, |
| "loss": 0.2316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08823531866073608, |
| "step": 2760, |
| "valid_targets_mean": 1934.1, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 4.388888888888889, |
| "grad_norm": 0.7466423261561578, |
| "learning_rate": 1.4705210168896327e-05, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11548350751399994, |
| "step": 2765, |
| "valid_targets_mean": 3395.5, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 4.396825396825397, |
| "grad_norm": 0.6912935398648323, |
| "learning_rate": 1.462892277103681e-05, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11666476726531982, |
| "step": 2770, |
| "valid_targets_mean": 3372.8, |
| "valid_targets_min": 1084 |
| }, |
| { |
| "epoch": 4.404761904761905, |
| "grad_norm": 0.6849370643438872, |
| "learning_rate": 1.455271950075539e-05, |
| "loss": 0.2111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09486103057861328, |
| "step": 2775, |
| "valid_targets_mean": 2735.1, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 4.412698412698413, |
| "grad_norm": 0.5989489711073828, |
| "learning_rate": 1.4476601551629493e-05, |
| "loss": 0.2485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11204937100410461, |
| "step": 2780, |
| "valid_targets_mean": 4433.1, |
| "valid_targets_min": 1363 |
| }, |
| { |
| "epoch": 4.420634920634921, |
| "grad_norm": 0.8531974727728336, |
| "learning_rate": 1.4400570115900147e-05, |
| "loss": 0.2231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1309199035167694, |
| "step": 2785, |
| "valid_targets_mean": 3022.9, |
| "valid_targets_min": 1582 |
| }, |
| { |
| "epoch": 4.428571428571429, |
| "grad_norm": 0.7725264862980028, |
| "learning_rate": 1.4324626384453345e-05, |
| "loss": 0.238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12786544859409332, |
| "step": 2790, |
| "valid_targets_mean": 3201.5, |
| "valid_targets_min": 1886 |
| }, |
| { |
| "epoch": 4.436507936507937, |
| "grad_norm": 1.2348782492609787, |
| "learning_rate": 1.4248771546801339e-05, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10978405177593231, |
| "step": 2795, |
| "valid_targets_mean": 2609.4, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 4.444444444444445, |
| "grad_norm": 0.5857767158165396, |
| "learning_rate": 1.4173006791064023e-05, |
| "loss": 0.229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11274480074644089, |
| "step": 2800, |
| "valid_targets_mean": 4386.8, |
| "valid_targets_min": 1685 |
| }, |
| { |
| "epoch": 4.4523809523809526, |
| "grad_norm": 0.7243806950657568, |
| "learning_rate": 1.4097333303950368e-05, |
| "loss": 0.231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13323573768138885, |
| "step": 2805, |
| "valid_targets_mean": 3164.4, |
| "valid_targets_min": 1546 |
| }, |
| { |
| "epoch": 4.4603174603174605, |
| "grad_norm": 0.8365899391330908, |
| "learning_rate": 1.4021752270739759e-05, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17075440287590027, |
| "step": 2810, |
| "valid_targets_mean": 3530.6, |
| "valid_targets_min": 1523 |
| }, |
| { |
| "epoch": 4.468253968253968, |
| "grad_norm": 0.6426801032723285, |
| "learning_rate": 1.3946264875263485e-05, |
| "loss": 0.237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10363493859767914, |
| "step": 2815, |
| "valid_targets_mean": 3605.0, |
| "valid_targets_min": 1712 |
| }, |
| { |
| "epoch": 4.476190476190476, |
| "grad_norm": 0.6890993167954129, |
| "learning_rate": 1.3870872299886184e-05, |
| "loss": 0.2361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07421109080314636, |
| "step": 2820, |
| "valid_targets_mean": 2241.6, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 4.484126984126984, |
| "grad_norm": 0.6729360045725103, |
| "learning_rate": 1.3795575725487303e-05, |
| "loss": 0.2218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09559076279401779, |
| "step": 2825, |
| "valid_targets_mean": 3219.1, |
| "valid_targets_min": 1489 |
| }, |
| { |
| "epoch": 4.492063492063492, |
| "grad_norm": 0.9472374491757762, |
| "learning_rate": 1.3720376331442652e-05, |
| "loss": 0.236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12624111771583557, |
| "step": 2830, |
| "valid_targets_mean": 1985.1, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 4.5, |
| "grad_norm": 0.6423699741233883, |
| "learning_rate": 1.364527529560586e-05, |
| "loss": 0.2317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09665095806121826, |
| "step": 2835, |
| "valid_targets_mean": 3381.6, |
| "valid_targets_min": 1302 |
| }, |
| { |
| "epoch": 4.507936507936508, |
| "grad_norm": 0.8434624170792736, |
| "learning_rate": 1.3570273794289978e-05, |
| "loss": 0.2185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11487355828285217, |
| "step": 2840, |
| "valid_targets_mean": 2106.1, |
| "valid_targets_min": 1085 |
| }, |
| { |
| "epoch": 4.515873015873016, |
| "grad_norm": 0.8176335490386788, |
| "learning_rate": 1.3495373002249061e-05, |
| "loss": 0.2351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11494874209165573, |
| "step": 2845, |
| "valid_targets_mean": 2774.2, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 4.523809523809524, |
| "grad_norm": 0.7509641841477122, |
| "learning_rate": 1.3420574092659713e-05, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0945759192109108, |
| "step": 2850, |
| "valid_targets_mean": 2959.2, |
| "valid_targets_min": 1038 |
| }, |
| { |
| "epoch": 4.531746031746032, |
| "grad_norm": 0.7303411502442227, |
| "learning_rate": 1.3345878237102766e-05, |
| "loss": 0.2286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12984412908554077, |
| "step": 2855, |
| "valid_targets_mean": 3543.2, |
| "valid_targets_min": 1360 |
| }, |
| { |
| "epoch": 4.5396825396825395, |
| "grad_norm": 0.7135801927779284, |
| "learning_rate": 1.3271286605544906e-05, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1369558870792389, |
| "step": 2860, |
| "valid_targets_mean": 4178.8, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 4.5476190476190474, |
| "grad_norm": 0.8002438173525717, |
| "learning_rate": 1.3196800366320357e-05, |
| "loss": 0.222, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13606247305870056, |
| "step": 2865, |
| "valid_targets_mean": 3268.6, |
| "valid_targets_min": 961 |
| }, |
| { |
| "epoch": 4.555555555555555, |
| "grad_norm": 0.7255775013934033, |
| "learning_rate": 1.3122420686112554e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09334878623485565, |
| "step": 2870, |
| "valid_targets_mean": 2750.4, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 4.563492063492063, |
| "grad_norm": 0.7155396542120448, |
| "learning_rate": 1.3048148729935917e-05, |
| "loss": 0.2382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12097464501857758, |
| "step": 2875, |
| "valid_targets_mean": 3632.4, |
| "valid_targets_min": 1730 |
| }, |
| { |
| "epoch": 4.571428571428571, |
| "grad_norm": 1.8092713084981278, |
| "learning_rate": 1.297398566111756e-05, |
| "loss": 0.2381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11287643015384674, |
| "step": 2880, |
| "valid_targets_mean": 3300.0, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 4.579365079365079, |
| "grad_norm": 0.7654711485267467, |
| "learning_rate": 1.2899932641279082e-05, |
| "loss": 0.2272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11186093091964722, |
| "step": 2885, |
| "valid_targets_mean": 2760.4, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 4.587301587301587, |
| "grad_norm": 0.774643668364101, |
| "learning_rate": 1.2825990830318395e-05, |
| "loss": 0.2352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09278203547000885, |
| "step": 2890, |
| "valid_targets_mean": 2548.6, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 4.595238095238095, |
| "grad_norm": 0.8001318452509485, |
| "learning_rate": 1.2752161386391526e-05, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10767956078052521, |
| "step": 2895, |
| "valid_targets_mean": 2060.4, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 4.603174603174603, |
| "grad_norm": 0.5712255444569291, |
| "learning_rate": 1.2678445465894491e-05, |
| "loss": 0.2234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10319489985704422, |
| "step": 2900, |
| "valid_targets_mean": 4445.1, |
| "valid_targets_min": 2055 |
| }, |
| { |
| "epoch": 4.611111111111111, |
| "grad_norm": 0.6135689736493125, |
| "learning_rate": 1.2604844223445181e-05, |
| "loss": 0.2238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07687068730592728, |
| "step": 2905, |
| "valid_targets_mean": 2514.1, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 4.619047619047619, |
| "grad_norm": 0.6579258264976859, |
| "learning_rate": 1.2531358811865268e-05, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11658872663974762, |
| "step": 2910, |
| "valid_targets_mean": 3789.9, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 4.6269841269841265, |
| "grad_norm": 0.6444665058651138, |
| "learning_rate": 1.2457990382162173e-05, |
| "loss": 0.237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12281468510627747, |
| "step": 2915, |
| "valid_targets_mean": 4370.9, |
| "valid_targets_min": 1616 |
| }, |
| { |
| "epoch": 4.634920634920634, |
| "grad_norm": 0.6876035515078412, |
| "learning_rate": 1.238474008351101e-05, |
| "loss": 0.2213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09872429817914963, |
| "step": 2920, |
| "valid_targets_mean": 3054.0, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 4.642857142857143, |
| "grad_norm": 0.6931951314781377, |
| "learning_rate": 1.2311609063236594e-05, |
| "loss": 0.2327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10577560216188431, |
| "step": 2925, |
| "valid_targets_mean": 3132.2, |
| "valid_targets_min": 838 |
| }, |
| { |
| "epoch": 4.650793650793651, |
| "grad_norm": 0.6819762221919383, |
| "learning_rate": 1.2238598466795493e-05, |
| "loss": 0.2143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11494247615337372, |
| "step": 2930, |
| "valid_targets_mean": 3767.6, |
| "valid_targets_min": 1581 |
| }, |
| { |
| "epoch": 4.658730158730159, |
| "grad_norm": 0.5497909587102477, |
| "learning_rate": 1.2165709437758042e-05, |
| "loss": 0.2211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1371319591999054, |
| "step": 2935, |
| "valid_targets_mean": 4767.9, |
| "valid_targets_min": 2053 |
| }, |
| { |
| "epoch": 4.666666666666667, |
| "grad_norm": 0.7497286458898537, |
| "learning_rate": 1.209294311779047e-05, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10149647295475006, |
| "step": 2940, |
| "valid_targets_mean": 2748.5, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 4.674603174603175, |
| "grad_norm": 0.794199842888716, |
| "learning_rate": 1.2020300646637018e-05, |
| "loss": 0.2279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12010520696640015, |
| "step": 2945, |
| "valid_targets_mean": 2594.0, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 4.682539682539683, |
| "grad_norm": 0.6156502044065189, |
| "learning_rate": 1.1947783162102043e-05, |
| "loss": 0.2344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0953923910856247, |
| "step": 2950, |
| "valid_targets_mean": 3468.9, |
| "valid_targets_min": 1599 |
| }, |
| { |
| "epoch": 4.690476190476191, |
| "grad_norm": 0.7560140620960419, |
| "learning_rate": 1.1875391800032248e-05, |
| "loss": 0.2295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14818307757377625, |
| "step": 2955, |
| "valid_targets_mean": 3391.6, |
| "valid_targets_min": 1426 |
| }, |
| { |
| "epoch": 4.698412698412699, |
| "grad_norm": 0.6675396719960957, |
| "learning_rate": 1.1803127694298873e-05, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10536058992147446, |
| "step": 2960, |
| "valid_targets_mean": 3879.0, |
| "valid_targets_min": 1464 |
| }, |
| { |
| "epoch": 4.7063492063492065, |
| "grad_norm": 0.7216255033546128, |
| "learning_rate": 1.173099197677992e-05, |
| "loss": 0.2166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09683910012245178, |
| "step": 2965, |
| "valid_targets_mean": 3976.0, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 4.714285714285714, |
| "grad_norm": 0.6299655661341759, |
| "learning_rate": 1.1658985777342458e-05, |
| "loss": 0.2254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10072541236877441, |
| "step": 2970, |
| "valid_targets_mean": 4138.9, |
| "valid_targets_min": 2165 |
| }, |
| { |
| "epoch": 4.722222222222222, |
| "grad_norm": 0.7267114286430387, |
| "learning_rate": 1.1587110223824874e-05, |
| "loss": 0.2371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11458795517683029, |
| "step": 2975, |
| "valid_targets_mean": 3501.6, |
| "valid_targets_min": 1048 |
| }, |
| { |
| "epoch": 4.73015873015873, |
| "grad_norm": 0.5711880649526813, |
| "learning_rate": 1.151536644201925e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10362765938043594, |
| "step": 2980, |
| "valid_targets_mean": 5068.5, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 4.738095238095238, |
| "grad_norm": 0.6837744972295653, |
| "learning_rate": 1.1443755555653751e-05, |
| "loss": 0.2115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11046740412712097, |
| "step": 2985, |
| "valid_targets_mean": 3774.5, |
| "valid_targets_min": 1516 |
| }, |
| { |
| "epoch": 4.746031746031746, |
| "grad_norm": 0.8268088262430978, |
| "learning_rate": 1.1372278686374935e-05, |
| "loss": 0.2306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11939245462417603, |
| "step": 2990, |
| "valid_targets_mean": 2241.9, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 4.753968253968254, |
| "grad_norm": 0.7080274610839087, |
| "learning_rate": 1.1300936953730273e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07471520453691483, |
| "step": 2995, |
| "valid_targets_mean": 2855.1, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 4.761904761904762, |
| "grad_norm": 0.6346454470756567, |
| "learning_rate": 1.1229731475150594e-05, |
| "loss": 0.2353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09645067900419235, |
| "step": 3000, |
| "valid_targets_mean": 3225.0, |
| "valid_targets_min": 1558 |
| }, |
| { |
| "epoch": 4.76984126984127, |
| "grad_norm": 0.8159716611544979, |
| "learning_rate": 1.1158663365932529e-05, |
| "loss": 0.2293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16088628768920898, |
| "step": 3005, |
| "valid_targets_mean": 3942.8, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 4.777777777777778, |
| "grad_norm": 0.7485963907590999, |
| "learning_rate": 1.1087733739221109e-05, |
| "loss": 0.2293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07297512143850327, |
| "step": 3010, |
| "valid_targets_mean": 2137.1, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 4.785714285714286, |
| "grad_norm": 0.6959060383565719, |
| "learning_rate": 1.1016943705992311e-05, |
| "loss": 0.2467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14023664593696594, |
| "step": 3015, |
| "valid_targets_mean": 4470.1, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 4.7936507936507935, |
| "grad_norm": 0.8209624595660114, |
| "learning_rate": 1.0946294375035639e-05, |
| "loss": 0.2205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10550207644701004, |
| "step": 3020, |
| "valid_targets_mean": 2292.6, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 4.801587301587301, |
| "grad_norm": 0.8467111860371475, |
| "learning_rate": 1.087578685293674e-05, |
| "loss": 0.229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1101028323173523, |
| "step": 3025, |
| "valid_targets_mean": 2002.0, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 4.809523809523809, |
| "grad_norm": 0.7031175355751162, |
| "learning_rate": 1.080542224406015e-05, |
| "loss": 0.2235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08865861594676971, |
| "step": 3030, |
| "valid_targets_mean": 2722.9, |
| "valid_targets_min": 1096 |
| }, |
| { |
| "epoch": 4.817460317460317, |
| "grad_norm": 0.6340433410827726, |
| "learning_rate": 1.0735201650531915e-05, |
| "loss": 0.2233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08490338921546936, |
| "step": 3035, |
| "valid_targets_mean": 3582.5, |
| "valid_targets_min": 1662 |
| }, |
| { |
| "epoch": 4.825396825396825, |
| "grad_norm": 0.8779889239691778, |
| "learning_rate": 1.066512617222235e-05, |
| "loss": 0.2382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1368151307106018, |
| "step": 3040, |
| "valid_targets_mean": 2917.8, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 4.833333333333333, |
| "grad_norm": 0.8148128948217418, |
| "learning_rate": 1.059519690672884e-05, |
| "loss": 0.2282, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1347075253725052, |
| "step": 3045, |
| "valid_targets_mean": 3162.8, |
| "valid_targets_min": 1554 |
| }, |
| { |
| "epoch": 4.841269841269841, |
| "grad_norm": 0.7163970373680205, |
| "learning_rate": 1.0525414949358614e-05, |
| "loss": 0.2257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12431874126195908, |
| "step": 3050, |
| "valid_targets_mean": 4172.5, |
| "valid_targets_min": 1986 |
| }, |
| { |
| "epoch": 4.849206349206349, |
| "grad_norm": 0.7360036176983142, |
| "learning_rate": 1.0455781393111613e-05, |
| "loss": 0.2361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15029457211494446, |
| "step": 3055, |
| "valid_targets_mean": 4648.4, |
| "valid_targets_min": 1219 |
| }, |
| { |
| "epoch": 4.857142857142857, |
| "grad_norm": 0.7198933951477575, |
| "learning_rate": 1.0386297328663353e-05, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11901850998401642, |
| "step": 3060, |
| "valid_targets_mean": 3197.0, |
| "valid_targets_min": 2097 |
| }, |
| { |
| "epoch": 4.865079365079366, |
| "grad_norm": 0.7591758487987466, |
| "learning_rate": 1.0316963844347843e-05, |
| "loss": 0.2238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16917167603969574, |
| "step": 3065, |
| "valid_targets_mean": 3458.1, |
| "valid_targets_min": 1407 |
| }, |
| { |
| "epoch": 4.8730158730158735, |
| "grad_norm": 0.6661543635742453, |
| "learning_rate": 1.0247782026140576e-05, |
| "loss": 0.2151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1022878885269165, |
| "step": 3070, |
| "valid_targets_mean": 2875.9, |
| "valid_targets_min": 1623 |
| }, |
| { |
| "epoch": 4.880952380952381, |
| "grad_norm": 0.8652472888174663, |
| "learning_rate": 1.017875295764144e-05, |
| "loss": 0.2256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1259920448064804, |
| "step": 3075, |
| "valid_targets_mean": 2689.5, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 4.888888888888889, |
| "grad_norm": 0.7850884128960549, |
| "learning_rate": 1.0109877720057818e-05, |
| "loss": 0.2437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09217704832553864, |
| "step": 3080, |
| "valid_targets_mean": 2314.9, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 4.896825396825397, |
| "grad_norm": 0.7008626159310546, |
| "learning_rate": 1.0041157392187651e-05, |
| "loss": 0.2351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09693759679794312, |
| "step": 3085, |
| "valid_targets_mean": 2638.2, |
| "valid_targets_min": 1401 |
| }, |
| { |
| "epoch": 4.904761904761905, |
| "grad_norm": 0.8580160012430362, |
| "learning_rate": 9.972593050402471e-06, |
| "loss": 0.2502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11387155950069427, |
| "step": 3090, |
| "valid_targets_mean": 1859.2, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 4.912698412698413, |
| "grad_norm": 0.6468446443099518, |
| "learning_rate": 9.904185768630612e-06, |
| "loss": 0.2286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15160252153873444, |
| "step": 3095, |
| "valid_targets_mean": 5390.9, |
| "valid_targets_min": 1587 |
| }, |
| { |
| "epoch": 4.920634920634921, |
| "grad_norm": 0.5684268979378351, |
| "learning_rate": 9.835936618340377e-06, |
| "loss": 0.2418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13138213753700256, |
| "step": 3100, |
| "valid_targets_mean": 4122.5, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 4.928571428571429, |
| "grad_norm": 0.7131733546217154, |
| "learning_rate": 9.76784666852323e-06, |
| "loss": 0.2301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06886936724185944, |
| "step": 3105, |
| "valid_targets_mean": 1896.1, |
| "valid_targets_min": 1242 |
| }, |
| { |
| "epoch": 4.936507936507937, |
| "grad_norm": 0.8263911818151064, |
| "learning_rate": 9.699916985677062e-06, |
| "loss": 0.2266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13891655206680298, |
| "step": 3110, |
| "valid_targets_mean": 3128.5, |
| "valid_targets_min": 1302 |
| }, |
| { |
| "epoch": 4.944444444444445, |
| "grad_norm": 0.678512236825066, |
| "learning_rate": 9.6321486337895e-06, |
| "loss": 0.2309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10146833956241608, |
| "step": 3115, |
| "valid_targets_mean": 3825.9, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 4.9523809523809526, |
| "grad_norm": 0.6938061243394774, |
| "learning_rate": 9.564542674321228e-06, |
| "loss": 0.2205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11534064263105392, |
| "step": 3120, |
| "valid_targets_mean": 3539.6, |
| "valid_targets_min": 1226 |
| }, |
| { |
| "epoch": 4.9603174603174605, |
| "grad_norm": 0.6496250853188159, |
| "learning_rate": 9.49710016618937e-06, |
| "loss": 0.2312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13002172112464905, |
| "step": 3125, |
| "valid_targets_mean": 3752.9, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 4.968253968253968, |
| "grad_norm": 0.731846216839573, |
| "learning_rate": 9.429822165750893e-06, |
| "loss": 0.2271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1303645372390747, |
| "step": 3130, |
| "valid_targets_mean": 3501.1, |
| "valid_targets_min": 1453 |
| }, |
| { |
| "epoch": 4.976190476190476, |
| "grad_norm": 0.7302474135173942, |
| "learning_rate": 9.36270972678607e-06, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12065795063972473, |
| "step": 3135, |
| "valid_targets_mean": 3030.6, |
| "valid_targets_min": 1525 |
| }, |
| { |
| "epoch": 4.984126984126984, |
| "grad_norm": 0.8382447486874602, |
| "learning_rate": 9.295763900481977e-06, |
| "loss": 0.23, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08970605581998825, |
| "step": 3140, |
| "valid_targets_mean": 2422.5, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 4.992063492063492, |
| "grad_norm": 0.6946408347465951, |
| "learning_rate": 9.22898573541602e-06, |
| "loss": 0.2342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10561580210924149, |
| "step": 3145, |
| "valid_targets_mean": 3991.8, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.7898033128472092, |
| "learning_rate": 9.162376277539513e-06, |
| "loss": 0.2327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11227846145629883, |
| "step": 3150, |
| "valid_targets_mean": 2750.9, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 5.007936507936508, |
| "grad_norm": 0.7146420475983313, |
| "learning_rate": 9.095936570161301e-06, |
| "loss": 0.2179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12624788284301758, |
| "step": 3155, |
| "valid_targets_mean": 3846.4, |
| "valid_targets_min": 1350 |
| }, |
| { |
| "epoch": 5.015873015873016, |
| "grad_norm": 0.6517411197054727, |
| "learning_rate": 9.029667653931411e-06, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06766072660684586, |
| "step": 3160, |
| "valid_targets_mean": 3087.6, |
| "valid_targets_min": 942 |
| }, |
| { |
| "epoch": 5.023809523809524, |
| "grad_norm": 0.8345596778348867, |
| "learning_rate": 8.96357056682475e-06, |
| "loss": 0.2082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10621356964111328, |
| "step": 3165, |
| "valid_targets_mean": 2631.9, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 5.031746031746032, |
| "grad_norm": 0.8085550022852781, |
| "learning_rate": 8.897646344124882e-06, |
| "loss": 0.2104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12722842395305634, |
| "step": 3170, |
| "valid_targets_mean": 3126.6, |
| "valid_targets_min": 1496 |
| }, |
| { |
| "epoch": 5.0396825396825395, |
| "grad_norm": 0.6859939671973228, |
| "learning_rate": 8.83189601840773e-06, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08324988931417465, |
| "step": 3175, |
| "valid_targets_mean": 2954.6, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 5.0476190476190474, |
| "grad_norm": 0.6329422503933559, |
| "learning_rate": 8.766320619525511e-06, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11945187300443649, |
| "step": 3180, |
| "valid_targets_mean": 4450.5, |
| "valid_targets_min": 1558 |
| }, |
| { |
| "epoch": 5.055555555555555, |
| "grad_norm": 0.8029282832348713, |
| "learning_rate": 8.700921174590525e-06, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10649940371513367, |
| "step": 3185, |
| "valid_targets_mean": 2527.2, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 5.063492063492063, |
| "grad_norm": 0.6560077390622969, |
| "learning_rate": 8.63569870795907e-06, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12603171169757843, |
| "step": 3190, |
| "valid_targets_mean": 5060.4, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 5.071428571428571, |
| "grad_norm": 0.7218401202124031, |
| "learning_rate": 8.570654241215466e-06, |
| "loss": 0.2102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11767058074474335, |
| "step": 3195, |
| "valid_targets_mean": 3966.0, |
| "valid_targets_min": 2226 |
| }, |
| { |
| "epoch": 5.079365079365079, |
| "grad_norm": 0.8081789481249295, |
| "learning_rate": 8.505788793155978e-06, |
| "loss": 0.2042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08667795360088348, |
| "step": 3200, |
| "valid_targets_mean": 2434.5, |
| "valid_targets_min": 1440 |
| }, |
| { |
| "epoch": 5.087301587301587, |
| "grad_norm": 0.7458764582812119, |
| "learning_rate": 8.441103379772893e-06, |
| "loss": 0.2043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09307099878787994, |
| "step": 3205, |
| "valid_targets_mean": 3196.9, |
| "valid_targets_min": 1336 |
| }, |
| { |
| "epoch": 5.095238095238095, |
| "grad_norm": 0.6048773964520159, |
| "learning_rate": 8.376599014238605e-06, |
| "loss": 0.2026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08689746260643005, |
| "step": 3210, |
| "valid_targets_mean": 3691.8, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 5.103174603174603, |
| "grad_norm": 0.7088750227894017, |
| "learning_rate": 8.312276706889738e-06, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11118713021278381, |
| "step": 3215, |
| "valid_targets_mean": 3710.4, |
| "valid_targets_min": 1442 |
| }, |
| { |
| "epoch": 5.111111111111111, |
| "grad_norm": 0.7875888873370555, |
| "learning_rate": 8.24813746521133e-06, |
| "loss": 0.2138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10653230547904968, |
| "step": 3220, |
| "valid_targets_mean": 2371.4, |
| "valid_targets_min": 1474 |
| }, |
| { |
| "epoch": 5.119047619047619, |
| "grad_norm": 0.6271107098202612, |
| "learning_rate": 8.184182293821046e-06, |
| "loss": 0.2123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09181641787290573, |
| "step": 3225, |
| "valid_targets_mean": 3844.1, |
| "valid_targets_min": 1192 |
| }, |
| { |
| "epoch": 5.1269841269841265, |
| "grad_norm": 0.7729536882848088, |
| "learning_rate": 8.120412194453442e-06, |
| "loss": 0.2138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13168609142303467, |
| "step": 3230, |
| "valid_targets_mean": 3441.9, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 5.134920634920635, |
| "grad_norm": 0.7684229615937804, |
| "learning_rate": 8.056828165944282e-06, |
| "loss": 0.2075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09150117635726929, |
| "step": 3235, |
| "valid_targets_mean": 2375.8, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 5.142857142857143, |
| "grad_norm": 0.7878065076580593, |
| "learning_rate": 7.993431204214883e-06, |
| "loss": 0.2051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1006222665309906, |
| "step": 3240, |
| "valid_targets_mean": 2976.8, |
| "valid_targets_min": 877 |
| }, |
| { |
| "epoch": 5.150793650793651, |
| "grad_norm": 0.7479238006778793, |
| "learning_rate": 7.93022230225652e-06, |
| "loss": 0.219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12401343137025833, |
| "step": 3245, |
| "valid_targets_mean": 3254.5, |
| "valid_targets_min": 1008 |
| }, |
| { |
| "epoch": 5.158730158730159, |
| "grad_norm": 0.702402201184209, |
| "learning_rate": 7.867202450114892e-06, |
| "loss": 0.2206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09244085103273392, |
| "step": 3250, |
| "valid_targets_mean": 3044.9, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 5.166666666666667, |
| "grad_norm": 0.6904073371631958, |
| "learning_rate": 7.804372634874582e-06, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11687523871660233, |
| "step": 3255, |
| "valid_targets_mean": 4131.0, |
| "valid_targets_min": 1638 |
| }, |
| { |
| "epoch": 5.174603174603175, |
| "grad_norm": 0.794713029359026, |
| "learning_rate": 7.74173384064359e-06, |
| "loss": 0.2004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10450978577136993, |
| "step": 3260, |
| "valid_targets_mean": 3100.6, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 5.182539682539683, |
| "grad_norm": 0.7899895590351436, |
| "learning_rate": 7.679287048537987e-06, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12722371518611908, |
| "step": 3265, |
| "valid_targets_mean": 3208.2, |
| "valid_targets_min": 1358 |
| }, |
| { |
| "epoch": 5.190476190476191, |
| "grad_norm": 0.6296178163629895, |
| "learning_rate": 7.617033236666469e-06, |
| "loss": 0.2057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07929957658052444, |
| "step": 3270, |
| "valid_targets_mean": 3253.1, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 5.198412698412699, |
| "grad_norm": 0.772550287330192, |
| "learning_rate": 7.55497338011506e-06, |
| "loss": 0.2169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12237787246704102, |
| "step": 3275, |
| "valid_targets_mean": 3851.5, |
| "valid_targets_min": 1990 |
| }, |
| { |
| "epoch": 5.2063492063492065, |
| "grad_norm": 0.6767191861039769, |
| "learning_rate": 7.493108450931879e-06, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10229524970054626, |
| "step": 3280, |
| "valid_targets_mean": 4133.1, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 5.214285714285714, |
| "grad_norm": 0.720480770224619, |
| "learning_rate": 7.4314394181118636e-06, |
| "loss": 0.2118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11554890125989914, |
| "step": 3285, |
| "valid_targets_mean": 4656.8, |
| "valid_targets_min": 1672 |
| }, |
| { |
| "epoch": 5.222222222222222, |
| "grad_norm": 0.726519804219711, |
| "learning_rate": 7.369967247581611e-06, |
| "loss": 0.2175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1208588257431984, |
| "step": 3290, |
| "valid_targets_mean": 3772.8, |
| "valid_targets_min": 1731 |
| }, |
| { |
| "epoch": 5.23015873015873, |
| "grad_norm": 0.7321877521486466, |
| "learning_rate": 7.3086929021842575e-06, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1158241480588913, |
| "step": 3295, |
| "valid_targets_mean": 4226.0, |
| "valid_targets_min": 1607 |
| }, |
| { |
| "epoch": 5.238095238095238, |
| "grad_norm": 0.7393559355923631, |
| "learning_rate": 7.247617341664384e-06, |
| "loss": 0.2175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13511210680007935, |
| "step": 3300, |
| "valid_targets_mean": 4740.5, |
| "valid_targets_min": 1710 |
| }, |
| { |
| "epoch": 5.246031746031746, |
| "grad_norm": 0.793371294614497, |
| "learning_rate": 7.186741522652994e-06, |
| "loss": 0.2233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0859147161245346, |
| "step": 3305, |
| "valid_targets_mean": 2580.8, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 5.253968253968254, |
| "grad_norm": 0.8066319717320056, |
| "learning_rate": 7.12606639865252e-06, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.172830730676651, |
| "step": 3310, |
| "valid_targets_mean": 3399.0, |
| "valid_targets_min": 1479 |
| }, |
| { |
| "epoch": 5.261904761904762, |
| "grad_norm": 0.8161505028774265, |
| "learning_rate": 7.065592920021893e-06, |
| "loss": 0.2153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12437000870704651, |
| "step": 3315, |
| "valid_targets_mean": 2944.4, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 5.26984126984127, |
| "grad_norm": 0.6723134626596974, |
| "learning_rate": 7.005322033961679e-06, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09198858588933945, |
| "step": 3320, |
| "valid_targets_mean": 3883.2, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 5.277777777777778, |
| "grad_norm": 0.6815222171306629, |
| "learning_rate": 6.945254684499185e-06, |
| "loss": 0.2073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08335371315479279, |
| "step": 3325, |
| "valid_targets_mean": 3160.1, |
| "valid_targets_min": 1536 |
| }, |
| { |
| "epoch": 5.285714285714286, |
| "grad_norm": 0.9098274401850043, |
| "learning_rate": 6.8853918124737274e-06, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1184665709733963, |
| "step": 3330, |
| "valid_targets_mean": 2596.0, |
| "valid_targets_min": 1315 |
| }, |
| { |
| "epoch": 5.2936507936507935, |
| "grad_norm": 0.6857614007500089, |
| "learning_rate": 6.825734355521898e-06, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1017097607254982, |
| "step": 3335, |
| "valid_targets_mean": 4198.5, |
| "valid_targets_min": 1562 |
| }, |
| { |
| "epoch": 5.301587301587301, |
| "grad_norm": 0.8272058345129579, |
| "learning_rate": 6.766283248062817e-06, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08390039950609207, |
| "step": 3340, |
| "valid_targets_mean": 2267.4, |
| "valid_targets_min": 1306 |
| }, |
| { |
| "epoch": 5.309523809523809, |
| "grad_norm": 0.8083062386180365, |
| "learning_rate": 6.707039421283559e-06, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0976867526769638, |
| "step": 3345, |
| "valid_targets_mean": 2621.0, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 5.317460317460317, |
| "grad_norm": 0.7907657672139157, |
| "learning_rate": 6.648003803124559e-06, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06761344522237778, |
| "step": 3350, |
| "valid_targets_mean": 2349.9, |
| "valid_targets_min": 1323 |
| }, |
| { |
| "epoch": 5.325396825396825, |
| "grad_norm": 0.8295765502920541, |
| "learning_rate": 6.589177318265047e-06, |
| "loss": 0.2185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08894240111112595, |
| "step": 3355, |
| "valid_targets_mean": 3019.9, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 5.333333333333333, |
| "grad_norm": 0.7155977892403146, |
| "learning_rate": 6.53056088810857e-06, |
| "loss": 0.2062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08744360506534576, |
| "step": 3360, |
| "valid_targets_mean": 3405.6, |
| "valid_targets_min": 1690 |
| }, |
| { |
| "epoch": 5.341269841269841, |
| "grad_norm": 0.7623686882341104, |
| "learning_rate": 6.472155430768608e-06, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.096970334649086, |
| "step": 3365, |
| "valid_targets_mean": 3433.9, |
| "valid_targets_min": 1287 |
| }, |
| { |
| "epoch": 5.349206349206349, |
| "grad_norm": 0.6991086887361436, |
| "learning_rate": 6.413961861054132e-06, |
| "loss": 0.2024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09134359657764435, |
| "step": 3370, |
| "valid_targets_mean": 3337.8, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 5.357142857142857, |
| "grad_norm": 0.7184355046680967, |
| "learning_rate": 6.3559810904553095e-06, |
| "loss": 0.2179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09643669426441193, |
| "step": 3375, |
| "valid_targets_mean": 3267.6, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 5.365079365079365, |
| "grad_norm": 0.7691159521423506, |
| "learning_rate": 6.298214027129219e-06, |
| "loss": 0.2081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08167582750320435, |
| "step": 3380, |
| "valid_targets_mean": 3071.9, |
| "valid_targets_min": 2067 |
| }, |
| { |
| "epoch": 5.3730158730158735, |
| "grad_norm": 0.7232492216728219, |
| "learning_rate": 6.240661575885629e-06, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09442508220672607, |
| "step": 3385, |
| "valid_targets_mean": 3521.1, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 5.380952380952381, |
| "grad_norm": 0.7830495336781548, |
| "learning_rate": 6.183324638172819e-06, |
| "loss": 0.2221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10402445495128632, |
| "step": 3390, |
| "valid_targets_mean": 2552.1, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 5.388888888888889, |
| "grad_norm": 0.729818898985151, |
| "learning_rate": 6.126204112063463e-06, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1520620882511139, |
| "step": 3395, |
| "valid_targets_mean": 4477.5, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 5.396825396825397, |
| "grad_norm": 0.6920667559511638, |
| "learning_rate": 6.069300892240564e-06, |
| "loss": 0.1894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09078704565763474, |
| "step": 3400, |
| "valid_targets_mean": 3087.2, |
| "valid_targets_min": 1270 |
| }, |
| { |
| "epoch": 5.404761904761905, |
| "grad_norm": 0.7781077186783485, |
| "learning_rate": 6.0126158699834625e-06, |
| "loss": 0.2087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10325247049331665, |
| "step": 3405, |
| "valid_targets_mean": 3032.1, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 5.412698412698413, |
| "grad_norm": 0.7663501738172225, |
| "learning_rate": 5.956149933153816e-06, |
| "loss": 0.2134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07357954978942871, |
| "step": 3410, |
| "valid_targets_mean": 2068.0, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 5.420634920634921, |
| "grad_norm": 0.7027131190487993, |
| "learning_rate": 5.899903966181751e-06, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10673792660236359, |
| "step": 3415, |
| "valid_targets_mean": 3083.1, |
| "valid_targets_min": 1552 |
| }, |
| { |
| "epoch": 5.428571428571429, |
| "grad_norm": 0.6911729334824366, |
| "learning_rate": 5.843878850052007e-06, |
| "loss": 0.2137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09318830817937851, |
| "step": 3420, |
| "valid_targets_mean": 3576.4, |
| "valid_targets_min": 1720 |
| }, |
| { |
| "epoch": 5.436507936507937, |
| "grad_norm": 0.7317882758484224, |
| "learning_rate": 5.788075462290084e-06, |
| "loss": 0.2214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0958942249417305, |
| "step": 3425, |
| "valid_targets_mean": 2726.6, |
| "valid_targets_min": 1096 |
| }, |
| { |
| "epoch": 5.444444444444445, |
| "grad_norm": 0.7898992040430142, |
| "learning_rate": 5.732494676948554e-06, |
| "loss": 0.2095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1019308939576149, |
| "step": 3430, |
| "valid_targets_mean": 3273.1, |
| "valid_targets_min": 1297 |
| }, |
| { |
| "epoch": 5.4523809523809526, |
| "grad_norm": 0.6476619928289603, |
| "learning_rate": 5.677137364593363e-06, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1071840450167656, |
| "step": 3435, |
| "valid_targets_mean": 4286.2, |
| "valid_targets_min": 1373 |
| }, |
| { |
| "epoch": 5.4603174603174605, |
| "grad_norm": 0.8557484260093969, |
| "learning_rate": 5.622004392290163e-06, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12339898943901062, |
| "step": 3440, |
| "valid_targets_mean": 2923.4, |
| "valid_targets_min": 1672 |
| }, |
| { |
| "epoch": 5.468253968253968, |
| "grad_norm": 0.7015615872264492, |
| "learning_rate": 5.567096623590758e-06, |
| "loss": 0.2087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09825904667377472, |
| "step": 3445, |
| "valid_targets_mean": 3929.8, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 5.476190476190476, |
| "grad_norm": 0.8655562264421257, |
| "learning_rate": 5.512414918519573e-06, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1307569444179535, |
| "step": 3450, |
| "valid_targets_mean": 3211.2, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 5.484126984126984, |
| "grad_norm": 0.8890725294031256, |
| "learning_rate": 5.457960133560179e-06, |
| "loss": 0.2172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0857107937335968, |
| "step": 3455, |
| "valid_targets_mean": 1887.0, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 5.492063492063492, |
| "grad_norm": 0.7014404433696352, |
| "learning_rate": 5.403733121641883e-06, |
| "loss": 0.2053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0767240822315216, |
| "step": 3460, |
| "valid_targets_mean": 3447.1, |
| "valid_targets_min": 833 |
| }, |
| { |
| "epoch": 5.5, |
| "grad_norm": 0.7077085117048115, |
| "learning_rate": 5.349734732126366e-06, |
| "loss": 0.2122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1149144172668457, |
| "step": 3465, |
| "valid_targets_mean": 3409.2, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 5.507936507936508, |
| "grad_norm": 0.6964990148226815, |
| "learning_rate": 5.295965810794376e-06, |
| "loss": 0.2225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12690629065036774, |
| "step": 3470, |
| "valid_targets_mean": 4805.8, |
| "valid_targets_min": 1606 |
| }, |
| { |
| "epoch": 5.515873015873016, |
| "grad_norm": 0.71008503903071, |
| "learning_rate": 5.2424271998324895e-06, |
| "loss": 0.2084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1080438420176506, |
| "step": 3475, |
| "valid_targets_mean": 3492.4, |
| "valid_targets_min": 1643 |
| }, |
| { |
| "epoch": 5.523809523809524, |
| "grad_norm": 0.7353298420126876, |
| "learning_rate": 5.189119737819912e-06, |
| "loss": 0.2086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11497688293457031, |
| "step": 3480, |
| "valid_targets_mean": 3634.8, |
| "valid_targets_min": 969 |
| }, |
| { |
| "epoch": 5.531746031746032, |
| "grad_norm": 0.8109076591558645, |
| "learning_rate": 5.136044259715342e-06, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15082211792469025, |
| "step": 3485, |
| "valid_targets_mean": 3544.9, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 5.5396825396825395, |
| "grad_norm": 0.7922885526246444, |
| "learning_rate": 5.083201596843905e-06, |
| "loss": 0.2086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10521303117275238, |
| "step": 3490, |
| "valid_targets_mean": 4138.5, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 5.5476190476190474, |
| "grad_norm": 0.8243700889289516, |
| "learning_rate": 5.030592576884117e-06, |
| "loss": 0.2259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07981052994728088, |
| "step": 3495, |
| "valid_targets_mean": 2294.5, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 5.555555555555555, |
| "grad_norm": 0.6042313383840995, |
| "learning_rate": 4.978218023854928e-06, |
| "loss": 0.2271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08307897299528122, |
| "step": 3500, |
| "valid_targets_mean": 3926.1, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 5.563492063492063, |
| "grad_norm": 0.7790070861867432, |
| "learning_rate": 4.926078758102834e-06, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11292654275894165, |
| "step": 3505, |
| "valid_targets_mean": 3235.6, |
| "valid_targets_min": 1610 |
| }, |
| { |
| "epoch": 5.571428571428571, |
| "grad_norm": 0.7080847761324837, |
| "learning_rate": 4.87417559628897e-06, |
| "loss": 0.2164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1172761619091034, |
| "step": 3510, |
| "valid_targets_mean": 3966.9, |
| "valid_targets_min": 1625 |
| }, |
| { |
| "epoch": 5.579365079365079, |
| "grad_norm": 0.7463489141334009, |
| "learning_rate": 4.822509351376399e-06, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12706415355205536, |
| "step": 3515, |
| "valid_targets_mean": 3811.5, |
| "valid_targets_min": 2163 |
| }, |
| { |
| "epoch": 5.587301587301587, |
| "grad_norm": 0.7519098028952099, |
| "learning_rate": 4.7710808326173115e-06, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1024027168750763, |
| "step": 3520, |
| "valid_targets_mean": 3474.1, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 5.595238095238095, |
| "grad_norm": 0.7086990550463645, |
| "learning_rate": 4.719890845540385e-06, |
| "loss": 0.2085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10318700969219208, |
| "step": 3525, |
| "valid_targets_mean": 3613.8, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 5.603174603174603, |
| "grad_norm": 0.7506770758799025, |
| "learning_rate": 4.668940191938156e-06, |
| "loss": 0.2159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0782381072640419, |
| "step": 3530, |
| "valid_targets_mean": 2510.2, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 5.611111111111111, |
| "grad_norm": 0.696777680063598, |
| "learning_rate": 4.618229669854464e-06, |
| "loss": 0.2083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08006583154201508, |
| "step": 3535, |
| "valid_targets_mean": 3453.9, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 5.619047619047619, |
| "grad_norm": 0.922756787599331, |
| "learning_rate": 4.567760073571947e-06, |
| "loss": 0.2164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12967818975448608, |
| "step": 3540, |
| "valid_targets_mean": 4102.4, |
| "valid_targets_min": 1504 |
| }, |
| { |
| "epoch": 5.6269841269841265, |
| "grad_norm": 0.7078421783660265, |
| "learning_rate": 4.51753219359961e-06, |
| "loss": 0.2167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09606287628412247, |
| "step": 3545, |
| "valid_targets_mean": 3108.1, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 5.634920634920634, |
| "grad_norm": 0.7506430958719362, |
| "learning_rate": 4.467546816660433e-06, |
| "loss": 0.2061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09307855367660522, |
| "step": 3550, |
| "valid_targets_mean": 2918.5, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 5.642857142857143, |
| "grad_norm": 0.9094911858240387, |
| "learning_rate": 4.417804725679058e-06, |
| "loss": 0.2362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13038109242916107, |
| "step": 3555, |
| "valid_targets_mean": 2835.5, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 5.650793650793651, |
| "grad_norm": 0.9032674979239957, |
| "learning_rate": 4.368306699769518e-06, |
| "loss": 0.2144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13430385291576385, |
| "step": 3560, |
| "valid_targets_mean": 3887.0, |
| "valid_targets_min": 338 |
| }, |
| { |
| "epoch": 5.658730158730159, |
| "grad_norm": 0.7586381935839076, |
| "learning_rate": 4.319053514223033e-06, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08391046524047852, |
| "step": 3565, |
| "valid_targets_mean": 3104.5, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 5.666666666666667, |
| "grad_norm": 0.7301760680360758, |
| "learning_rate": 4.270045940495879e-06, |
| "loss": 0.2131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0900624692440033, |
| "step": 3570, |
| "valid_targets_mean": 2651.0, |
| "valid_targets_min": 1582 |
| }, |
| { |
| "epoch": 5.674603174603175, |
| "grad_norm": 0.7547968526194967, |
| "learning_rate": 4.221284746197292e-06, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08366125822067261, |
| "step": 3575, |
| "valid_targets_mean": 2382.6, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 5.682539682539683, |
| "grad_norm": 0.8234421252575538, |
| "learning_rate": 4.172770695077437e-06, |
| "loss": 0.2037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11100704967975616, |
| "step": 3580, |
| "valid_targets_mean": 2705.6, |
| "valid_targets_min": 1352 |
| }, |
| { |
| "epoch": 5.690476190476191, |
| "grad_norm": 0.8174606359388051, |
| "learning_rate": 4.124504547015487e-06, |
| "loss": 0.2213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1208464503288269, |
| "step": 3585, |
| "valid_targets_mean": 3083.4, |
| "valid_targets_min": 1639 |
| }, |
| { |
| "epoch": 5.698412698412699, |
| "grad_norm": 0.7562999444174163, |
| "learning_rate": 4.0764870580076675e-06, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0921013206243515, |
| "step": 3590, |
| "valid_targets_mean": 2875.4, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 5.7063492063492065, |
| "grad_norm": 0.7965104320892732, |
| "learning_rate": 4.0287189801554304e-06, |
| "loss": 0.2131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09799252450466156, |
| "step": 3595, |
| "valid_targets_mean": 3153.5, |
| "valid_targets_min": 1286 |
| }, |
| { |
| "epoch": 5.714285714285714, |
| "grad_norm": 0.857269142950299, |
| "learning_rate": 3.98120106165371e-06, |
| "loss": 0.2133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08865942060947418, |
| "step": 3600, |
| "valid_targets_mean": 2800.6, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 5.722222222222222, |
| "grad_norm": 0.7527257186466023, |
| "learning_rate": 3.933934046779164e-06, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09972484409809113, |
| "step": 3605, |
| "valid_targets_mean": 2838.0, |
| "valid_targets_min": 1631 |
| }, |
| { |
| "epoch": 5.73015873015873, |
| "grad_norm": 0.5994753331151756, |
| "learning_rate": 3.886918675878513e-06, |
| "loss": 0.2074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08137780427932739, |
| "step": 3610, |
| "valid_targets_mean": 4263.1, |
| "valid_targets_min": 2086 |
| }, |
| { |
| "epoch": 5.738095238095238, |
| "grad_norm": 0.8232153717265387, |
| "learning_rate": 3.840155685356983e-06, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09935421496629715, |
| "step": 3615, |
| "valid_targets_mean": 2672.6, |
| "valid_targets_min": 1511 |
| }, |
| { |
| "epoch": 5.746031746031746, |
| "grad_norm": 0.750128536941153, |
| "learning_rate": 3.793645807666735e-06, |
| "loss": 0.2054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1128338873386383, |
| "step": 3620, |
| "valid_targets_mean": 3398.9, |
| "valid_targets_min": 1313 |
| }, |
| { |
| "epoch": 5.753968253968254, |
| "grad_norm": 0.7880891847487402, |
| "learning_rate": 3.747389771295411e-06, |
| "loss": 0.2213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10944647341966629, |
| "step": 3625, |
| "valid_targets_mean": 2556.5, |
| "valid_targets_min": 1189 |
| }, |
| { |
| "epoch": 5.761904761904762, |
| "grad_norm": 0.6786715199961021, |
| "learning_rate": 3.701388300754709e-06, |
| "loss": 0.203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11284029483795166, |
| "step": 3630, |
| "valid_targets_mean": 4237.8, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 5.76984126984127, |
| "grad_norm": 0.786402047995528, |
| "learning_rate": 3.6556421165690516e-06, |
| "loss": 0.2029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1069340705871582, |
| "step": 3635, |
| "valid_targets_mean": 3257.5, |
| "valid_targets_min": 1574 |
| }, |
| { |
| "epoch": 5.777777777777778, |
| "grad_norm": 0.9927590000924167, |
| "learning_rate": 3.610151935264288e-06, |
| "loss": 0.211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08624372631311417, |
| "step": 3640, |
| "valid_targets_mean": 2332.5, |
| "valid_targets_min": 318 |
| }, |
| { |
| "epoch": 5.785714285714286, |
| "grad_norm": 0.7575310728766175, |
| "learning_rate": 3.5649184693564797e-06, |
| "loss": 0.2304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08996361494064331, |
| "step": 3645, |
| "valid_targets_mean": 2656.9, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 5.7936507936507935, |
| "grad_norm": 0.6353430242205899, |
| "learning_rate": 3.5199424273407277e-06, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09710676968097687, |
| "step": 3650, |
| "valid_targets_mean": 4277.1, |
| "valid_targets_min": 2470 |
| }, |
| { |
| "epoch": 5.801587301587301, |
| "grad_norm": 0.8104745502933571, |
| "learning_rate": 3.4752245136801065e-06, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09580199420452118, |
| "step": 3655, |
| "valid_targets_mean": 2233.1, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 5.809523809523809, |
| "grad_norm": 0.8218115415777589, |
| "learning_rate": 3.430765428794569e-06, |
| "loss": 0.2171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09398232400417328, |
| "step": 3660, |
| "valid_targets_mean": 2095.1, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 5.817460317460317, |
| "grad_norm": 0.8000713802610769, |
| "learning_rate": 3.3865658690500424e-06, |
| "loss": 0.214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10749034583568573, |
| "step": 3665, |
| "valid_targets_mean": 3013.5, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 5.825396825396825, |
| "grad_norm": 0.816997724762598, |
| "learning_rate": 3.34262652674749e-06, |
| "loss": 0.2152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1072094738483429, |
| "step": 3670, |
| "valid_targets_mean": 3302.1, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 5.833333333333333, |
| "grad_norm": 0.7748883081700283, |
| "learning_rate": 3.2989480901120684e-06, |
| "loss": 0.2108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05944449454545975, |
| "step": 3675, |
| "valid_targets_mean": 1702.4, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 5.841269841269841, |
| "grad_norm": 0.7205680487267188, |
| "learning_rate": 3.2555312432823283e-06, |
| "loss": 0.2045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0655689686536789, |
| "step": 3680, |
| "valid_targets_mean": 2465.4, |
| "valid_targets_min": 1310 |
| }, |
| { |
| "epoch": 5.849206349206349, |
| "grad_norm": 0.7713827436038354, |
| "learning_rate": 3.2123766662995572e-06, |
| "loss": 0.2146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11447322368621826, |
| "step": 3685, |
| "valid_targets_mean": 3081.1, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 5.857142857142857, |
| "grad_norm": 0.6412703691192485, |
| "learning_rate": 3.1694850350970686e-06, |
| "loss": 0.203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13718387484550476, |
| "step": 3690, |
| "valid_targets_mean": 5159.6, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 5.865079365079366, |
| "grad_norm": 0.7311165566889636, |
| "learning_rate": 3.1268570214896265e-06, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10165748745203018, |
| "step": 3695, |
| "valid_targets_mean": 3384.6, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 5.8730158730158735, |
| "grad_norm": 0.838423608791939, |
| "learning_rate": 3.0844932931629602e-06, |
| "loss": 0.209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08572743833065033, |
| "step": 3700, |
| "valid_targets_mean": 2373.0, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 5.880952380952381, |
| "grad_norm": 0.6958758298936207, |
| "learning_rate": 3.0423945136632626e-06, |
| "loss": 0.2172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07737462967634201, |
| "step": 3705, |
| "valid_targets_mean": 2863.1, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 5.888888888888889, |
| "grad_norm": 0.6597673477275796, |
| "learning_rate": 3.000561342386814e-06, |
| "loss": 0.218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10114225745201111, |
| "step": 3710, |
| "valid_targets_mean": 3721.8, |
| "valid_targets_min": 1506 |
| }, |
| { |
| "epoch": 5.896825396825397, |
| "grad_norm": 0.8306491531882909, |
| "learning_rate": 2.9589944345696596e-06, |
| "loss": 0.202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11550882458686829, |
| "step": 3715, |
| "valid_targets_mean": 2761.6, |
| "valid_targets_min": 1327 |
| }, |
| { |
| "epoch": 5.904761904761905, |
| "grad_norm": 0.8683852586162994, |
| "learning_rate": 2.9176944412773322e-06, |
| "loss": 0.2233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09660732746124268, |
| "step": 3720, |
| "valid_targets_mean": 2080.1, |
| "valid_targets_min": 572 |
| }, |
| { |
| "epoch": 5.912698412698413, |
| "grad_norm": 0.7251086912309824, |
| "learning_rate": 2.876662009394673e-06, |
| "loss": 0.2291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12001783400774002, |
| "step": 3725, |
| "valid_targets_mean": 3939.5, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 5.920634920634921, |
| "grad_norm": 0.8129360177739626, |
| "learning_rate": 2.8358977816156796e-06, |
| "loss": 0.2125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10110355913639069, |
| "step": 3730, |
| "valid_targets_mean": 3384.8, |
| "valid_targets_min": 2192 |
| }, |
| { |
| "epoch": 5.928571428571429, |
| "grad_norm": 0.7180542554037956, |
| "learning_rate": 2.7954023964334485e-06, |
| "loss": 0.2107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09065502882003784, |
| "step": 3735, |
| "valid_targets_mean": 2732.5, |
| "valid_targets_min": 1448 |
| }, |
| { |
| "epoch": 5.936507936507937, |
| "grad_norm": 0.8552826097328355, |
| "learning_rate": 2.7551764881301955e-06, |
| "loss": 0.2192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08631910383701324, |
| "step": 3740, |
| "valid_targets_mean": 2285.6, |
| "valid_targets_min": 1428 |
| }, |
| { |
| "epoch": 5.944444444444445, |
| "grad_norm": 0.6262989640665731, |
| "learning_rate": 2.715220686767268e-06, |
| "loss": 0.2113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10843861103057861, |
| "step": 3745, |
| "valid_targets_mean": 5061.1, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 5.9523809523809526, |
| "grad_norm": 0.7897971423207434, |
| "learning_rate": 2.6755356181753247e-06, |
| "loss": 0.2083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10058259963989258, |
| "step": 3750, |
| "valid_targets_mean": 3069.1, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 5.9603174603174605, |
| "grad_norm": 0.7636236084851435, |
| "learning_rate": 2.6361219039445328e-06, |
| "loss": 0.2132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08092188835144043, |
| "step": 3755, |
| "valid_targets_mean": 2315.1, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 5.968253968253968, |
| "grad_norm": 0.6963273983529872, |
| "learning_rate": 2.5969801614147838e-06, |
| "loss": 0.2164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1218203455209732, |
| "step": 3760, |
| "valid_targets_mean": 4196.5, |
| "valid_targets_min": 1130 |
| }, |
| { |
| "epoch": 5.976190476190476, |
| "grad_norm": 0.6948330177609254, |
| "learning_rate": 2.558111003666075e-06, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09535790979862213, |
| "step": 3765, |
| "valid_targets_mean": 2892.5, |
| "valid_targets_min": 1354 |
| }, |
| { |
| "epoch": 5.984126984126984, |
| "grad_norm": 0.7485809892595101, |
| "learning_rate": 2.519515039508893e-06, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12762418389320374, |
| "step": 3770, |
| "valid_targets_mean": 4171.5, |
| "valid_targets_min": 1710 |
| }, |
| { |
| "epoch": 5.992063492063492, |
| "grad_norm": 0.7209339180022664, |
| "learning_rate": 2.481192873474667e-06, |
| "loss": 0.2289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14580002427101135, |
| "step": 3775, |
| "valid_targets_mean": 4015.1, |
| "valid_targets_min": 1347 |
| }, |
| { |
| "epoch": 6.0, |
| "grad_norm": 0.7486824941956289, |
| "learning_rate": 2.4431451058062928e-06, |
| "loss": 0.2278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12455324083566666, |
| "step": 3780, |
| "valid_targets_mean": 3672.8, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 6.007936507936508, |
| "grad_norm": 0.6782508888637717, |
| "learning_rate": 2.4053723324487677e-06, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0711774080991745, |
| "step": 3785, |
| "valid_targets_mean": 2518.9, |
| "valid_targets_min": 1545 |
| }, |
| { |
| "epoch": 6.015873015873016, |
| "grad_norm": 0.6911427139250138, |
| "learning_rate": 2.3678751450398196e-06, |
| "loss": 0.2042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11248598247766495, |
| "step": 3790, |
| "valid_targets_mean": 3788.2, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 6.023809523809524, |
| "grad_norm": 0.7538661391977503, |
| "learning_rate": 2.330654130900656e-06, |
| "loss": 0.201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08532236516475677, |
| "step": 3795, |
| "valid_targets_mean": 2292.0, |
| "valid_targets_min": 1204 |
| }, |
| { |
| "epoch": 6.031746031746032, |
| "grad_norm": 0.8225525420805956, |
| "learning_rate": 2.2937098730267572e-06, |
| "loss": 0.2059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1298900842666626, |
| "step": 3800, |
| "valid_targets_mean": 3416.4, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 6.0396825396825395, |
| "grad_norm": 0.7635534745827315, |
| "learning_rate": 2.2570429500787604e-06, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0920785516500473, |
| "step": 3805, |
| "valid_targets_mean": 2786.8, |
| "valid_targets_min": 1354 |
| }, |
| { |
| "epoch": 6.0476190476190474, |
| "grad_norm": 0.659940926257208, |
| "learning_rate": 2.2206539363733738e-06, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.05400678142905235, |
| "step": 3810, |
| "valid_targets_mean": 2275.5, |
| "valid_targets_min": 364 |
| }, |
| { |
| "epoch": 6.055555555555555, |
| "grad_norm": 0.6973295697920284, |
| "learning_rate": 2.1845434018744038e-06, |
| "loss": 0.2127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12242526561021805, |
| "step": 3815, |
| "valid_targets_mean": 4405.4, |
| "valid_targets_min": 1473 |
| }, |
| { |
| "epoch": 6.063492063492063, |
| "grad_norm": 0.8213586989325722, |
| "learning_rate": 2.148711912183803e-06, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1367570012807846, |
| "step": 3820, |
| "valid_targets_mean": 3735.0, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 6.071428571428571, |
| "grad_norm": 0.679938514817628, |
| "learning_rate": 2.1131600285328458e-06, |
| "loss": 0.2193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09106817096471786, |
| "step": 3825, |
| "valid_targets_mean": 4257.8, |
| "valid_targets_min": 1554 |
| }, |
| { |
| "epoch": 6.079365079365079, |
| "grad_norm": 0.6807386614704928, |
| "learning_rate": 2.0778883077732903e-06, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12356531620025635, |
| "step": 3830, |
| "valid_targets_mean": 5071.1, |
| "valid_targets_min": 1373 |
| }, |
| { |
| "epoch": 6.087301587301587, |
| "grad_norm": 0.7553925830584054, |
| "learning_rate": 2.0428973023686983e-06, |
| "loss": 0.1971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10499994456768036, |
| "step": 3835, |
| "valid_targets_mean": 3480.4, |
| "valid_targets_min": 1535 |
| }, |
| { |
| "epoch": 6.095238095238095, |
| "grad_norm": 0.888088778216751, |
| "learning_rate": 2.0081875603857726e-06, |
| "loss": 0.2041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10103853046894073, |
| "step": 3840, |
| "valid_targets_mean": 2299.6, |
| "valid_targets_min": 1160 |
| }, |
| { |
| "epoch": 6.103174603174603, |
| "grad_norm": 0.6779555773520787, |
| "learning_rate": 1.973759625485743e-06, |
| "loss": 0.1859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10814555734395981, |
| "step": 3845, |
| "valid_targets_mean": 3903.9, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 6.111111111111111, |
| "grad_norm": 0.6945692361650982, |
| "learning_rate": 1.9396140369159e-06, |
| "loss": 0.1984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0844080001115799, |
| "step": 3850, |
| "valid_targets_mean": 3611.2, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 6.119047619047619, |
| "grad_norm": 0.819841381174835, |
| "learning_rate": 1.9057513295011087e-06, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17100293934345245, |
| "step": 3855, |
| "valid_targets_mean": 3577.8, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 6.1269841269841265, |
| "grad_norm": 0.6920995453717935, |
| "learning_rate": 1.8721720336354487e-06, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07847906649112701, |
| "step": 3860, |
| "valid_targets_mean": 2644.1, |
| "valid_targets_min": 1056 |
| }, |
| { |
| "epoch": 6.134920634920635, |
| "grad_norm": 0.7097918126712862, |
| "learning_rate": 1.8388766752739017e-06, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09960925579071045, |
| "step": 3865, |
| "valid_targets_mean": 3381.4, |
| "valid_targets_min": 1443 |
| }, |
| { |
| "epoch": 6.142857142857143, |
| "grad_norm": 0.6413975048934565, |
| "learning_rate": 1.805865775924116e-06, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09482008218765259, |
| "step": 3870, |
| "valid_targets_mean": 5026.4, |
| "valid_targets_min": 1530 |
| }, |
| { |
| "epoch": 6.150793650793651, |
| "grad_norm": 0.7978109804263973, |
| "learning_rate": 1.7731398526382416e-06, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14775651693344116, |
| "step": 3875, |
| "valid_targets_mean": 3349.0, |
| "valid_targets_min": 1775 |
| }, |
| { |
| "epoch": 6.158730158730159, |
| "grad_norm": 0.6618833893869975, |
| "learning_rate": 1.7406994180048231e-06, |
| "loss": 0.195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08926299959421158, |
| "step": 3880, |
| "valid_targets_mean": 3658.2, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 6.166666666666667, |
| "grad_norm": 0.6268145598843055, |
| "learning_rate": 1.7085449801407783e-06, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10563044995069504, |
| "step": 3885, |
| "valid_targets_mean": 4803.8, |
| "valid_targets_min": 2923 |
| }, |
| { |
| "epoch": 6.174603174603175, |
| "grad_norm": 0.7930198414251461, |
| "learning_rate": 1.67667704268343e-06, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09213380515575409, |
| "step": 3890, |
| "valid_targets_mean": 3095.4, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 6.182539682539683, |
| "grad_norm": 0.7855535649914588, |
| "learning_rate": 1.6450961047826353e-06, |
| "loss": 0.2021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10935674607753754, |
| "step": 3895, |
| "valid_targets_mean": 3000.8, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 6.190476190476191, |
| "grad_norm": 0.7167832062061632, |
| "learning_rate": 1.6138026610929446e-06, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0821952372789383, |
| "step": 3900, |
| "valid_targets_mean": 3084.2, |
| "valid_targets_min": 1591 |
| }, |
| { |
| "epoch": 6.198412698412699, |
| "grad_norm": 0.7355915549419297, |
| "learning_rate": 1.5827972017658732e-06, |
| "loss": 0.2043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07168291509151459, |
| "step": 3905, |
| "valid_targets_mean": 2457.8, |
| "valid_targets_min": 1347 |
| }, |
| { |
| "epoch": 6.2063492063492065, |
| "grad_norm": 0.7339590222002838, |
| "learning_rate": 1.5520802124422108e-06, |
| "loss": 0.2106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06518985331058502, |
| "step": 3910, |
| "valid_targets_mean": 2686.0, |
| "valid_targets_min": 1446 |
| }, |
| { |
| "epoch": 6.214285714285714, |
| "grad_norm": 0.7700254235965525, |
| "learning_rate": 1.5216521742444236e-06, |
| "loss": 0.2025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10491657257080078, |
| "step": 3915, |
| "valid_targets_mean": 3282.0, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 6.222222222222222, |
| "grad_norm": 0.7706206197929331, |
| "learning_rate": 1.491513563769118e-06, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1297735571861267, |
| "step": 3920, |
| "valid_targets_mean": 3537.9, |
| "valid_targets_min": 1342 |
| }, |
| { |
| "epoch": 6.23015873015873, |
| "grad_norm": 0.7125278750032971, |
| "learning_rate": 1.4616648530795673e-06, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12319030612707138, |
| "step": 3925, |
| "valid_targets_mean": 4568.1, |
| "valid_targets_min": 1083 |
| }, |
| { |
| "epoch": 6.238095238095238, |
| "grad_norm": 0.7509002816161764, |
| "learning_rate": 1.432106509698319e-06, |
| "loss": 0.2126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10249030590057373, |
| "step": 3930, |
| "valid_targets_mean": 3594.0, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 6.246031746031746, |
| "grad_norm": 0.8970120821160956, |
| "learning_rate": 1.4028389965998867e-06, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10491965711116791, |
| "step": 3935, |
| "valid_targets_mean": 2135.4, |
| "valid_targets_min": 1377 |
| }, |
| { |
| "epoch": 6.253968253968254, |
| "grad_norm": 0.8134853281807751, |
| "learning_rate": 1.3738627722034848e-06, |
| "loss": 0.216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08832602202892303, |
| "step": 3940, |
| "valid_targets_mean": 2626.1, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 6.261904761904762, |
| "grad_norm": 0.7862015024702198, |
| "learning_rate": 1.345178290365845e-06, |
| "loss": 0.1908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07818420976400375, |
| "step": 3945, |
| "valid_targets_mean": 2288.4, |
| "valid_targets_min": 1510 |
| }, |
| { |
| "epoch": 6.26984126984127, |
| "grad_norm": 0.8454958849822186, |
| "learning_rate": 1.3167860003741218e-06, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11491268873214722, |
| "step": 3950, |
| "valid_targets_mean": 3148.0, |
| "valid_targets_min": 1319 |
| }, |
| { |
| "epoch": 6.277777777777778, |
| "grad_norm": 0.9550952759949879, |
| "learning_rate": 1.2886863469388389e-06, |
| "loss": 0.2159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08679212629795074, |
| "step": 3955, |
| "valid_targets_mean": 1462.1, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 6.285714285714286, |
| "grad_norm": 0.6798761734084032, |
| "learning_rate": 1.2608797701869425e-06, |
| "loss": 0.2241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1112833023071289, |
| "step": 3960, |
| "valid_targets_mean": 4642.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 6.2936507936507935, |
| "grad_norm": 0.7161938785556553, |
| "learning_rate": 1.2333667056548881e-06, |
| "loss": 0.1954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0901009738445282, |
| "step": 3965, |
| "valid_targets_mean": 3483.0, |
| "valid_targets_min": 1438 |
| }, |
| { |
| "epoch": 6.301587301587301, |
| "grad_norm": 0.7919495256788115, |
| "learning_rate": 1.2061475842818337e-06, |
| "loss": 0.2134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10928655415773392, |
| "step": 3970, |
| "valid_targets_mean": 3111.4, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 6.309523809523809, |
| "grad_norm": 0.6622868143264027, |
| "learning_rate": 1.1792228324028776e-06, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0938882902264595, |
| "step": 3975, |
| "valid_targets_mean": 4688.2, |
| "valid_targets_min": 1526 |
| }, |
| { |
| "epoch": 6.317460317460317, |
| "grad_norm": 0.714843100243358, |
| "learning_rate": 1.152592871742395e-06, |
| "loss": 0.2008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08914178609848022, |
| "step": 3980, |
| "valid_targets_mean": 3923.6, |
| "valid_targets_min": 1905 |
| }, |
| { |
| "epoch": 6.325396825396825, |
| "grad_norm": 0.7459606794822701, |
| "learning_rate": 1.1262581194074152e-06, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13458332419395447, |
| "step": 3985, |
| "valid_targets_mean": 3634.6, |
| "valid_targets_min": 1182 |
| }, |
| { |
| "epoch": 6.333333333333333, |
| "grad_norm": 0.7535897780328545, |
| "learning_rate": 1.100218987881112e-06, |
| "loss": 0.1972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08394159376621246, |
| "step": 3990, |
| "valid_targets_mean": 2917.5, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 6.341269841269841, |
| "grad_norm": 0.6530045323214579, |
| "learning_rate": 1.0744758850163085e-06, |
| "loss": 0.2044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12506398558616638, |
| "step": 3995, |
| "valid_targets_mean": 4917.4, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 6.349206349206349, |
| "grad_norm": 0.7979509577422987, |
| "learning_rate": 1.0490292140291247e-06, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11587633192539215, |
| "step": 4000, |
| "valid_targets_mean": 2967.2, |
| "valid_targets_min": 1396 |
| }, |
| { |
| "epoch": 6.357142857142857, |
| "grad_norm": 0.8755874967319832, |
| "learning_rate": 1.0238793734926467e-06, |
| "loss": 0.2186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13597938418388367, |
| "step": 4005, |
| "valid_targets_mean": 2481.9, |
| "valid_targets_min": 1132 |
| }, |
| { |
| "epoch": 6.365079365079365, |
| "grad_norm": 0.6783876323503061, |
| "learning_rate": 9.990267573306745e-07, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10617756843566895, |
| "step": 4010, |
| "valid_targets_mean": 4420.9, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 6.3730158730158735, |
| "grad_norm": 0.722469792560784, |
| "learning_rate": 9.744717548115613e-07, |
| "loss": 0.2036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09820477664470673, |
| "step": 4015, |
| "valid_targets_mean": 3403.4, |
| "valid_targets_min": 1298 |
| }, |
| { |
| "epoch": 6.380952380952381, |
| "grad_norm": 0.733459872022677, |
| "learning_rate": 9.502147505421244e-07, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08142758905887604, |
| "step": 4020, |
| "valid_targets_mean": 2535.2, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 6.388888888888889, |
| "grad_norm": 0.8345987403978284, |
| "learning_rate": 9.262561244616108e-07, |
| "loss": 0.2039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10948467999696732, |
| "step": 4025, |
| "valid_targets_mean": 3486.9, |
| "valid_targets_min": 1180 |
| }, |
| { |
| "epoch": 6.396825396825397, |
| "grad_norm": 0.7819290637056325, |
| "learning_rate": 9.025962518357323e-07, |
| "loss": 0.1913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09386520832777023, |
| "step": 4030, |
| "valid_targets_mean": 4022.1, |
| "valid_targets_min": 2193 |
| }, |
| { |
| "epoch": 6.404761904761905, |
| "grad_norm": 0.7675973062209386, |
| "learning_rate": 8.792355032508282e-07, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10054197907447815, |
| "step": 4035, |
| "valid_targets_mean": 3192.8, |
| "valid_targets_min": 1637 |
| }, |
| { |
| "epoch": 6.412698412698413, |
| "grad_norm": 0.7308179209216745, |
| "learning_rate": 8.561742446080168e-07, |
| "loss": 0.2261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13068924844264984, |
| "step": 4040, |
| "valid_targets_mean": 4124.1, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 6.420634920634921, |
| "grad_norm": 0.7949394003439152, |
| "learning_rate": 8.334128371174955e-07, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09118463099002838, |
| "step": 4045, |
| "valid_targets_mean": 2320.0, |
| "valid_targets_min": 1229 |
| }, |
| { |
| "epoch": 6.428571428571429, |
| "grad_norm": 0.8482819989896451, |
| "learning_rate": 8.109516372928605e-07, |
| "loss": 0.2047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09792070090770721, |
| "step": 4050, |
| "valid_targets_mean": 2030.2, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 6.436507936507937, |
| "grad_norm": 0.6555352946842179, |
| "learning_rate": 7.887909969455366e-07, |
| "loss": 0.2065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10069252550601959, |
| "step": 4055, |
| "valid_targets_mean": 4303.4, |
| "valid_targets_min": 2117 |
| }, |
| { |
| "epoch": 6.444444444444445, |
| "grad_norm": 0.7356412967204531, |
| "learning_rate": 7.669312631792758e-07, |
| "loss": 0.2195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09753116965293884, |
| "step": 4060, |
| "valid_targets_mean": 3563.4, |
| "valid_targets_min": 1759 |
| }, |
| { |
| "epoch": 6.4523809523809526, |
| "grad_norm": 0.831688287232052, |
| "learning_rate": 7.453727783846876e-07, |
| "loss": 0.2045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13499116897583008, |
| "step": 4065, |
| "valid_targets_mean": 3057.4, |
| "valid_targets_min": 1139 |
| }, |
| { |
| "epoch": 6.4603174603174605, |
| "grad_norm": 0.7591710445025716, |
| "learning_rate": 7.241158802339065e-07, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1253347396850586, |
| "step": 4070, |
| "valid_targets_mean": 3662.1, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 6.468253968253968, |
| "grad_norm": 0.6810251121546419, |
| "learning_rate": 7.031609016753016e-07, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07710853219032288, |
| "step": 4075, |
| "valid_targets_mean": 2938.1, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 6.476190476190476, |
| "grad_norm": 0.7354002690469413, |
| "learning_rate": 6.825081709282377e-07, |
| "loss": 0.2027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10170842707157135, |
| "step": 4080, |
| "valid_targets_mean": 3541.6, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 6.484126984126984, |
| "grad_norm": 0.6860941434399659, |
| "learning_rate": 6.62158011477958e-07, |
| "loss": 0.1941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08662896603345871, |
| "step": 4085, |
| "valid_targets_mean": 3065.5, |
| "valid_targets_min": 1368 |
| }, |
| { |
| "epoch": 6.492063492063492, |
| "grad_norm": 0.8315820409255328, |
| "learning_rate": 6.421107420705097e-07, |
| "loss": 0.2066, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10763676464557648, |
| "step": 4090, |
| "valid_targets_mean": 2476.9, |
| "valid_targets_min": 1314 |
| }, |
| { |
| "epoch": 6.5, |
| "grad_norm": 0.6779255746870322, |
| "learning_rate": 6.223666767077508e-07, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10068156570196152, |
| "step": 4095, |
| "valid_targets_mean": 4325.5, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 6.507936507936508, |
| "grad_norm": 0.703785843801452, |
| "learning_rate": 6.029261246424267e-07, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08343538641929626, |
| "step": 4100, |
| "valid_targets_mean": 3569.0, |
| "valid_targets_min": 1165 |
| }, |
| { |
| "epoch": 6.515873015873016, |
| "grad_norm": 0.8180230926027161, |
| "learning_rate": 5.837893903733394e-07, |
| "loss": 0.2101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1009148359298706, |
| "step": 4105, |
| "valid_targets_mean": 2869.2, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 6.523809523809524, |
| "grad_norm": 0.8734844267563727, |
| "learning_rate": 5.649567736405681e-07, |
| "loss": 0.1972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09930504113435745, |
| "step": 4110, |
| "valid_targets_mean": 2767.9, |
| "valid_targets_min": 1455 |
| }, |
| { |
| "epoch": 6.531746031746032, |
| "grad_norm": 0.7514289018139494, |
| "learning_rate": 5.464285694207672e-07, |
| "loss": 0.1897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11243937909603119, |
| "step": 4115, |
| "valid_targets_mean": 4020.0, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 6.5396825396825395, |
| "grad_norm": 0.6536374909100122, |
| "learning_rate": 5.282050679225714e-07, |
| "loss": 0.1951, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10605214536190033, |
| "step": 4120, |
| "valid_targets_mean": 3659.0, |
| "valid_targets_min": 1727 |
| }, |
| { |
| "epoch": 6.5476190476190474, |
| "grad_norm": 0.792550081612281, |
| "learning_rate": 5.102865545820245e-07, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15852200984954834, |
| "step": 4125, |
| "valid_targets_mean": 3726.1, |
| "valid_targets_min": 1391 |
| }, |
| { |
| "epoch": 6.555555555555555, |
| "grad_norm": 0.6031293409437452, |
| "learning_rate": 4.926733100581182e-07, |
| "loss": 0.2018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0508820079267025, |
| "step": 4130, |
| "valid_targets_mean": 3083.6, |
| "valid_targets_min": 1152 |
| }, |
| { |
| "epoch": 6.563492063492063, |
| "grad_norm": 0.9382734552288612, |
| "learning_rate": 4.7536561022840213e-07, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12225069105625153, |
| "step": 4135, |
| "valid_targets_mean": 2312.8, |
| "valid_targets_min": 1435 |
| }, |
| { |
| "epoch": 6.571428571428571, |
| "grad_norm": 0.8645030624347266, |
| "learning_rate": 4.5836372618464964e-07, |
| "loss": 0.2033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10689771175384521, |
| "step": 4140, |
| "valid_targets_mean": 2341.1, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 6.579365079365079, |
| "grad_norm": 0.6811962105069355, |
| "learning_rate": 4.416679242286215e-07, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09631943702697754, |
| "step": 4145, |
| "valid_targets_mean": 4323.8, |
| "valid_targets_min": 1536 |
| }, |
| { |
| "epoch": 6.587301587301587, |
| "grad_norm": 0.9350005697667735, |
| "learning_rate": 4.2527846586789547e-07, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10233885049819946, |
| "step": 4150, |
| "valid_targets_mean": 1772.5, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 6.595238095238095, |
| "grad_norm": 0.7013237365598121, |
| "learning_rate": 4.0919560781176317e-07, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09215062111616135, |
| "step": 4155, |
| "valid_targets_mean": 3150.1, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 6.603174603174603, |
| "grad_norm": 0.6666170005950856, |
| "learning_rate": 3.934196019672176e-07, |
| "loss": 0.1953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06517612934112549, |
| "step": 4160, |
| "valid_targets_mean": 2124.1, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 6.611111111111111, |
| "grad_norm": 0.7153573335048872, |
| "learning_rate": 3.779506954349965e-07, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09253278374671936, |
| "step": 4165, |
| "valid_targets_mean": 3570.9, |
| "valid_targets_min": 1996 |
| }, |
| { |
| "epoch": 6.619047619047619, |
| "grad_norm": 0.6315001261313217, |
| "learning_rate": 3.6278913050572076e-07, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09306520223617554, |
| "step": 4170, |
| "valid_targets_mean": 4232.5, |
| "valid_targets_min": 1537 |
| }, |
| { |
| "epoch": 6.6269841269841265, |
| "grad_norm": 0.815649453820826, |
| "learning_rate": 3.4793514465610414e-07, |
| "loss": 0.22, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11297182738780975, |
| "step": 4175, |
| "valid_targets_mean": 3307.9, |
| "valid_targets_min": 1436 |
| }, |
| { |
| "epoch": 6.634920634920634, |
| "grad_norm": 0.8506804351795452, |
| "learning_rate": 3.3338897054521205e-07, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07656246423721313, |
| "step": 4180, |
| "valid_targets_mean": 1789.6, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 6.642857142857143, |
| "grad_norm": 0.6360744471035349, |
| "learning_rate": 3.191508360108464e-07, |
| "loss": 0.2141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11496680974960327, |
| "step": 4185, |
| "valid_targets_mean": 4958.0, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 6.650793650793651, |
| "grad_norm": 0.7875567736431006, |
| "learning_rate": 3.0522096406595536e-07, |
| "loss": 0.1985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07022293657064438, |
| "step": 4190, |
| "valid_targets_mean": 2186.5, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 6.658730158730159, |
| "grad_norm": 0.7266157867648473, |
| "learning_rate": 2.9159957289514926e-07, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08252222090959549, |
| "step": 4195, |
| "valid_targets_mean": 3179.4, |
| "valid_targets_min": 1158 |
| }, |
| { |
| "epoch": 6.666666666666667, |
| "grad_norm": 0.7434994690323846, |
| "learning_rate": 2.782868758512791e-07, |
| "loss": 0.2041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11222994327545166, |
| "step": 4200, |
| "valid_targets_mean": 3610.9, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 6.674603174603175, |
| "grad_norm": 0.9804608900117372, |
| "learning_rate": 2.6528308145210125e-07, |
| "loss": 0.2021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11486151814460754, |
| "step": 4205, |
| "valid_targets_mean": 2239.6, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 6.682539682539683, |
| "grad_norm": 0.8248478366294771, |
| "learning_rate": 2.525883933770046e-07, |
| "loss": 0.2053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09823493659496307, |
| "step": 4210, |
| "valid_targets_mean": 3023.0, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 6.690476190476191, |
| "grad_norm": 0.6927076587244559, |
| "learning_rate": 2.402030104638198e-07, |
| "loss": 0.2044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08244895935058594, |
| "step": 4215, |
| "valid_targets_mean": 3867.2, |
| "valid_targets_min": 1395 |
| }, |
| { |
| "epoch": 6.698412698412699, |
| "grad_norm": 0.8426480786347594, |
| "learning_rate": 2.2812712670571502e-07, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08320321142673492, |
| "step": 4220, |
| "valid_targets_mean": 2116.5, |
| "valid_targets_min": 1014 |
| }, |
| { |
| "epoch": 6.7063492063492065, |
| "grad_norm": 0.6551086035705184, |
| "learning_rate": 2.1636093124814738e-07, |
| "loss": 0.1973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09654587507247925, |
| "step": 4225, |
| "valid_targets_mean": 4037.6, |
| "valid_targets_min": 1436 |
| }, |
| { |
| "epoch": 6.714285714285714, |
| "grad_norm": 0.6617880708598886, |
| "learning_rate": 2.0490460838589855e-07, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10055264830589294, |
| "step": 4230, |
| "valid_targets_mean": 4157.2, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 6.722222222222222, |
| "grad_norm": 0.7010021079670415, |
| "learning_rate": 1.9375833756019923e-07, |
| "loss": 0.1999, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06797967851161957, |
| "step": 4235, |
| "valid_targets_mean": 2408.1, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 6.73015873015873, |
| "grad_norm": 0.7857502387885508, |
| "learning_rate": 1.8292229335590716e-07, |
| "loss": 0.2192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11493973433971405, |
| "step": 4240, |
| "valid_targets_mean": 3881.6, |
| "valid_targets_min": 1440 |
| }, |
| { |
| "epoch": 6.738095238095238, |
| "grad_norm": 0.6685857676840744, |
| "learning_rate": 1.7239664549878688e-07, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11982367932796478, |
| "step": 4245, |
| "valid_targets_mean": 4794.2, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 6.746031746031746, |
| "grad_norm": 0.8352380931276744, |
| "learning_rate": 1.6218155885283192e-07, |
| "loss": 0.1895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09608037769794464, |
| "step": 4250, |
| "valid_targets_mean": 2731.6, |
| "valid_targets_min": 1142 |
| }, |
| { |
| "epoch": 6.753968253968254, |
| "grad_norm": 0.7422039573980747, |
| "learning_rate": 1.5227719341769364e-07, |
| "loss": 0.2053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10857705026865005, |
| "step": 4255, |
| "valid_targets_mean": 4047.4, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 6.761904761904762, |
| "grad_norm": 0.8106967225306234, |
| "learning_rate": 1.4268370432618306e-07, |
| "loss": 0.2092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11048707365989685, |
| "step": 4260, |
| "valid_targets_mean": 3013.6, |
| "valid_targets_min": 1213 |
| }, |
| { |
| "epoch": 6.76984126984127, |
| "grad_norm": 0.6751488059587877, |
| "learning_rate": 1.3340124184182178e-07, |
| "loss": 0.2016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08324621617794037, |
| "step": 4265, |
| "valid_targets_mean": 2745.6, |
| "valid_targets_min": 838 |
| }, |
| { |
| "epoch": 6.777777777777778, |
| "grad_norm": 0.8655488128813514, |
| "learning_rate": 1.2442995135650393e-07, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08682005107402802, |
| "step": 4270, |
| "valid_targets_mean": 1827.8, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 6.785714285714286, |
| "grad_norm": 0.7408048732361547, |
| "learning_rate": 1.1576997338821339e-07, |
| "loss": 0.2075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08840866386890411, |
| "step": 4275, |
| "valid_targets_mean": 3092.5, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 6.7936507936507935, |
| "grad_norm": 0.7105155741932084, |
| "learning_rate": 1.0742144357882567e-07, |
| "loss": 0.2121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07121296972036362, |
| "step": 4280, |
| "valid_targets_mean": 3423.8, |
| "valid_targets_min": 1620 |
| }, |
| { |
| "epoch": 6.801587301587301, |
| "grad_norm": 0.7068956813433978, |
| "learning_rate": 9.938449269197181e-08, |
| "loss": 0.2034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0767413005232811, |
| "step": 4285, |
| "valid_targets_mean": 3846.8, |
| "valid_targets_min": 1080 |
| }, |
| { |
| "epoch": 6.809523809523809, |
| "grad_norm": 0.6965119531557177, |
| "learning_rate": 9.165924661100889e-08, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09733986854553223, |
| "step": 4290, |
| "valid_targets_mean": 4943.8, |
| "valid_targets_min": 1648 |
| }, |
| { |
| "epoch": 6.817460317460317, |
| "grad_norm": 0.624576583182396, |
| "learning_rate": 8.424582633703493e-08, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09332321584224701, |
| "step": 4295, |
| "valid_targets_mean": 4326.4, |
| "valid_targets_min": 1787 |
| }, |
| { |
| "epoch": 6.825396825396825, |
| "grad_norm": 0.7482091326815062, |
| "learning_rate": 7.714434798699933e-08, |
| "loss": 0.2196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08122950047254562, |
| "step": 4300, |
| "valid_targets_mean": 2637.1, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 6.833333333333333, |
| "grad_norm": 0.7797234183323177, |
| "learning_rate": 7.035492279187538e-08, |
| "loss": 0.2058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1142660602927208, |
| "step": 4305, |
| "valid_targets_mean": 3337.1, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 6.841269841269841, |
| "grad_norm": 0.7603070154020699, |
| "learning_rate": 6.387765709493288e-08, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11581508815288544, |
| "step": 4310, |
| "valid_targets_mean": 3581.8, |
| "valid_targets_min": 1559 |
| }, |
| { |
| "epoch": 6.849206349206349, |
| "grad_norm": 0.8265224795703434, |
| "learning_rate": 5.7712652350061515e-08, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1010211855173111, |
| "step": 4315, |
| "valid_targets_mean": 2683.1, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 6.857142857142857, |
| "grad_norm": 0.8763516568425196, |
| "learning_rate": 5.186000512018341e-08, |
| "loss": 0.2248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12908044457435608, |
| "step": 4320, |
| "valid_targets_mean": 3439.4, |
| "valid_targets_min": 1869 |
| }, |
| { |
| "epoch": 6.865079365079366, |
| "grad_norm": 0.7573392781428435, |
| "learning_rate": 4.631980707574535e-08, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11205847561359406, |
| "step": 4325, |
| "valid_targets_mean": 3704.8, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 6.8730158730158735, |
| "grad_norm": 0.7230981939132772, |
| "learning_rate": 4.10921449932733e-08, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13283637166023254, |
| "step": 4330, |
| "valid_targets_mean": 4179.9, |
| "valid_targets_min": 1573 |
| }, |
| { |
| "epoch": 6.880952380952381, |
| "grad_norm": 0.7439954422056636, |
| "learning_rate": 3.61771007540268e-08, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1041351854801178, |
| "step": 4335, |
| "valid_targets_mean": 3090.6, |
| "valid_targets_min": 1286 |
| }, |
| { |
| "epoch": 6.888888888888889, |
| "grad_norm": 0.800212928436307, |
| "learning_rate": 3.157475134270227e-08, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1381809115409851, |
| "step": 4340, |
| "valid_targets_mean": 4396.8, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 6.896825396825397, |
| "grad_norm": 0.7600538047962414, |
| "learning_rate": 2.728516884624277e-08, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09590177237987518, |
| "step": 4345, |
| "valid_targets_mean": 3049.9, |
| "valid_targets_min": 1365 |
| }, |
| { |
| "epoch": 6.904761904761905, |
| "grad_norm": 0.7875192862873142, |
| "learning_rate": 2.3308420452690106e-08, |
| "loss": 0.2035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09034988284111023, |
| "step": 4350, |
| "valid_targets_mean": 2993.2, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 6.912698412698413, |
| "grad_norm": 0.7653025338992717, |
| "learning_rate": 1.9644568450147837e-08, |
| "loss": 0.2165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1180688887834549, |
| "step": 4355, |
| "valid_targets_mean": 3412.2, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 6.920634920634921, |
| "grad_norm": 0.776729001579722, |
| "learning_rate": 1.6293670225799864e-08, |
| "loss": 0.2097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1176794022321701, |
| "step": 4360, |
| "valid_targets_mean": 3754.5, |
| "valid_targets_min": 1897 |
| }, |
| { |
| "epoch": 6.928571428571429, |
| "grad_norm": 0.9428126914025173, |
| "learning_rate": 1.3255778265013342e-08, |
| "loss": 0.2156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10972875356674194, |
| "step": 4365, |
| "valid_targets_mean": 2532.8, |
| "valid_targets_min": 1014 |
| }, |
| { |
| "epoch": 6.936507936507937, |
| "grad_norm": 0.8284198122126346, |
| "learning_rate": 1.0530940150512703e-08, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08045537769794464, |
| "step": 4370, |
| "valid_targets_mean": 2189.8, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 6.944444444444445, |
| "grad_norm": 0.8350132511254953, |
| "learning_rate": 8.119198561638009e-09, |
| "loss": 0.208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.090115025639534, |
| "step": 4375, |
| "valid_targets_mean": 2316.4, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 6.9523809523809526, |
| "grad_norm": 0.821524042196439, |
| "learning_rate": 6.020591273674381e-09, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09740573167800903, |
| "step": 4380, |
| "valid_targets_mean": 2340.9, |
| "valid_targets_min": 1488 |
| }, |
| { |
| "epoch": 6.9603174603174605, |
| "grad_norm": 0.7332655762989541, |
| "learning_rate": 4.2351511572635835e-09, |
| "loss": 0.2006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08111314475536346, |
| "step": 4385, |
| "valid_targets_mean": 2680.2, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 6.968253968253968, |
| "grad_norm": 0.7743587093318401, |
| "learning_rate": 2.7629061778866597e-09, |
| "loss": 0.2043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07953701913356781, |
| "step": 4390, |
| "valid_targets_mean": 2203.2, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 6.976190476190476, |
| "grad_norm": 0.7689455216523182, |
| "learning_rate": 1.603879395422059e-09, |
| "loss": 0.1993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1031486839056015, |
| "step": 4395, |
| "valid_targets_mean": 3022.2, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 6.984126984126984, |
| "grad_norm": 0.7245017440420248, |
| "learning_rate": 7.580889637925914e-10, |
| "loss": 0.1983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08405288308858871, |
| "step": 4400, |
| "valid_targets_mean": 3571.1, |
| "valid_targets_min": 1048 |
| }, |
| { |
| "epoch": 6.992063492063492, |
| "grad_norm": 0.7740093811974629, |
| "learning_rate": 2.2554813067676705e-10, |
| "loss": 0.1979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1309514343738556, |
| "step": 4405, |
| "valid_targets_mean": 3787.1, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 7.0, |
| "grad_norm": 0.7862017131182104, |
| "learning_rate": 6.265237300073778e-12, |
| "loss": 0.2044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12112488597631454, |
| "step": 4410, |
| "valid_targets_mean": 3677.4, |
| "valid_targets_min": 1243 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12112488597631454, |
| "step": 4410, |
| "total_flos": 1.1127298177168835e+18, |
| "train_loss": 0.27853014678641513, |
| "train_runtime": 38947.6166, |
| "train_samples_per_second": 1.811, |
| "train_steps_per_second": 0.113, |
| "valid_targets_mean": 3677.4, |
| "valid_targets_min": 1243 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4410, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1000, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1.1127298177168835e+18, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|