| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 3150, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.011111111111111112, |
| "grad_norm": 13.408544798581621, |
| "learning_rate": 5.07936507936508e-07, |
| "loss": 0.6676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5751245617866516, |
| "step": 5, |
| "valid_targets_mean": 5385.7, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 0.022222222222222223, |
| "grad_norm": 16.21108259140317, |
| "learning_rate": 1.142857142857143e-06, |
| "loss": 0.658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.687087893486023, |
| "step": 10, |
| "valid_targets_mean": 3831.0, |
| "valid_targets_min": 293 |
| }, |
| { |
| "epoch": 0.03333333333333333, |
| "grad_norm": 12.338215088436316, |
| "learning_rate": 1.777777777777778e-06, |
| "loss": 0.6536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6238576173782349, |
| "step": 15, |
| "valid_targets_mean": 4839.5, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 0.044444444444444446, |
| "grad_norm": 9.017393522713887, |
| "learning_rate": 2.412698412698413e-06, |
| "loss": 0.6353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5550223588943481, |
| "step": 20, |
| "valid_targets_mean": 4619.8, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 0.05555555555555555, |
| "grad_norm": 5.309166517130694, |
| "learning_rate": 3.047619047619048e-06, |
| "loss": 0.5386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5435296893119812, |
| "step": 25, |
| "valid_targets_mean": 4110.9, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 0.06666666666666667, |
| "grad_norm": 2.792780616604098, |
| "learning_rate": 3.6825396825396833e-06, |
| "loss": 0.5029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46670812368392944, |
| "step": 30, |
| "valid_targets_mean": 3455.2, |
| "valid_targets_min": 295 |
| }, |
| { |
| "epoch": 0.07777777777777778, |
| "grad_norm": 1.5959020052891244, |
| "learning_rate": 4.317460317460318e-06, |
| "loss": 0.4468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4236889183521271, |
| "step": 35, |
| "valid_targets_mean": 5468.6, |
| "valid_targets_min": 376 |
| }, |
| { |
| "epoch": 0.08888888888888889, |
| "grad_norm": 1.0408106474791263, |
| "learning_rate": 4.952380952380953e-06, |
| "loss": 0.4331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41928115487098694, |
| "step": 40, |
| "valid_targets_mean": 5478.6, |
| "valid_targets_min": 1395 |
| }, |
| { |
| "epoch": 0.1, |
| "grad_norm": 0.871196479469939, |
| "learning_rate": 5.5873015873015876e-06, |
| "loss": 0.4438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40255558490753174, |
| "step": 45, |
| "valid_targets_mean": 5138.5, |
| "valid_targets_min": 1811 |
| }, |
| { |
| "epoch": 0.1111111111111111, |
| "grad_norm": 0.8029816404229763, |
| "learning_rate": 6.222222222222223e-06, |
| "loss": 0.4316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3899801969528198, |
| "step": 50, |
| "valid_targets_mean": 4666.9, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 0.12222222222222222, |
| "grad_norm": 0.7515486206211541, |
| "learning_rate": 6.857142857142858e-06, |
| "loss": 0.4538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4362230896949768, |
| "step": 55, |
| "valid_targets_mean": 4455.1, |
| "valid_targets_min": 397 |
| }, |
| { |
| "epoch": 0.13333333333333333, |
| "grad_norm": 0.5887418945104569, |
| "learning_rate": 7.492063492063493e-06, |
| "loss": 0.3969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3481084108352661, |
| "step": 60, |
| "valid_targets_mean": 5121.1, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 0.14444444444444443, |
| "grad_norm": 0.6245277781771107, |
| "learning_rate": 8.126984126984128e-06, |
| "loss": 0.3905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36860743165016174, |
| "step": 65, |
| "valid_targets_mean": 3914.1, |
| "valid_targets_min": 269 |
| }, |
| { |
| "epoch": 0.15555555555555556, |
| "grad_norm": 0.5810023779977105, |
| "learning_rate": 8.761904761904763e-06, |
| "loss": 0.3874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3317573368549347, |
| "step": 70, |
| "valid_targets_mean": 4313.6, |
| "valid_targets_min": 1168 |
| }, |
| { |
| "epoch": 0.16666666666666666, |
| "grad_norm": 1.0288706410047126, |
| "learning_rate": 9.396825396825398e-06, |
| "loss": 0.356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3530646562576294, |
| "step": 75, |
| "valid_targets_mean": 3485.5, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 0.17777777777777778, |
| "grad_norm": 0.6056824865658866, |
| "learning_rate": 1.0031746031746033e-05, |
| "loss": 0.3536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3671146035194397, |
| "step": 80, |
| "valid_targets_mean": 3908.6, |
| "valid_targets_min": 257 |
| }, |
| { |
| "epoch": 0.18888888888888888, |
| "grad_norm": 0.6162370696114597, |
| "learning_rate": 1.0666666666666667e-05, |
| "loss": 0.3733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3743559718132019, |
| "step": 85, |
| "valid_targets_mean": 4694.6, |
| "valid_targets_min": 435 |
| }, |
| { |
| "epoch": 0.2, |
| "grad_norm": 0.5931909767383229, |
| "learning_rate": 1.1301587301587302e-05, |
| "loss": 0.34, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3645175099372864, |
| "step": 90, |
| "valid_targets_mean": 4516.5, |
| "valid_targets_min": 630 |
| }, |
| { |
| "epoch": 0.2111111111111111, |
| "grad_norm": 0.5852862045298343, |
| "learning_rate": 1.1936507936507937e-05, |
| "loss": 0.3612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33980345726013184, |
| "step": 95, |
| "valid_targets_mean": 4287.4, |
| "valid_targets_min": 377 |
| }, |
| { |
| "epoch": 0.2222222222222222, |
| "grad_norm": 0.591535838571353, |
| "learning_rate": 1.2571428571428572e-05, |
| "loss": 0.3496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3416215479373932, |
| "step": 100, |
| "valid_targets_mean": 3520.2, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 0.23333333333333334, |
| "grad_norm": 0.5517118398063217, |
| "learning_rate": 1.3206349206349206e-05, |
| "loss": 0.3417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3045486807823181, |
| "step": 105, |
| "valid_targets_mean": 3936.1, |
| "valid_targets_min": 355 |
| }, |
| { |
| "epoch": 0.24444444444444444, |
| "grad_norm": 0.6036669845712245, |
| "learning_rate": 1.3841269841269843e-05, |
| "loss": 0.3631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37737342715263367, |
| "step": 110, |
| "valid_targets_mean": 4156.3, |
| "valid_targets_min": 352 |
| }, |
| { |
| "epoch": 0.25555555555555554, |
| "grad_norm": 0.557851756149835, |
| "learning_rate": 1.4476190476190478e-05, |
| "loss": 0.33, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31270942091941833, |
| "step": 115, |
| "valid_targets_mean": 4740.2, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 0.26666666666666666, |
| "grad_norm": 0.5061593555204397, |
| "learning_rate": 1.5111111111111112e-05, |
| "loss": 0.3383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3117508292198181, |
| "step": 120, |
| "valid_targets_mean": 5759.2, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 0.2777777777777778, |
| "grad_norm": 0.5910898872360414, |
| "learning_rate": 1.5746031746031745e-05, |
| "loss": 0.3198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30763545632362366, |
| "step": 125, |
| "valid_targets_mean": 4890.5, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 0.28888888888888886, |
| "grad_norm": 0.44647524167329333, |
| "learning_rate": 1.6380952380952384e-05, |
| "loss": 0.302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27717962861061096, |
| "step": 130, |
| "valid_targets_mean": 5430.8, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 0.3, |
| "grad_norm": 0.5879317402321064, |
| "learning_rate": 1.7015873015873018e-05, |
| "loss": 0.3243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30784285068511963, |
| "step": 135, |
| "valid_targets_mean": 3904.9, |
| "valid_targets_min": 393 |
| }, |
| { |
| "epoch": 0.3111111111111111, |
| "grad_norm": 0.5605756164325479, |
| "learning_rate": 1.7650793650793653e-05, |
| "loss": 0.2979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2845287322998047, |
| "step": 140, |
| "valid_targets_mean": 4072.9, |
| "valid_targets_min": 517 |
| }, |
| { |
| "epoch": 0.32222222222222224, |
| "grad_norm": 0.5215552035079208, |
| "learning_rate": 1.8285714285714288e-05, |
| "loss": 0.3149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26664093136787415, |
| "step": 145, |
| "valid_targets_mean": 4416.2, |
| "valid_targets_min": 335 |
| }, |
| { |
| "epoch": 0.3333333333333333, |
| "grad_norm": 0.5674313964489882, |
| "learning_rate": 1.8920634920634923e-05, |
| "loss": 0.3226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3291376233100891, |
| "step": 150, |
| "valid_targets_mean": 5014.2, |
| "valid_targets_min": 251 |
| }, |
| { |
| "epoch": 0.34444444444444444, |
| "grad_norm": 0.5110719079947695, |
| "learning_rate": 1.9555555555555557e-05, |
| "loss": 0.3088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29836922883987427, |
| "step": 155, |
| "valid_targets_mean": 4633.4, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 0.35555555555555557, |
| "grad_norm": 0.6271829324260068, |
| "learning_rate": 2.0190476190476192e-05, |
| "loss": 0.3173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40676355361938477, |
| "step": 160, |
| "valid_targets_mean": 4353.1, |
| "valid_targets_min": 301 |
| }, |
| { |
| "epoch": 0.36666666666666664, |
| "grad_norm": 0.5661101605652876, |
| "learning_rate": 2.082539682539683e-05, |
| "loss": 0.3187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30450916290283203, |
| "step": 165, |
| "valid_targets_mean": 4222.2, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 0.37777777777777777, |
| "grad_norm": 0.5792882504021095, |
| "learning_rate": 2.146031746031746e-05, |
| "loss": 0.2887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3169078230857849, |
| "step": 170, |
| "valid_targets_mean": 4392.9, |
| "valid_targets_min": 286 |
| }, |
| { |
| "epoch": 0.3888888888888889, |
| "grad_norm": 0.5061884693546234, |
| "learning_rate": 2.20952380952381e-05, |
| "loss": 0.3388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32877248525619507, |
| "step": 175, |
| "valid_targets_mean": 4587.4, |
| "valid_targets_min": 603 |
| }, |
| { |
| "epoch": 0.4, |
| "grad_norm": 0.55673810264919, |
| "learning_rate": 2.273015873015873e-05, |
| "loss": 0.3079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3139079511165619, |
| "step": 180, |
| "valid_targets_mean": 5031.8, |
| "valid_targets_min": 391 |
| }, |
| { |
| "epoch": 0.4111111111111111, |
| "grad_norm": 0.7128274083633475, |
| "learning_rate": 2.336507936507937e-05, |
| "loss": 0.3189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3152565360069275, |
| "step": 185, |
| "valid_targets_mean": 2480.9, |
| "valid_targets_min": 339 |
| }, |
| { |
| "epoch": 0.4222222222222222, |
| "grad_norm": 0.5610727534792233, |
| "learning_rate": 2.4e-05, |
| "loss": 0.3086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3390665054321289, |
| "step": 190, |
| "valid_targets_mean": 4430.2, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 0.43333333333333335, |
| "grad_norm": 0.8939323722899397, |
| "learning_rate": 2.463492063492064e-05, |
| "loss": 0.3016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3454466760158539, |
| "step": 195, |
| "valid_targets_mean": 3394.8, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 0.4444444444444444, |
| "grad_norm": 1.0429529339999148, |
| "learning_rate": 2.526984126984127e-05, |
| "loss": 0.3146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2936026453971863, |
| "step": 200, |
| "valid_targets_mean": 5333.9, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 0.45555555555555555, |
| "grad_norm": 0.5853756503183534, |
| "learning_rate": 2.5904761904761908e-05, |
| "loss": 0.3152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3078632950782776, |
| "step": 205, |
| "valid_targets_mean": 3632.1, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 0.4666666666666667, |
| "grad_norm": 0.5715675965569004, |
| "learning_rate": 2.653968253968254e-05, |
| "loss": 0.3122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3024342656135559, |
| "step": 210, |
| "valid_targets_mean": 4422.1, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 0.4777777777777778, |
| "grad_norm": 0.6821942507785, |
| "learning_rate": 2.7174603174603178e-05, |
| "loss": 0.3154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36502134799957275, |
| "step": 215, |
| "valid_targets_mean": 3621.6, |
| "valid_targets_min": 239 |
| }, |
| { |
| "epoch": 0.4888888888888889, |
| "grad_norm": 0.6021391191144772, |
| "learning_rate": 2.780952380952381e-05, |
| "loss": 0.28, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25724563002586365, |
| "step": 220, |
| "valid_targets_mean": 4738.3, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 0.5, |
| "grad_norm": 0.5234960619653491, |
| "learning_rate": 2.8444444444444447e-05, |
| "loss": 0.3075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33516725897789, |
| "step": 225, |
| "valid_targets_mean": 4865.0, |
| "valid_targets_min": 231 |
| }, |
| { |
| "epoch": 0.5111111111111111, |
| "grad_norm": 0.547550500956153, |
| "learning_rate": 2.9079365079365082e-05, |
| "loss": 0.2884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29283851385116577, |
| "step": 230, |
| "valid_targets_mean": 4564.4, |
| "valid_targets_min": 1213 |
| }, |
| { |
| "epoch": 0.5222222222222223, |
| "grad_norm": 0.5897013069621678, |
| "learning_rate": 2.9714285714285717e-05, |
| "loss": 0.2937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30815833806991577, |
| "step": 235, |
| "valid_targets_mean": 3828.2, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 0.5333333333333333, |
| "grad_norm": 0.5735263579255174, |
| "learning_rate": 3.034920634920635e-05, |
| "loss": 0.2914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30891531705856323, |
| "step": 240, |
| "valid_targets_mean": 4256.2, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 0.5444444444444444, |
| "grad_norm": 0.5249052908854333, |
| "learning_rate": 3.098412698412699e-05, |
| "loss": 0.308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26125839352607727, |
| "step": 245, |
| "valid_targets_mean": 4620.4, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 0.5555555555555556, |
| "grad_norm": 0.5405962329977203, |
| "learning_rate": 3.161904761904762e-05, |
| "loss": 0.2811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26012593507766724, |
| "step": 250, |
| "valid_targets_mean": 4433.9, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 0.5666666666666667, |
| "grad_norm": 0.8775775341101245, |
| "learning_rate": 3.225396825396826e-05, |
| "loss": 0.2898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23986881971359253, |
| "step": 255, |
| "valid_targets_mean": 3096.6, |
| "valid_targets_min": 606 |
| }, |
| { |
| "epoch": 0.5777777777777777, |
| "grad_norm": 0.540108337375447, |
| "learning_rate": 3.288888888888889e-05, |
| "loss": 0.2962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26411673426628113, |
| "step": 260, |
| "valid_targets_mean": 5320.4, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 0.5888888888888889, |
| "grad_norm": 0.5089656627557569, |
| "learning_rate": 3.352380952380953e-05, |
| "loss": 0.298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2886936664581299, |
| "step": 265, |
| "valid_targets_mean": 5059.9, |
| "valid_targets_min": 2016 |
| }, |
| { |
| "epoch": 0.6, |
| "grad_norm": 0.8577322725171138, |
| "learning_rate": 3.415873015873016e-05, |
| "loss": 0.2903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2848944664001465, |
| "step": 270, |
| "valid_targets_mean": 4490.1, |
| "valid_targets_min": 369 |
| }, |
| { |
| "epoch": 0.6111111111111112, |
| "grad_norm": 0.7839943851011535, |
| "learning_rate": 3.47936507936508e-05, |
| "loss": 0.2766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2646746039390564, |
| "step": 275, |
| "valid_targets_mean": 4372.7, |
| "valid_targets_min": 347 |
| }, |
| { |
| "epoch": 0.6222222222222222, |
| "grad_norm": 0.6552099358054163, |
| "learning_rate": 3.542857142857143e-05, |
| "loss": 0.28, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.279890239238739, |
| "step": 280, |
| "valid_targets_mean": 3361.1, |
| "valid_targets_min": 173 |
| }, |
| { |
| "epoch": 0.6333333333333333, |
| "grad_norm": 0.6470809605687007, |
| "learning_rate": 3.606349206349207e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3344566822052002, |
| "step": 285, |
| "valid_targets_mean": 3997.0, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 0.6444444444444445, |
| "grad_norm": 0.6042965183251453, |
| "learning_rate": 3.66984126984127e-05, |
| "loss": 0.3008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29824304580688477, |
| "step": 290, |
| "valid_targets_mean": 4553.6, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 0.6555555555555556, |
| "grad_norm": 0.9572004588809255, |
| "learning_rate": 3.733333333333334e-05, |
| "loss": 0.2685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2197730839252472, |
| "step": 295, |
| "valid_targets_mean": 4863.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 0.6666666666666666, |
| "grad_norm": 0.613931117239092, |
| "learning_rate": 3.796825396825397e-05, |
| "loss": 0.2869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2734295129776001, |
| "step": 300, |
| "valid_targets_mean": 3048.4, |
| "valid_targets_min": 630 |
| }, |
| { |
| "epoch": 0.6777777777777778, |
| "grad_norm": 0.7225386302879916, |
| "learning_rate": 3.860317460317461e-05, |
| "loss": 0.2635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24375391006469727, |
| "step": 305, |
| "valid_targets_mean": 4168.9, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 0.6888888888888889, |
| "grad_norm": 0.638212930897173, |
| "learning_rate": 3.923809523809524e-05, |
| "loss": 0.2679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2810541093349457, |
| "step": 310, |
| "valid_targets_mean": 3710.6, |
| "valid_targets_min": 275 |
| }, |
| { |
| "epoch": 0.7, |
| "grad_norm": 0.5816992650976073, |
| "learning_rate": 3.9873015873015876e-05, |
| "loss": 0.2778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26782992482185364, |
| "step": 315, |
| "valid_targets_mean": 4587.9, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 0.7111111111111111, |
| "grad_norm": 0.5013466486109508, |
| "learning_rate": 3.999980352246968e-05, |
| "loss": 0.2757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24904786050319672, |
| "step": 320, |
| "valid_targets_mean": 4606.5, |
| "valid_targets_min": 402 |
| }, |
| { |
| "epoch": 0.7222222222222222, |
| "grad_norm": 0.713347061955866, |
| "learning_rate": 3.9999005339118864e-05, |
| "loss": 0.2866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30004629492759705, |
| "step": 325, |
| "valid_targets_mean": 3887.9, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 0.7333333333333333, |
| "grad_norm": 0.47963747379037935, |
| "learning_rate": 3.9997593194586953e-05, |
| "loss": 0.2852, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2432718276977539, |
| "step": 330, |
| "valid_targets_mean": 4275.9, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 0.7444444444444445, |
| "grad_norm": 0.6005660039240017, |
| "learning_rate": 3.99955671322262e-05, |
| "loss": 0.2799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2737639248371124, |
| "step": 335, |
| "valid_targets_mean": 4195.4, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 0.7555555555555555, |
| "grad_norm": 0.5205837688812412, |
| "learning_rate": 3.999292721423588e-05, |
| "loss": 0.2922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3177686035633087, |
| "step": 340, |
| "valid_targets_mean": 5234.1, |
| "valid_targets_min": 460 |
| }, |
| { |
| "epoch": 0.7666666666666667, |
| "grad_norm": 0.5202820975533874, |
| "learning_rate": 3.998967352166037e-05, |
| "loss": 0.2837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27241072058677673, |
| "step": 345, |
| "valid_targets_mean": 4445.9, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 0.7777777777777778, |
| "grad_norm": 0.5301976190091423, |
| "learning_rate": 3.998580615438671e-05, |
| "loss": 0.2983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27598923444747925, |
| "step": 350, |
| "valid_targets_mean": 5029.9, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 0.7888888888888889, |
| "grad_norm": 0.5033260846088292, |
| "learning_rate": 3.998132523114146e-05, |
| "loss": 0.2885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25926336646080017, |
| "step": 355, |
| "valid_targets_mean": 4720.8, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 0.8, |
| "grad_norm": 0.5062497800182023, |
| "learning_rate": 3.9976230889487107e-05, |
| "loss": 0.2716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25432416796684265, |
| "step": 360, |
| "valid_targets_mean": 4968.1, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 0.8111111111111111, |
| "grad_norm": 0.6022554597774316, |
| "learning_rate": 3.997052328581783e-05, |
| "loss": 0.2772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27107948064804077, |
| "step": 365, |
| "valid_targets_mean": 4174.4, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 0.8222222222222222, |
| "grad_norm": 0.523430681701777, |
| "learning_rate": 3.99642025953547e-05, |
| "loss": 0.277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26425060629844666, |
| "step": 370, |
| "valid_targets_mean": 4664.8, |
| "valid_targets_min": 1464 |
| }, |
| { |
| "epoch": 0.8333333333333334, |
| "grad_norm": 0.5063947141064169, |
| "learning_rate": 3.9957269012140306e-05, |
| "loss": 0.2786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2735532522201538, |
| "step": 375, |
| "valid_targets_mean": 4143.1, |
| "valid_targets_min": 428 |
| }, |
| { |
| "epoch": 0.8444444444444444, |
| "grad_norm": 0.5680326007926829, |
| "learning_rate": 3.9949722749032755e-05, |
| "loss": 0.2705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24175962805747986, |
| "step": 380, |
| "valid_targets_mean": 3959.0, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 0.8555555555555555, |
| "grad_norm": 0.5324488584110421, |
| "learning_rate": 3.994156403769922e-05, |
| "loss": 0.2908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25714313983917236, |
| "step": 385, |
| "valid_targets_mean": 4401.1, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 0.8666666666666667, |
| "grad_norm": 0.5577161885914526, |
| "learning_rate": 3.993279312860876e-05, |
| "loss": 0.2549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27009209990501404, |
| "step": 390, |
| "valid_targets_mean": 4610.8, |
| "valid_targets_min": 436 |
| }, |
| { |
| "epoch": 0.8777777777777778, |
| "grad_norm": 0.4942352058414063, |
| "learning_rate": 3.9923410291024636e-05, |
| "loss": 0.2673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.271714985370636, |
| "step": 395, |
| "valid_targets_mean": 4242.4, |
| "valid_targets_min": 241 |
| }, |
| { |
| "epoch": 0.8888888888888888, |
| "grad_norm": 0.49807037133844223, |
| "learning_rate": 3.991341581299609e-05, |
| "loss": 0.2625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2850569486618042, |
| "step": 400, |
| "valid_targets_mean": 5568.6, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 0.9, |
| "grad_norm": 0.516015376982657, |
| "learning_rate": 3.990281000134946e-05, |
| "loss": 0.2851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2795839309692383, |
| "step": 405, |
| "valid_targets_mean": 4242.3, |
| "valid_targets_min": 317 |
| }, |
| { |
| "epoch": 0.9111111111111111, |
| "grad_norm": 0.4858123801723977, |
| "learning_rate": 3.989159318167875e-05, |
| "loss": 0.281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2678981423377991, |
| "step": 410, |
| "valid_targets_mean": 5212.5, |
| "valid_targets_min": 419 |
| }, |
| { |
| "epoch": 0.9222222222222223, |
| "grad_norm": 0.5792943773685142, |
| "learning_rate": 3.9879765698335705e-05, |
| "loss": 0.258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24788373708724976, |
| "step": 415, |
| "valid_targets_mean": 4014.3, |
| "valid_targets_min": 1329 |
| }, |
| { |
| "epoch": 0.9333333333333333, |
| "grad_norm": 0.5323729594389564, |
| "learning_rate": 3.986732791441915e-05, |
| "loss": 0.2765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29175180196762085, |
| "step": 420, |
| "valid_targets_mean": 4264.8, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 0.9444444444444444, |
| "grad_norm": 0.5230426930677612, |
| "learning_rate": 3.985428021176391e-05, |
| "loss": 0.2613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22425571084022522, |
| "step": 425, |
| "valid_targets_mean": 4607.9, |
| "valid_targets_min": 214 |
| }, |
| { |
| "epoch": 0.9555555555555556, |
| "grad_norm": 0.5587632060354308, |
| "learning_rate": 3.984062299092904e-05, |
| "loss": 0.2607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2455931007862091, |
| "step": 430, |
| "valid_targets_mean": 3599.4, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 0.9666666666666667, |
| "grad_norm": 0.5416728906416407, |
| "learning_rate": 3.982635667118557e-05, |
| "loss": 0.2771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2705487310886383, |
| "step": 435, |
| "valid_targets_mean": 4116.0, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 0.9777777777777777, |
| "grad_norm": 0.5360254523319351, |
| "learning_rate": 3.981148169050361e-05, |
| "loss": 0.2749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24848337471485138, |
| "step": 440, |
| "valid_targets_mean": 3970.2, |
| "valid_targets_min": 499 |
| }, |
| { |
| "epoch": 0.9888888888888889, |
| "grad_norm": 0.5253145463662034, |
| "learning_rate": 3.97959985055389e-05, |
| "loss": 0.3032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3328373432159424, |
| "step": 445, |
| "valid_targets_mean": 5336.6, |
| "valid_targets_min": 1847 |
| }, |
| { |
| "epoch": 1.0, |
| "grad_norm": 0.48196208890145337, |
| "learning_rate": 3.97799075916188e-05, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27850598096847534, |
| "step": 450, |
| "valid_targets_mean": 5520.2, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 1.011111111111111, |
| "grad_norm": 0.6252822658746067, |
| "learning_rate": 3.976320944272773e-05, |
| "loss": 0.2498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2661787271499634, |
| "step": 455, |
| "valid_targets_mean": 4193.9, |
| "valid_targets_min": 381 |
| }, |
| { |
| "epoch": 1.0222222222222221, |
| "grad_norm": 0.4701033558777485, |
| "learning_rate": 3.9745904571491916e-05, |
| "loss": 0.2431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.252180814743042, |
| "step": 460, |
| "valid_targets_mean": 5736.6, |
| "valid_targets_min": 1675 |
| }, |
| { |
| "epoch": 1.0333333333333334, |
| "grad_norm": 0.8485213019287988, |
| "learning_rate": 3.972799350916375e-05, |
| "loss": 0.2631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27109605073928833, |
| "step": 465, |
| "valid_targets_mean": 4100.7, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 1.0444444444444445, |
| "grad_norm": 0.5743499080820584, |
| "learning_rate": 3.970947680560543e-05, |
| "loss": 0.2568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26906871795654297, |
| "step": 470, |
| "valid_targets_mean": 3466.4, |
| "valid_targets_min": 357 |
| }, |
| { |
| "epoch": 1.0555555555555556, |
| "grad_norm": 0.5031824328141823, |
| "learning_rate": 3.969035502927208e-05, |
| "loss": 0.2522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2581416368484497, |
| "step": 475, |
| "valid_targets_mean": 4564.5, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 1.0666666666666667, |
| "grad_norm": 0.5700693169245215, |
| "learning_rate": 3.967062876719433e-05, |
| "loss": 0.2625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2493741810321808, |
| "step": 480, |
| "valid_targets_mean": 4157.4, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 1.0777777777777777, |
| "grad_norm": 0.7056940332930607, |
| "learning_rate": 3.965029862496023e-05, |
| "loss": 0.275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24406126141548157, |
| "step": 485, |
| "valid_targets_mean": 3929.6, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 1.0888888888888888, |
| "grad_norm": 0.6063202867573172, |
| "learning_rate": 3.962936522669674e-05, |
| "loss": 0.274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3029976487159729, |
| "step": 490, |
| "valid_targets_mean": 4941.8, |
| "valid_targets_min": 173 |
| }, |
| { |
| "epoch": 1.1, |
| "grad_norm": 1.6432217580814634, |
| "learning_rate": 3.960782921505052e-05, |
| "loss": 0.2376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26101475954055786, |
| "step": 495, |
| "valid_targets_mean": 4462.2, |
| "valid_targets_min": 1231 |
| }, |
| { |
| "epoch": 1.1111111111111112, |
| "grad_norm": 0.45742604503694995, |
| "learning_rate": 3.9585691251168205e-05, |
| "loss": 0.2534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24371081590652466, |
| "step": 500, |
| "valid_targets_mean": 5317.8, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 1.1222222222222222, |
| "grad_norm": 0.583691622746648, |
| "learning_rate": 3.9562952014676116e-05, |
| "loss": 0.246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2584843039512634, |
| "step": 505, |
| "valid_targets_mean": 3938.7, |
| "valid_targets_min": 242 |
| }, |
| { |
| "epoch": 1.1333333333333333, |
| "grad_norm": 0.5669510869721377, |
| "learning_rate": 3.95396122036594e-05, |
| "loss": 0.25, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24399635195732117, |
| "step": 510, |
| "valid_targets_mean": 3737.6, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 1.1444444444444444, |
| "grad_norm": 0.5041490688945235, |
| "learning_rate": 3.951567253464058e-05, |
| "loss": 0.271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2624698877334595, |
| "step": 515, |
| "valid_targets_mean": 4929.1, |
| "valid_targets_min": 229 |
| }, |
| { |
| "epoch": 1.1555555555555554, |
| "grad_norm": 0.6300993096751855, |
| "learning_rate": 3.949113374255759e-05, |
| "loss": 0.2305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.253865510225296, |
| "step": 520, |
| "valid_targets_mean": 3452.0, |
| "valid_targets_min": 350 |
| }, |
| { |
| "epoch": 1.1666666666666667, |
| "grad_norm": 0.6297449586516455, |
| "learning_rate": 3.946599658074117e-05, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2540290951728821, |
| "step": 525, |
| "valid_targets_mean": 4043.3, |
| "valid_targets_min": 377 |
| }, |
| { |
| "epoch": 1.1777777777777778, |
| "grad_norm": 0.6443213997898508, |
| "learning_rate": 3.94402618208918e-05, |
| "loss": 0.2753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33983704447746277, |
| "step": 530, |
| "valid_targets_mean": 4571.4, |
| "valid_targets_min": 332 |
| }, |
| { |
| "epoch": 1.1888888888888889, |
| "grad_norm": 0.4851613432195201, |
| "learning_rate": 3.9413930253055925e-05, |
| "loss": 0.2515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2413058876991272, |
| "step": 535, |
| "valid_targets_mean": 5014.4, |
| "valid_targets_min": 1004 |
| }, |
| { |
| "epoch": 1.2, |
| "grad_norm": 0.5924543065212132, |
| "learning_rate": 3.938700268560179e-05, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26164644956588745, |
| "step": 540, |
| "valid_targets_mean": 5537.7, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 1.211111111111111, |
| "grad_norm": 0.5348562981348433, |
| "learning_rate": 3.935947994519455e-05, |
| "loss": 0.2473, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22140653431415558, |
| "step": 545, |
| "valid_targets_mean": 3933.1, |
| "valid_targets_min": 326 |
| }, |
| { |
| "epoch": 1.2222222222222223, |
| "grad_norm": 1.1507409216365962, |
| "learning_rate": 3.933136287677095e-05, |
| "loss": 0.2797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2999425530433655, |
| "step": 550, |
| "valid_targets_mean": 4136.8, |
| "valid_targets_min": 393 |
| }, |
| { |
| "epoch": 1.2333333333333334, |
| "grad_norm": 0.6036157268361829, |
| "learning_rate": 3.9302652343513325e-05, |
| "loss": 0.251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24191945791244507, |
| "step": 555, |
| "valid_targets_mean": 3355.1, |
| "valid_targets_min": 354 |
| }, |
| { |
| "epoch": 1.2444444444444445, |
| "grad_norm": 0.5594737690815887, |
| "learning_rate": 3.927334922682319e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2738354802131653, |
| "step": 560, |
| "valid_targets_mean": 4464.2, |
| "valid_targets_min": 341 |
| }, |
| { |
| "epoch": 1.2555555555555555, |
| "grad_norm": 0.60403245110363, |
| "learning_rate": 3.924345442629405e-05, |
| "loss": 0.2414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22148557007312775, |
| "step": 565, |
| "valid_targets_mean": 3713.0, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 1.2666666666666666, |
| "grad_norm": 0.5326475987050822, |
| "learning_rate": 3.9212968859683924e-05, |
| "loss": 0.239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2524668276309967, |
| "step": 570, |
| "valid_targets_mean": 4112.8, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 1.2777777777777777, |
| "grad_norm": 0.5255254450372632, |
| "learning_rate": 3.918189346288708e-05, |
| "loss": 0.249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25053149461746216, |
| "step": 575, |
| "valid_targets_mean": 4201.0, |
| "valid_targets_min": 359 |
| }, |
| { |
| "epoch": 1.2888888888888888, |
| "grad_norm": 0.5460490711902419, |
| "learning_rate": 3.9150229189905325e-05, |
| "loss": 0.2513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2665417790412903, |
| "step": 580, |
| "valid_targets_mean": 4447.8, |
| "valid_targets_min": 384 |
| }, |
| { |
| "epoch": 1.3, |
| "grad_norm": 0.8958369211208952, |
| "learning_rate": 3.911797701281872e-05, |
| "loss": 0.2594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27293702960014343, |
| "step": 585, |
| "valid_targets_mean": 3628.9, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 1.3111111111111111, |
| "grad_norm": 0.5988510933683479, |
| "learning_rate": 3.9085137921755765e-05, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2321304976940155, |
| "step": 590, |
| "valid_targets_mean": 3787.6, |
| "valid_targets_min": 500 |
| }, |
| { |
| "epoch": 1.3222222222222222, |
| "grad_norm": 0.5432482040922059, |
| "learning_rate": 3.9051712924862926e-05, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26185327768325806, |
| "step": 595, |
| "valid_targets_mean": 5390.7, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 1.3333333333333333, |
| "grad_norm": 0.5377831944060099, |
| "learning_rate": 3.901770304827379e-05, |
| "loss": 0.2529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22949066758155823, |
| "step": 600, |
| "valid_targets_mean": 4550.2, |
| "valid_targets_min": 214 |
| }, |
| { |
| "epoch": 1.3444444444444446, |
| "grad_norm": 0.5612439217393881, |
| "learning_rate": 3.898310933607746e-05, |
| "loss": 0.2753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2890508472919464, |
| "step": 605, |
| "valid_targets_mean": 4195.9, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 1.3555555555555556, |
| "grad_norm": 0.5303766289315424, |
| "learning_rate": 3.8947932850286585e-05, |
| "loss": 0.2389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.264137327671051, |
| "step": 610, |
| "valid_targets_mean": 4352.6, |
| "valid_targets_min": 335 |
| }, |
| { |
| "epoch": 1.3666666666666667, |
| "grad_norm": 0.5137510782550517, |
| "learning_rate": 3.891217467080472e-05, |
| "loss": 0.2505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23932068049907684, |
| "step": 615, |
| "valid_targets_mean": 4644.5, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 1.3777777777777778, |
| "grad_norm": 0.47391135683532554, |
| "learning_rate": 3.887583589539315e-05, |
| "loss": 0.2465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.255960613489151, |
| "step": 620, |
| "valid_targets_mean": 4816.4, |
| "valid_targets_min": 579 |
| }, |
| { |
| "epoch": 1.3888888888888888, |
| "grad_norm": 0.5572300753645717, |
| "learning_rate": 3.883891763963723e-05, |
| "loss": 0.2529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2373078167438507, |
| "step": 625, |
| "valid_targets_mean": 3751.8, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 1.4, |
| "grad_norm": 0.49937213169450123, |
| "learning_rate": 3.880142103691213e-05, |
| "loss": 0.2341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23268617689609528, |
| "step": 630, |
| "valid_targets_mean": 4873.1, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 1.411111111111111, |
| "grad_norm": 0.5406692441975431, |
| "learning_rate": 3.876334723834802e-05, |
| "loss": 0.2561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2593476176261902, |
| "step": 635, |
| "valid_targets_mean": 4517.7, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 1.4222222222222223, |
| "grad_norm": 0.553445249581852, |
| "learning_rate": 3.872469741279475e-05, |
| "loss": 0.2496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2700212597846985, |
| "step": 640, |
| "valid_targets_mean": 3890.1, |
| "valid_targets_min": 490 |
| }, |
| { |
| "epoch": 1.4333333333333333, |
| "grad_norm": 0.5301037730927833, |
| "learning_rate": 3.868547274678595e-05, |
| "loss": 0.2535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2927553057670593, |
| "step": 645, |
| "valid_targets_mean": 4392.2, |
| "valid_targets_min": 423 |
| }, |
| { |
| "epoch": 1.4444444444444444, |
| "grad_norm": 0.44259558229551654, |
| "learning_rate": 3.864567444450263e-05, |
| "loss": 0.2524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24536505341529846, |
| "step": 650, |
| "valid_targets_mean": 6347.3, |
| "valid_targets_min": 1877 |
| }, |
| { |
| "epoch": 1.4555555555555555, |
| "grad_norm": 0.47771864860111035, |
| "learning_rate": 3.8605303727736186e-05, |
| "loss": 0.2434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22662869095802307, |
| "step": 655, |
| "valid_targets_mean": 4389.6, |
| "valid_targets_min": 352 |
| }, |
| { |
| "epoch": 1.4666666666666668, |
| "grad_norm": 0.6247118916552183, |
| "learning_rate": 3.856436183585089e-05, |
| "loss": 0.2638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.283000111579895, |
| "step": 660, |
| "valid_targets_mean": 4078.9, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 1.4777777777777779, |
| "grad_norm": 1.5070723708006228, |
| "learning_rate": 3.8522850025745885e-05, |
| "loss": 0.2584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25614166259765625, |
| "step": 665, |
| "valid_targets_mean": 5278.3, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 1.488888888888889, |
| "grad_norm": 0.628570473741109, |
| "learning_rate": 3.8480769571816535e-05, |
| "loss": 0.2516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29474788904190063, |
| "step": 670, |
| "valid_targets_mean": 3874.1, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 1.5, |
| "grad_norm": 0.8699623629541559, |
| "learning_rate": 3.843812176591535e-05, |
| "loss": 0.2382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22753040492534637, |
| "step": 675, |
| "valid_targets_mean": 3918.7, |
| "valid_targets_min": 309 |
| }, |
| { |
| "epoch": 1.511111111111111, |
| "grad_norm": 0.5112871185355921, |
| "learning_rate": 3.8394907917312314e-05, |
| "loss": 0.2391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22634285688400269, |
| "step": 680, |
| "valid_targets_mean": 4564.2, |
| "valid_targets_min": 406 |
| }, |
| { |
| "epoch": 1.5222222222222221, |
| "grad_norm": 0.47954206990442566, |
| "learning_rate": 3.835112935265468e-05, |
| "loss": 0.2412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2335192710161209, |
| "step": 685, |
| "valid_targets_mean": 4790.6, |
| "valid_targets_min": 337 |
| }, |
| { |
| "epoch": 1.5333333333333332, |
| "grad_norm": 0.48528209028878294, |
| "learning_rate": 3.830678741592625e-05, |
| "loss": 0.2358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23643608391284943, |
| "step": 690, |
| "valid_targets_mean": 4443.8, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 1.5444444444444443, |
| "grad_norm": 0.6276984597487912, |
| "learning_rate": 3.826188346840611e-05, |
| "loss": 0.262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2579842805862427, |
| "step": 695, |
| "valid_targets_mean": 3282.2, |
| "valid_targets_min": 352 |
| }, |
| { |
| "epoch": 1.5555555555555556, |
| "grad_norm": 0.5476067080880181, |
| "learning_rate": 3.8216418888626864e-05, |
| "loss": 0.2439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24156105518341064, |
| "step": 700, |
| "valid_targets_mean": 4612.9, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 1.5666666666666667, |
| "grad_norm": 0.5413141061562579, |
| "learning_rate": 3.817039507233227e-05, |
| "loss": 0.2569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2622939646244049, |
| "step": 705, |
| "valid_targets_mean": 4257.5, |
| "valid_targets_min": 286 |
| }, |
| { |
| "epoch": 1.5777777777777777, |
| "grad_norm": 0.5191592586122504, |
| "learning_rate": 3.812381343243444e-05, |
| "loss": 0.2376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2551836371421814, |
| "step": 710, |
| "valid_targets_mean": 4099.2, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 1.588888888888889, |
| "grad_norm": 0.6436243723923792, |
| "learning_rate": 3.807667539897041e-05, |
| "loss": 0.238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.227070152759552, |
| "step": 715, |
| "valid_targets_mean": 3246.0, |
| "valid_targets_min": 348 |
| }, |
| { |
| "epoch": 1.6, |
| "grad_norm": 0.6239016531037459, |
| "learning_rate": 3.8028982419058304e-05, |
| "loss": 0.2585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26668721437454224, |
| "step": 720, |
| "valid_targets_mean": 3396.3, |
| "valid_targets_min": 248 |
| }, |
| { |
| "epoch": 1.6111111111111112, |
| "grad_norm": 0.9192051442781469, |
| "learning_rate": 3.798073595685283e-05, |
| "loss": 0.2473, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25195956230163574, |
| "step": 725, |
| "valid_targets_mean": 3665.6, |
| "valid_targets_min": 272 |
| }, |
| { |
| "epoch": 1.6222222222222222, |
| "grad_norm": 0.5623905152284274, |
| "learning_rate": 3.793193749350042e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23393118381500244, |
| "step": 730, |
| "valid_targets_mean": 5211.4, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 1.6333333333333333, |
| "grad_norm": 0.5429518143801225, |
| "learning_rate": 3.788258852709367e-05, |
| "loss": 0.2593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22861596941947937, |
| "step": 735, |
| "valid_targets_mean": 5047.1, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 1.6444444444444444, |
| "grad_norm": 0.47826555516018626, |
| "learning_rate": 3.7832690572625417e-05, |
| "loss": 0.2193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21526125073432922, |
| "step": 740, |
| "valid_targets_mean": 4602.2, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 1.6555555555555554, |
| "grad_norm": 0.5863707657883438, |
| "learning_rate": 3.77822451619422e-05, |
| "loss": 0.2603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2455175220966339, |
| "step": 745, |
| "valid_targets_mean": 4632.7, |
| "valid_targets_min": 413 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.5169118790673137, |
| "learning_rate": 3.773125384369723e-05, |
| "loss": 0.2438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27260589599609375, |
| "step": 750, |
| "valid_targets_mean": 4461.6, |
| "valid_targets_min": 331 |
| }, |
| { |
| "epoch": 1.6777777777777778, |
| "grad_norm": 0.5608117782474311, |
| "learning_rate": 3.7679718183302856e-05, |
| "loss": 0.2519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25778332352638245, |
| "step": 755, |
| "valid_targets_mean": 4585.0, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 1.6888888888888889, |
| "grad_norm": 0.5536343736249013, |
| "learning_rate": 3.762763976288252e-05, |
| "loss": 0.261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26178520917892456, |
| "step": 760, |
| "valid_targets_mean": 4168.1, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 1.7, |
| "grad_norm": 0.4967067858273974, |
| "learning_rate": 3.757502018122215e-05, |
| "loss": 0.2604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23201864957809448, |
| "step": 765, |
| "valid_targets_mean": 4762.7, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 1.7111111111111112, |
| "grad_norm": 0.6431920727054683, |
| "learning_rate": 3.7521861053721104e-05, |
| "loss": 0.2734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3084906339645386, |
| "step": 770, |
| "valid_targets_mean": 3282.1, |
| "valid_targets_min": 355 |
| }, |
| { |
| "epoch": 1.7222222222222223, |
| "grad_norm": 0.49539913031077976, |
| "learning_rate": 3.74681640123426e-05, |
| "loss": 0.2436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2623264789581299, |
| "step": 775, |
| "valid_targets_mean": 4743.1, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 1.7333333333333334, |
| "grad_norm": 0.5255901704167366, |
| "learning_rate": 3.741393070556355e-05, |
| "loss": 0.2469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25359559059143066, |
| "step": 780, |
| "valid_targets_mean": 4230.9, |
| "valid_targets_min": 932 |
| }, |
| { |
| "epoch": 1.7444444444444445, |
| "grad_norm": 0.5202593209519554, |
| "learning_rate": 3.7359162798324015e-05, |
| "loss": 0.2451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3075648546218872, |
| "step": 785, |
| "valid_targets_mean": 4931.7, |
| "valid_targets_min": 426 |
| }, |
| { |
| "epoch": 1.7555555555555555, |
| "grad_norm": 0.6052760837991578, |
| "learning_rate": 3.7303861971976074e-05, |
| "loss": 0.2645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21487626433372498, |
| "step": 790, |
| "valid_targets_mean": 3999.6, |
| "valid_targets_min": 414 |
| }, |
| { |
| "epoch": 1.7666666666666666, |
| "grad_norm": 0.5902290421718297, |
| "learning_rate": 3.724802992423218e-05, |
| "loss": 0.2541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24608749151229858, |
| "step": 795, |
| "valid_targets_mean": 3589.3, |
| "valid_targets_min": 301 |
| }, |
| { |
| "epoch": 1.7777777777777777, |
| "grad_norm": 0.6368794220763241, |
| "learning_rate": 3.719166836911309e-05, |
| "loss": 0.2563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25677546858787537, |
| "step": 800, |
| "valid_targets_mean": 4686.3, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 1.7888888888888888, |
| "grad_norm": 0.5323661851044132, |
| "learning_rate": 3.713477903689518e-05, |
| "loss": 0.2532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2390604317188263, |
| "step": 805, |
| "valid_targets_mean": 4084.9, |
| "valid_targets_min": 339 |
| }, |
| { |
| "epoch": 1.8, |
| "grad_norm": 0.5186885779998889, |
| "learning_rate": 3.707736367405741e-05, |
| "loss": 0.2542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22952812910079956, |
| "step": 810, |
| "valid_targets_mean": 3964.5, |
| "valid_targets_min": 238 |
| }, |
| { |
| "epoch": 1.8111111111111111, |
| "grad_norm": 0.6011432502817368, |
| "learning_rate": 3.701942404322764e-05, |
| "loss": 0.2443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28318285942077637, |
| "step": 815, |
| "valid_targets_mean": 4504.8, |
| "valid_targets_min": 401 |
| }, |
| { |
| "epoch": 1.8222222222222222, |
| "grad_norm": 0.5057107246393668, |
| "learning_rate": 3.696096192312852e-05, |
| "loss": 0.2468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2750961482524872, |
| "step": 820, |
| "valid_targets_mean": 4184.1, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 1.8333333333333335, |
| "grad_norm": 0.5674106572096047, |
| "learning_rate": 3.690197910852294e-05, |
| "loss": 0.2688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.284572958946228, |
| "step": 825, |
| "valid_targets_mean": 4159.1, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 1.8444444444444446, |
| "grad_norm": 0.524428929125523, |
| "learning_rate": 3.684247741015888e-05, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2377292364835739, |
| "step": 830, |
| "valid_targets_mean": 4545.5, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 1.8555555555555556, |
| "grad_norm": 0.5197318284715093, |
| "learning_rate": 3.678245865471383e-05, |
| "loss": 0.2482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25039640069007874, |
| "step": 835, |
| "valid_targets_mean": 3829.6, |
| "valid_targets_min": 436 |
| }, |
| { |
| "epoch": 1.8666666666666667, |
| "grad_norm": 0.741122146720882, |
| "learning_rate": 3.672192468473872e-05, |
| "loss": 0.2437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25348931550979614, |
| "step": 840, |
| "valid_targets_mean": 3802.5, |
| "valid_targets_min": 494 |
| }, |
| { |
| "epoch": 1.8777777777777778, |
| "grad_norm": 0.5653997003973549, |
| "learning_rate": 3.666087735860138e-05, |
| "loss": 0.2422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23701179027557373, |
| "step": 845, |
| "valid_targets_mean": 4565.3, |
| "valid_targets_min": 441 |
| }, |
| { |
| "epoch": 1.8888888888888888, |
| "grad_norm": 0.47961375383032556, |
| "learning_rate": 3.6599318550429415e-05, |
| "loss": 0.2504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28315088152885437, |
| "step": 850, |
| "valid_targets_mean": 4855.1, |
| "valid_targets_min": 356 |
| }, |
| { |
| "epoch": 1.9, |
| "grad_norm": 0.4960630224668749, |
| "learning_rate": 3.653725015005275e-05, |
| "loss": 0.2358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24288593232631683, |
| "step": 855, |
| "valid_targets_mean": 4795.5, |
| "valid_targets_min": 193 |
| }, |
| { |
| "epoch": 1.911111111111111, |
| "grad_norm": 0.5198260135949281, |
| "learning_rate": 3.6474674062945573e-05, |
| "loss": 0.2466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2727063298225403, |
| "step": 860, |
| "valid_targets_mean": 5094.9, |
| "valid_targets_min": 339 |
| }, |
| { |
| "epoch": 1.9222222222222223, |
| "grad_norm": 0.963664843983337, |
| "learning_rate": 3.6411592210167834e-05, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2163504958152771, |
| "step": 865, |
| "valid_targets_mean": 4430.9, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 1.9333333333333333, |
| "grad_norm": 0.5387347139824947, |
| "learning_rate": 3.6348006528306295e-05, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24510449171066284, |
| "step": 870, |
| "valid_targets_mean": 4382.1, |
| "valid_targets_min": 503 |
| }, |
| { |
| "epoch": 1.9444444444444444, |
| "grad_norm": 0.499809810495946, |
| "learning_rate": 3.628391896941505e-05, |
| "loss": 0.2349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22553254663944244, |
| "step": 875, |
| "valid_targets_mean": 4035.4, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 1.9555555555555557, |
| "grad_norm": 0.5218149844142983, |
| "learning_rate": 3.621933150095561e-05, |
| "loss": 0.2662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25849276781082153, |
| "step": 880, |
| "valid_targets_mean": 3824.7, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 1.9666666666666668, |
| "grad_norm": 0.5123574858401871, |
| "learning_rate": 3.615424610573651e-05, |
| "loss": 0.2681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28296032547950745, |
| "step": 885, |
| "valid_targets_mean": 4234.2, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 1.9777777777777779, |
| "grad_norm": 0.5240352817270689, |
| "learning_rate": 3.608866478185245e-05, |
| "loss": 0.2466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2798116207122803, |
| "step": 890, |
| "valid_targets_mean": 4745.1, |
| "valid_targets_min": 438 |
| }, |
| { |
| "epoch": 1.988888888888889, |
| "grad_norm": 0.47021296088948716, |
| "learning_rate": 3.602258954262287e-05, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24416977167129517, |
| "step": 895, |
| "valid_targets_mean": 4577.2, |
| "valid_targets_min": 272 |
| }, |
| { |
| "epoch": 2.0, |
| "grad_norm": 0.5152852896564755, |
| "learning_rate": 3.595602241653028e-05, |
| "loss": 0.248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.227662593126297, |
| "step": 900, |
| "valid_targets_mean": 3932.9, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 2.011111111111111, |
| "grad_norm": 0.8269495388300478, |
| "learning_rate": 3.588896544715787e-05, |
| "loss": 0.2363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2364978790283203, |
| "step": 905, |
| "valid_targets_mean": 4779.8, |
| "valid_targets_min": 1630 |
| }, |
| { |
| "epoch": 2.022222222222222, |
| "grad_norm": 0.5822111147854571, |
| "learning_rate": 3.5821420693126834e-05, |
| "loss": 0.2403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2130419909954071, |
| "step": 910, |
| "valid_targets_mean": 3855.6, |
| "valid_targets_min": 311 |
| }, |
| { |
| "epoch": 2.033333333333333, |
| "grad_norm": 0.503530838011803, |
| "learning_rate": 3.575339022803313e-05, |
| "loss": 0.2336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1974865049123764, |
| "step": 915, |
| "valid_targets_mean": 3615.4, |
| "valid_targets_min": 242 |
| }, |
| { |
| "epoch": 2.0444444444444443, |
| "grad_norm": 0.5881001614957597, |
| "learning_rate": 3.5684876140383875e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2469121217727661, |
| "step": 920, |
| "valid_targets_mean": 4366.9, |
| "valid_targets_min": 450 |
| }, |
| { |
| "epoch": 2.0555555555555554, |
| "grad_norm": 0.5375060558594457, |
| "learning_rate": 3.561588053353319e-05, |
| "loss": 0.2174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21924357116222382, |
| "step": 925, |
| "valid_targets_mean": 4148.6, |
| "valid_targets_min": 1350 |
| }, |
| { |
| "epoch": 2.066666666666667, |
| "grad_norm": 0.5123963351563102, |
| "learning_rate": 3.554640552561761e-05, |
| "loss": 0.22, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21245072782039642, |
| "step": 930, |
| "valid_targets_mean": 3831.3, |
| "valid_targets_min": 441 |
| }, |
| { |
| "epoch": 2.077777777777778, |
| "grad_norm": 0.5890369925664793, |
| "learning_rate": 3.5476453249491125e-05, |
| "loss": 0.2297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22979292273521423, |
| "step": 935, |
| "valid_targets_mean": 4769.4, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 2.088888888888889, |
| "grad_norm": 0.5822543746194564, |
| "learning_rate": 3.5406025852659626e-05, |
| "loss": 0.2005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22272920608520508, |
| "step": 940, |
| "valid_targets_mean": 3913.2, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 2.1, |
| "grad_norm": 0.5062356595758193, |
| "learning_rate": 3.533512549721503e-05, |
| "loss": 0.2129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19117265939712524, |
| "step": 945, |
| "valid_targets_mean": 4397.1, |
| "valid_targets_min": 379 |
| }, |
| { |
| "epoch": 2.111111111111111, |
| "grad_norm": 0.5053075095700746, |
| "learning_rate": 3.5263754359768896e-05, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2279876470565796, |
| "step": 950, |
| "valid_targets_mean": 4971.6, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 2.1222222222222222, |
| "grad_norm": 0.48516711141414565, |
| "learning_rate": 3.5191914631385565e-05, |
| "loss": 0.2184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2130102515220642, |
| "step": 955, |
| "valid_targets_mean": 4136.3, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 2.1333333333333333, |
| "grad_norm": 0.5779110961074571, |
| "learning_rate": 3.511960851751496e-05, |
| "loss": 0.2139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2052951157093048, |
| "step": 960, |
| "valid_targets_mean": 3846.1, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 2.1444444444444444, |
| "grad_norm": 0.5423358183039504, |
| "learning_rate": 3.504683823792483e-05, |
| "loss": 0.231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20998695492744446, |
| "step": 965, |
| "valid_targets_mean": 3942.2, |
| "valid_targets_min": 283 |
| }, |
| { |
| "epoch": 2.1555555555555554, |
| "grad_norm": 0.4731164937857403, |
| "learning_rate": 3.49736060266326e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20602105557918549, |
| "step": 970, |
| "valid_targets_mean": 4549.1, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 2.1666666666666665, |
| "grad_norm": 0.5192629974349211, |
| "learning_rate": 3.489991413183686e-05, |
| "loss": 0.2077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1989196240901947, |
| "step": 975, |
| "valid_targets_mean": 4872.6, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 2.1777777777777776, |
| "grad_norm": 0.5443326064321022, |
| "learning_rate": 3.482576481584824e-05, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2225218117237091, |
| "step": 980, |
| "valid_targets_mean": 3649.8, |
| "valid_targets_min": 546 |
| }, |
| { |
| "epoch": 2.188888888888889, |
| "grad_norm": 0.5020893394971628, |
| "learning_rate": 3.4751160355020034e-05, |
| "loss": 0.2094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23120808601379395, |
| "step": 985, |
| "valid_targets_mean": 4243.1, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 2.2, |
| "grad_norm": 0.48166947840338786, |
| "learning_rate": 3.467610303967829e-05, |
| "loss": 0.2195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18600469827651978, |
| "step": 990, |
| "valid_targets_mean": 5170.1, |
| "valid_targets_min": 1719 |
| }, |
| { |
| "epoch": 2.2111111111111112, |
| "grad_norm": 0.5583920558407086, |
| "learning_rate": 3.4600595174051496e-05, |
| "loss": 0.248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27588558197021484, |
| "step": 995, |
| "valid_targets_mean": 4328.1, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 2.2222222222222223, |
| "grad_norm": 0.5416793417738504, |
| "learning_rate": 3.452463907619986e-05, |
| "loss": 0.2202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24462614953517914, |
| "step": 1000, |
| "valid_targets_mean": 4362.1, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 2.2333333333333334, |
| "grad_norm": 0.5328060833599986, |
| "learning_rate": 3.444823707794414e-05, |
| "loss": 0.2321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2523013949394226, |
| "step": 1005, |
| "valid_targets_mean": 4839.0, |
| "valid_targets_min": 352 |
| }, |
| { |
| "epoch": 2.2444444444444445, |
| "grad_norm": 0.563391734301446, |
| "learning_rate": 3.437139152479403e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19773298501968384, |
| "step": 1010, |
| "valid_targets_mean": 4385.2, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 2.2555555555555555, |
| "grad_norm": 0.5074311551875781, |
| "learning_rate": 3.429410477587619e-05, |
| "loss": 0.2146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2079458087682724, |
| "step": 1015, |
| "valid_targets_mean": 4402.8, |
| "valid_targets_min": 270 |
| }, |
| { |
| "epoch": 2.2666666666666666, |
| "grad_norm": 0.44755347145933255, |
| "learning_rate": 3.4216379203861785e-05, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20723801851272583, |
| "step": 1020, |
| "valid_targets_mean": 6327.4, |
| "valid_targets_min": 2089 |
| }, |
| { |
| "epoch": 2.2777777777777777, |
| "grad_norm": 0.5637924379901195, |
| "learning_rate": 3.41382171948937e-05, |
| "loss": 0.2394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2707464098930359, |
| "step": 1025, |
| "valid_targets_mean": 4543.5, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 2.2888888888888888, |
| "grad_norm": 0.5493222833081342, |
| "learning_rate": 3.405962114851324e-05, |
| "loss": 0.2265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23270747065544128, |
| "step": 1030, |
| "valid_targets_mean": 3841.1, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 2.3, |
| "grad_norm": 0.5377176986106669, |
| "learning_rate": 3.398059347758647e-05, |
| "loss": 0.2384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2036696970462799, |
| "step": 1035, |
| "valid_targets_mean": 3737.5, |
| "valid_targets_min": 443 |
| }, |
| { |
| "epoch": 2.311111111111111, |
| "grad_norm": 0.48575675539344104, |
| "learning_rate": 3.3901136608230166e-05, |
| "loss": 0.2424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24168801307678223, |
| "step": 1040, |
| "valid_targets_mean": 5109.9, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 2.3222222222222224, |
| "grad_norm": 0.5389208075547236, |
| "learning_rate": 3.38212529797373e-05, |
| "loss": 0.2259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2333628237247467, |
| "step": 1045, |
| "valid_targets_mean": 4541.2, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 2.3333333333333335, |
| "grad_norm": 0.6380380157616352, |
| "learning_rate": 3.374094504450218e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21096259355545044, |
| "step": 1050, |
| "valid_targets_mean": 2654.1, |
| "valid_targets_min": 218 |
| }, |
| { |
| "epoch": 2.3444444444444446, |
| "grad_norm": 0.5618636585728415, |
| "learning_rate": 3.366021526794517e-05, |
| "loss": 0.2289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22567206621170044, |
| "step": 1055, |
| "valid_targets_mean": 3951.7, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 2.3555555555555556, |
| "grad_norm": 0.590035420993425, |
| "learning_rate": 3.357906612843697e-05, |
| "loss": 0.2224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22020503878593445, |
| "step": 1060, |
| "valid_targets_mean": 3162.4, |
| "valid_targets_min": 248 |
| }, |
| { |
| "epoch": 2.3666666666666667, |
| "grad_norm": 0.5197847274605225, |
| "learning_rate": 3.349750011722256e-05, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23694512248039246, |
| "step": 1065, |
| "valid_targets_mean": 4473.9, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 2.3777777777777778, |
| "grad_norm": 0.5902730606680944, |
| "learning_rate": 3.3415519738344686e-05, |
| "loss": 0.2292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23186247050762177, |
| "step": 1070, |
| "valid_targets_mean": 4213.4, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 2.388888888888889, |
| "grad_norm": 0.48708079743882093, |
| "learning_rate": 3.333312750856703e-05, |
| "loss": 0.2184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22630329430103302, |
| "step": 1075, |
| "valid_targets_mean": 5137.1, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 2.4, |
| "grad_norm": 0.6201131687835197, |
| "learning_rate": 3.3250325957296936e-05, |
| "loss": 0.2296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2439213991165161, |
| "step": 1080, |
| "valid_targets_mean": 4311.1, |
| "valid_targets_min": 337 |
| }, |
| { |
| "epoch": 2.411111111111111, |
| "grad_norm": 0.5910991737720884, |
| "learning_rate": 3.3167117626507726e-05, |
| "loss": 0.2226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22350382804870605, |
| "step": 1085, |
| "valid_targets_mean": 4331.2, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 2.422222222222222, |
| "grad_norm": 0.5745602273524396, |
| "learning_rate": 3.308350507066069e-05, |
| "loss": 0.2285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2272610366344452, |
| "step": 1090, |
| "valid_targets_mean": 3677.5, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 2.4333333333333336, |
| "grad_norm": 0.5154857981766388, |
| "learning_rate": 3.2999490856626674e-05, |
| "loss": 0.2117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21586115658283234, |
| "step": 1095, |
| "valid_targets_mean": 4540.8, |
| "valid_targets_min": 449 |
| }, |
| { |
| "epoch": 2.4444444444444446, |
| "grad_norm": 0.49655172714458007, |
| "learning_rate": 3.291507756360725e-05, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23002441227436066, |
| "step": 1100, |
| "valid_targets_mean": 4644.0, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 2.4555555555555557, |
| "grad_norm": 0.6161023573158174, |
| "learning_rate": 3.283026778305554e-05, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24754559993743896, |
| "step": 1105, |
| "valid_targets_mean": 4383.9, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 2.466666666666667, |
| "grad_norm": 0.47036375778212935, |
| "learning_rate": 3.2745064118596696e-05, |
| "loss": 0.2317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20647308230400085, |
| "step": 1110, |
| "valid_targets_mean": 5761.9, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 2.477777777777778, |
| "grad_norm": 0.5406137267974768, |
| "learning_rate": 3.265946918594793e-05, |
| "loss": 0.232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23646476864814758, |
| "step": 1115, |
| "valid_targets_mean": 3537.1, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 2.488888888888889, |
| "grad_norm": 0.4637714307748355, |
| "learning_rate": 3.257348561283822e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22905629873275757, |
| "step": 1120, |
| "valid_targets_mean": 5062.0, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 2.5, |
| "grad_norm": 0.4800390566792728, |
| "learning_rate": 3.248711603892765e-05, |
| "loss": 0.2144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2034926414489746, |
| "step": 1125, |
| "valid_targets_mean": 4869.9, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 2.511111111111111, |
| "grad_norm": 3.5144120907404144, |
| "learning_rate": 3.240036311572635e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3505418002605438, |
| "step": 1130, |
| "valid_targets_mean": 3852.2, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 2.522222222222222, |
| "grad_norm": 0.6588418511183887, |
| "learning_rate": 3.2313229506513167e-05, |
| "loss": 0.2188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24138295650482178, |
| "step": 1135, |
| "valid_targets_mean": 3041.4, |
| "valid_targets_min": 419 |
| }, |
| { |
| "epoch": 2.533333333333333, |
| "grad_norm": 0.4351804600110289, |
| "learning_rate": 3.22257178862538e-05, |
| "loss": 0.2431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22207850217819214, |
| "step": 1140, |
| "valid_targets_mean": 5268.9, |
| "valid_targets_min": 1175 |
| }, |
| { |
| "epoch": 2.5444444444444443, |
| "grad_norm": 0.5924820635484583, |
| "learning_rate": 3.213783094151873e-05, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24633681774139404, |
| "step": 1145, |
| "valid_targets_mean": 4402.8, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 2.5555555555555554, |
| "grad_norm": 0.4637928251048832, |
| "learning_rate": 3.204957137040079e-05, |
| "loss": 0.2235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22640839219093323, |
| "step": 1150, |
| "valid_targets_mean": 4871.2, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 2.5666666666666664, |
| "grad_norm": 0.5791271707374432, |
| "learning_rate": 3.196094188243224e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24356502294540405, |
| "step": 1155, |
| "valid_targets_mean": 4226.2, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 2.5777777777777775, |
| "grad_norm": 0.544475419998541, |
| "learning_rate": 3.187194519850167e-05, |
| "loss": 0.2195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21199198067188263, |
| "step": 1160, |
| "valid_targets_mean": 4666.7, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 2.588888888888889, |
| "grad_norm": 0.5117366718721723, |
| "learning_rate": 3.17825840507704e-05, |
| "loss": 0.2326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2462947815656662, |
| "step": 1165, |
| "valid_targets_mean": 4306.7, |
| "valid_targets_min": 231 |
| }, |
| { |
| "epoch": 2.6, |
| "grad_norm": 0.5185736052483539, |
| "learning_rate": 3.169286118258867e-05, |
| "loss": 0.2191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21428170800209045, |
| "step": 1170, |
| "valid_targets_mean": 4292.4, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 2.611111111111111, |
| "grad_norm": 0.5124442481522459, |
| "learning_rate": 3.1602779348411354e-05, |
| "loss": 0.2194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21586015820503235, |
| "step": 1175, |
| "valid_targets_mean": 4098.7, |
| "valid_targets_min": 284 |
| }, |
| { |
| "epoch": 2.6222222222222222, |
| "grad_norm": 0.5013956254301979, |
| "learning_rate": 3.151234131371348e-05, |
| "loss": 0.2224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20073631405830383, |
| "step": 1180, |
| "valid_targets_mean": 3848.8, |
| "valid_targets_min": 473 |
| }, |
| { |
| "epoch": 2.6333333333333333, |
| "grad_norm": 0.5498700950427212, |
| "learning_rate": 3.142154985490523e-05, |
| "loss": 0.2231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22234992682933807, |
| "step": 1185, |
| "valid_targets_mean": 3493.1, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 2.6444444444444444, |
| "grad_norm": 0.5491708841030193, |
| "learning_rate": 3.1330407759246805e-05, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22136567533016205, |
| "step": 1190, |
| "valid_targets_mean": 3996.4, |
| "valid_targets_min": 251 |
| }, |
| { |
| "epoch": 2.6555555555555554, |
| "grad_norm": 0.48268790906327425, |
| "learning_rate": 3.1238917824762794e-05, |
| "loss": 0.2062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2028353214263916, |
| "step": 1195, |
| "valid_targets_mean": 4584.0, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 2.6666666666666665, |
| "grad_norm": 0.49007399842315175, |
| "learning_rate": 3.1147082860156275e-05, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25679466128349304, |
| "step": 1200, |
| "valid_targets_mean": 5399.8, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 2.677777777777778, |
| "grad_norm": 0.4633684064891278, |
| "learning_rate": 3.105490568472266e-05, |
| "loss": 0.2108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2022610604763031, |
| "step": 1205, |
| "valid_targets_mean": 4171.5, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 2.688888888888889, |
| "grad_norm": 0.4895671052558776, |
| "learning_rate": 3.0962389128263025e-05, |
| "loss": 0.2333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19812658429145813, |
| "step": 1210, |
| "valid_targets_mean": 5454.3, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 2.7, |
| "grad_norm": 0.5453665235834874, |
| "learning_rate": 3.086953603099736e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20646308362483978, |
| "step": 1215, |
| "valid_targets_mean": 4315.4, |
| "valid_targets_min": 465 |
| }, |
| { |
| "epoch": 2.7111111111111112, |
| "grad_norm": 0.5581759362267998, |
| "learning_rate": 3.077634924347728e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22275254130363464, |
| "step": 1220, |
| "valid_targets_mean": 3761.5, |
| "valid_targets_min": 269 |
| }, |
| { |
| "epoch": 2.7222222222222223, |
| "grad_norm": 0.5153650133576909, |
| "learning_rate": 3.068283162649858e-05, |
| "loss": 0.2293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21216610074043274, |
| "step": 1225, |
| "valid_targets_mean": 4164.8, |
| "valid_targets_min": 296 |
| }, |
| { |
| "epoch": 2.7333333333333334, |
| "grad_norm": 0.592596188705314, |
| "learning_rate": 3.0588986051013355e-05, |
| "loss": 0.216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22181862592697144, |
| "step": 1230, |
| "valid_targets_mean": 4035.2, |
| "valid_targets_min": 283 |
| }, |
| { |
| "epoch": 2.7444444444444445, |
| "grad_norm": 0.5983613901546053, |
| "learning_rate": 3.049481539804192e-05, |
| "loss": 0.2231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22257715463638306, |
| "step": 1235, |
| "valid_targets_mean": 3023.5, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 2.7555555555555555, |
| "grad_norm": 0.49305225026999655, |
| "learning_rate": 3.0400322558584308e-05, |
| "loss": 0.2201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19669756293296814, |
| "step": 1240, |
| "valid_targets_mean": 4822.0, |
| "valid_targets_min": 1400 |
| }, |
| { |
| "epoch": 2.7666666666666666, |
| "grad_norm": 0.4752603478313126, |
| "learning_rate": 3.0305510433531568e-05, |
| "loss": 0.2444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23400330543518066, |
| "step": 1245, |
| "valid_targets_mean": 4814.9, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 2.7777777777777777, |
| "grad_norm": 0.5551934554676596, |
| "learning_rate": 3.0210381933576654e-05, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2083454132080078, |
| "step": 1250, |
| "valid_targets_mean": 3553.5, |
| "valid_targets_min": 348 |
| }, |
| { |
| "epoch": 2.7888888888888888, |
| "grad_norm": 0.7744675886957486, |
| "learning_rate": 3.0114939979125135e-05, |
| "loss": 0.2268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2401510775089264, |
| "step": 1255, |
| "valid_targets_mean": 3016.8, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 2.8, |
| "grad_norm": 0.5540461372381361, |
| "learning_rate": 3.001918750020547e-05, |
| "loss": 0.2216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2751244008541107, |
| "step": 1260, |
| "valid_targets_mean": 3901.6, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 2.811111111111111, |
| "grad_norm": 0.6851890356876696, |
| "learning_rate": 2.992312743637911e-05, |
| "loss": 0.2121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25260940194129944, |
| "step": 1265, |
| "valid_targets_mean": 4583.8, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 2.822222222222222, |
| "grad_norm": 0.48363964794454084, |
| "learning_rate": 2.982676273665023e-05, |
| "loss": 0.2065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2125380039215088, |
| "step": 1270, |
| "valid_targets_mean": 5045.1, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 2.8333333333333335, |
| "grad_norm": 0.6033207649950939, |
| "learning_rate": 2.97300963593752e-05, |
| "loss": 0.2301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22328922152519226, |
| "step": 1275, |
| "valid_targets_mean": 5039.6, |
| "valid_targets_min": 1597 |
| }, |
| { |
| "epoch": 2.8444444444444446, |
| "grad_norm": 0.5440870025040494, |
| "learning_rate": 2.9633131272171768e-05, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21130454540252686, |
| "step": 1280, |
| "valid_targets_mean": 3933.2, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 2.8555555555555556, |
| "grad_norm": 0.46685874495827057, |
| "learning_rate": 2.953587045182795e-05, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2029666304588318, |
| "step": 1285, |
| "valid_targets_mean": 4932.2, |
| "valid_targets_min": 414 |
| }, |
| { |
| "epoch": 2.8666666666666667, |
| "grad_norm": 0.5083384300553782, |
| "learning_rate": 2.943831688421066e-05, |
| "loss": 0.2263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20045515894889832, |
| "step": 1290, |
| "valid_targets_mean": 3839.1, |
| "valid_targets_min": 2102 |
| }, |
| { |
| "epoch": 2.8777777777777778, |
| "grad_norm": 0.5496306210874803, |
| "learning_rate": 2.9340473564174003e-05, |
| "loss": 0.2254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2500072121620178, |
| "step": 1295, |
| "valid_targets_mean": 4098.8, |
| "valid_targets_min": 417 |
| }, |
| { |
| "epoch": 2.888888888888889, |
| "grad_norm": 0.5194734275085567, |
| "learning_rate": 2.9242343495467396e-05, |
| "loss": 0.2347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22234457731246948, |
| "step": 1300, |
| "valid_targets_mean": 3903.9, |
| "valid_targets_min": 411 |
| }, |
| { |
| "epoch": 2.9, |
| "grad_norm": 0.504766986056304, |
| "learning_rate": 2.9143929690643292e-05, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23288145661354065, |
| "step": 1305, |
| "valid_targets_mean": 5635.0, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 2.911111111111111, |
| "grad_norm": 0.6498390965909955, |
| "learning_rate": 2.9045235170964754e-05, |
| "loss": 0.2322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23700065910816193, |
| "step": 1310, |
| "valid_targets_mean": 4147.7, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 2.9222222222222225, |
| "grad_norm": 0.47655618469018296, |
| "learning_rate": 2.8946262966312652e-05, |
| "loss": 0.2247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20102891325950623, |
| "step": 1315, |
| "valid_targets_mean": 3986.3, |
| "valid_targets_min": 301 |
| }, |
| { |
| "epoch": 2.9333333333333336, |
| "grad_norm": 0.444313610842639, |
| "learning_rate": 2.8847016115092686e-05, |
| "loss": 0.2268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20955491065979004, |
| "step": 1320, |
| "valid_targets_mean": 5599.8, |
| "valid_targets_min": 403 |
| }, |
| { |
| "epoch": 2.9444444444444446, |
| "grad_norm": 0.5345322272032264, |
| "learning_rate": 2.8747497664142075e-05, |
| "loss": 0.2085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21730177104473114, |
| "step": 1325, |
| "valid_targets_mean": 3947.6, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 2.9555555555555557, |
| "grad_norm": 0.48868872486689147, |
| "learning_rate": 2.8647710668636053e-05, |
| "loss": 0.2251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21820557117462158, |
| "step": 1330, |
| "valid_targets_mean": 4328.9, |
| "valid_targets_min": 301 |
| }, |
| { |
| "epoch": 2.966666666666667, |
| "grad_norm": 0.5163666912550201, |
| "learning_rate": 2.8547658191994054e-05, |
| "loss": 0.2159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2369096875190735, |
| "step": 1335, |
| "valid_targets_mean": 3999.9, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 2.977777777777778, |
| "grad_norm": 0.4525486700692223, |
| "learning_rate": 2.844734330578567e-05, |
| "loss": 0.2165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22851812839508057, |
| "step": 1340, |
| "valid_targets_mean": 5680.0, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 2.988888888888889, |
| "grad_norm": 0.5038511428892624, |
| "learning_rate": 2.834676908963636e-05, |
| "loss": 0.2223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20257601141929626, |
| "step": 1345, |
| "valid_targets_mean": 4431.0, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 3.0, |
| "grad_norm": 0.49413740091680286, |
| "learning_rate": 2.824593863113291e-05, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2500663995742798, |
| "step": 1350, |
| "valid_targets_mean": 5082.1, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 3.011111111111111, |
| "grad_norm": 0.5890237248654047, |
| "learning_rate": 2.814485502572863e-05, |
| "loss": 0.1906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18735849857330322, |
| "step": 1355, |
| "valid_targets_mean": 5022.9, |
| "valid_targets_min": 1330 |
| }, |
| { |
| "epoch": 3.022222222222222, |
| "grad_norm": 0.5397593530227527, |
| "learning_rate": 2.804352137664835e-05, |
| "loss": 0.2145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2516242265701294, |
| "step": 1360, |
| "valid_targets_mean": 5099.1, |
| "valid_targets_min": 360 |
| }, |
| { |
| "epoch": 3.033333333333333, |
| "grad_norm": 0.568525348633587, |
| "learning_rate": 2.7941940794793122e-05, |
| "loss": 0.1982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19268794357776642, |
| "step": 1365, |
| "valid_targets_mean": 3634.8, |
| "valid_targets_min": 294 |
| }, |
| { |
| "epoch": 3.0444444444444443, |
| "grad_norm": 0.504377586126035, |
| "learning_rate": 2.7840116398644742e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19320614635944366, |
| "step": 1370, |
| "valid_targets_mean": 4622.8, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 3.0555555555555554, |
| "grad_norm": 0.6922737256269529, |
| "learning_rate": 2.7738051314169993e-05, |
| "loss": 0.195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2083386778831482, |
| "step": 1375, |
| "valid_targets_mean": 5940.1, |
| "valid_targets_min": 2844 |
| }, |
| { |
| "epoch": 3.066666666666667, |
| "grad_norm": 0.45807741860705403, |
| "learning_rate": 2.7635748674724702e-05, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17992693185806274, |
| "step": 1380, |
| "valid_targets_mean": 5056.9, |
| "valid_targets_min": 581 |
| }, |
| { |
| "epoch": 3.077777777777778, |
| "grad_norm": 0.49380418579141977, |
| "learning_rate": 2.7533211620957532e-05, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20595912635326385, |
| "step": 1385, |
| "valid_targets_mean": 5148.5, |
| "valid_targets_min": 2209 |
| }, |
| { |
| "epoch": 3.088888888888889, |
| "grad_norm": 0.6287045912836227, |
| "learning_rate": 2.743044330071356e-05, |
| "loss": 0.2061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2235325574874878, |
| "step": 1390, |
| "valid_targets_mean": 3636.7, |
| "valid_targets_min": 382 |
| }, |
| { |
| "epoch": 3.1, |
| "grad_norm": 0.5630479669186463, |
| "learning_rate": 2.7327446868937664e-05, |
| "loss": 0.1965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19244463741779327, |
| "step": 1395, |
| "valid_targets_mean": 5513.7, |
| "valid_targets_min": 361 |
| }, |
| { |
| "epoch": 3.111111111111111, |
| "grad_norm": 0.47811337357814554, |
| "learning_rate": 2.7224225487577637e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1944870501756668, |
| "step": 1400, |
| "valid_targets_mean": 5109.3, |
| "valid_targets_min": 214 |
| }, |
| { |
| "epoch": 3.1222222222222222, |
| "grad_norm": 0.5608741822584281, |
| "learning_rate": 2.712078232548714e-05, |
| "loss": 0.2004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1881995052099228, |
| "step": 1405, |
| "valid_targets_mean": 4487.5, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 3.1333333333333333, |
| "grad_norm": 0.5261157563058694, |
| "learning_rate": 2.7017120558328395e-05, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1874210387468338, |
| "step": 1410, |
| "valid_targets_mean": 4228.4, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 3.1444444444444444, |
| "grad_norm": 0.5496647265564715, |
| "learning_rate": 2.6913243368474734e-05, |
| "loss": 0.2034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22300265729427338, |
| "step": 1415, |
| "valid_targets_mean": 4393.3, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 3.1555555555555554, |
| "grad_norm": 0.49758618583607633, |
| "learning_rate": 2.680915394491286e-05, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19458116590976715, |
| "step": 1420, |
| "valid_targets_mean": 4739.6, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 3.1666666666666665, |
| "grad_norm": 0.5218888450001141, |
| "learning_rate": 2.6704855483144973e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21135935187339783, |
| "step": 1425, |
| "valid_targets_mean": 4440.1, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 3.1777777777777776, |
| "grad_norm": 0.5426640353608564, |
| "learning_rate": 2.6600351185090637e-05, |
| "loss": 0.211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19701051712036133, |
| "step": 1430, |
| "valid_targets_mean": 3513.1, |
| "valid_targets_min": 291 |
| }, |
| { |
| "epoch": 3.188888888888889, |
| "grad_norm": 0.5662706793465802, |
| "learning_rate": 2.649564425898853e-05, |
| "loss": 0.1992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21139845252037048, |
| "step": 1435, |
| "valid_targets_mean": 3985.6, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 3.2, |
| "grad_norm": 0.4718898918421046, |
| "learning_rate": 2.6390737919297925e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1822149157524109, |
| "step": 1440, |
| "valid_targets_mean": 5072.8, |
| "valid_targets_min": 903 |
| }, |
| { |
| "epoch": 3.2111111111111112, |
| "grad_norm": 0.5271902172821914, |
| "learning_rate": 2.6285635386599983e-05, |
| "loss": 0.2036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1844690442085266, |
| "step": 1445, |
| "valid_targets_mean": 4660.9, |
| "valid_targets_min": 942 |
| }, |
| { |
| "epoch": 3.2222222222222223, |
| "grad_norm": 0.7537646783410501, |
| "learning_rate": 2.618033988749895e-05, |
| "loss": 0.2114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20052474737167358, |
| "step": 1450, |
| "valid_targets_mean": 3193.3, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 3.2333333333333334, |
| "grad_norm": 0.4690363852812957, |
| "learning_rate": 2.6074854654523023e-05, |
| "loss": 0.2106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16611334681510925, |
| "step": 1455, |
| "valid_targets_mean": 4196.4, |
| "valid_targets_min": 469 |
| }, |
| { |
| "epoch": 3.2444444444444445, |
| "grad_norm": 0.4572908827805106, |
| "learning_rate": 2.596918292602518e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18506214022636414, |
| "step": 1460, |
| "valid_targets_mean": 5220.0, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 3.2555555555555555, |
| "grad_norm": 0.5395419499985299, |
| "learning_rate": 2.586332794608371e-05, |
| "loss": 0.1997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18608039617538452, |
| "step": 1465, |
| "valid_targets_mean": 3894.8, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 3.2666666666666666, |
| "grad_norm": 0.8552816175037915, |
| "learning_rate": 2.5757292964402653e-05, |
| "loss": 0.1956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18753841519355774, |
| "step": 1470, |
| "valid_targets_mean": 4177.2, |
| "valid_targets_min": 357 |
| }, |
| { |
| "epoch": 3.2777777777777777, |
| "grad_norm": 0.6502074224948179, |
| "learning_rate": 2.5651081236212045e-05, |
| "loss": 0.193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1877031922340393, |
| "step": 1475, |
| "valid_targets_mean": 3714.6, |
| "valid_targets_min": 587 |
| }, |
| { |
| "epoch": 3.2888888888888888, |
| "grad_norm": 0.504138623747214, |
| "learning_rate": 2.5544696022167945e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19270633161067963, |
| "step": 1480, |
| "valid_targets_mean": 5232.9, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 3.3, |
| "grad_norm": 0.5562353529549702, |
| "learning_rate": 2.5438140588252367e-05, |
| "loss": 0.2198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23178471624851227, |
| "step": 1485, |
| "valid_targets_mean": 4443.0, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 3.311111111111111, |
| "grad_norm": 0.6990935382908224, |
| "learning_rate": 2.5331418205672988e-05, |
| "loss": 0.1837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1817629337310791, |
| "step": 1490, |
| "valid_targets_mean": 3285.0, |
| "valid_targets_min": 387 |
| }, |
| { |
| "epoch": 3.3222222222222224, |
| "grad_norm": 0.5161517693720137, |
| "learning_rate": 2.522453215076277e-05, |
| "loss": 0.208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21749022603034973, |
| "step": 1495, |
| "valid_targets_mean": 5134.9, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 3.3333333333333335, |
| "grad_norm": 0.546904151431328, |
| "learning_rate": 2.511748570487932e-05, |
| "loss": 0.2122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23374782502651215, |
| "step": 1500, |
| "valid_targets_mean": 4250.7, |
| "valid_targets_min": 588 |
| }, |
| { |
| "epoch": 3.3444444444444446, |
| "grad_norm": 0.47277844481370324, |
| "learning_rate": 2.5010282154304193e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20504996180534363, |
| "step": 1505, |
| "valid_targets_mean": 5340.2, |
| "valid_targets_min": 586 |
| }, |
| { |
| "epoch": 3.3555555555555556, |
| "grad_norm": 0.5412015372324224, |
| "learning_rate": 2.4902924790142004e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20246189832687378, |
| "step": 1510, |
| "valid_targets_mean": 3491.1, |
| "valid_targets_min": 218 |
| }, |
| { |
| "epoch": 3.3666666666666667, |
| "grad_norm": 0.5638774958328592, |
| "learning_rate": 2.479541690821935e-05, |
| "loss": 0.2145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22698086500167847, |
| "step": 1515, |
| "valid_targets_mean": 3940.7, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 3.3777777777777778, |
| "grad_norm": 0.4561709138055978, |
| "learning_rate": 2.4687761808983693e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1643875539302826, |
| "step": 1520, |
| "valid_targets_mean": 5342.7, |
| "valid_targets_min": 1439 |
| }, |
| { |
| "epoch": 3.388888888888889, |
| "grad_norm": 0.5234462175070752, |
| "learning_rate": 2.457996279740199e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19301840662956238, |
| "step": 1525, |
| "valid_targets_mean": 4052.8, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 3.4, |
| "grad_norm": 0.5228201850030787, |
| "learning_rate": 2.4472023182859257e-05, |
| "loss": 0.1913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18041759729385376, |
| "step": 1530, |
| "valid_targets_mean": 4235.0, |
| "valid_targets_min": 1815 |
| }, |
| { |
| "epoch": 3.411111111111111, |
| "grad_norm": 0.5751004806856855, |
| "learning_rate": 2.4363946279056947e-05, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20007622241973877, |
| "step": 1535, |
| "valid_targets_mean": 5299.6, |
| "valid_targets_min": 1225 |
| }, |
| { |
| "epoch": 3.422222222222222, |
| "grad_norm": 0.5955197652307113, |
| "learning_rate": 2.4255735403911243e-05, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19078674912452698, |
| "step": 1540, |
| "valid_targets_mean": 3658.2, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 3.4333333333333336, |
| "grad_norm": 0.5223462323520682, |
| "learning_rate": 2.4147393879451205e-05, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22115221619606018, |
| "step": 1545, |
| "valid_targets_mean": 4941.4, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 3.4444444444444446, |
| "grad_norm": 0.5358147295716755, |
| "learning_rate": 2.4038925031716755e-05, |
| "loss": 0.2036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1802097111940384, |
| "step": 1550, |
| "valid_targets_mean": 3892.2, |
| "valid_targets_min": 376 |
| }, |
| { |
| "epoch": 3.4555555555555557, |
| "grad_norm": 0.5061336217509301, |
| "learning_rate": 2.3930332190656604e-05, |
| "loss": 0.2151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1854897439479828, |
| "step": 1555, |
| "valid_targets_mean": 4797.3, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 3.466666666666667, |
| "grad_norm": 0.6266246922904652, |
| "learning_rate": 2.382161869002599e-05, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2148759663105011, |
| "step": 1560, |
| "valid_targets_mean": 3841.4, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 3.477777777777778, |
| "grad_norm": 0.7044788267096704, |
| "learning_rate": 2.371278786728436e-05, |
| "loss": 0.2006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24996237456798553, |
| "step": 1565, |
| "valid_targets_mean": 2695.3, |
| "valid_targets_min": 332 |
| }, |
| { |
| "epoch": 3.488888888888889, |
| "grad_norm": 0.49301848581474994, |
| "learning_rate": 2.3603843063492892e-05, |
| "loss": 0.1948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2028578519821167, |
| "step": 1570, |
| "valid_targets_mean": 5528.7, |
| "valid_targets_min": 2284 |
| }, |
| { |
| "epoch": 3.5, |
| "grad_norm": 0.5882627059324441, |
| "learning_rate": 2.3494787623211954e-05, |
| "loss": 0.1965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19135794043540955, |
| "step": 1575, |
| "valid_targets_mean": 3645.6, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 3.511111111111111, |
| "grad_norm": 0.4963690972784803, |
| "learning_rate": 2.3385624894398387e-05, |
| "loss": 0.1973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20491212606430054, |
| "step": 1580, |
| "valid_targets_mean": 5376.0, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 3.522222222222222, |
| "grad_norm": 0.538419155290378, |
| "learning_rate": 2.3276358228302757e-05, |
| "loss": 0.2111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20943906903266907, |
| "step": 1585, |
| "valid_targets_mean": 3945.6, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 3.533333333333333, |
| "grad_norm": 0.6038918409459312, |
| "learning_rate": 2.316699097936646e-05, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1826208233833313, |
| "step": 1590, |
| "valid_targets_mean": 2921.8, |
| "valid_targets_min": 247 |
| }, |
| { |
| "epoch": 3.5444444444444443, |
| "grad_norm": 0.48461226325428114, |
| "learning_rate": 2.305752650511874e-05, |
| "loss": 0.1971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23485904932022095, |
| "step": 1595, |
| "valid_targets_mean": 5048.4, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 3.5555555555555554, |
| "grad_norm": 0.4544047818243079, |
| "learning_rate": 2.2947968166073627e-05, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17371800541877747, |
| "step": 1600, |
| "valid_targets_mean": 4993.6, |
| "valid_targets_min": 503 |
| }, |
| { |
| "epoch": 3.5666666666666664, |
| "grad_norm": 0.4627984476791086, |
| "learning_rate": 2.2838319325626746e-05, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17911431193351746, |
| "step": 1605, |
| "valid_targets_mean": 5385.9, |
| "valid_targets_min": 2454 |
| }, |
| { |
| "epoch": 3.5777777777777775, |
| "grad_norm": 0.5655196781582149, |
| "learning_rate": 2.2728583349952094e-05, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18993490934371948, |
| "step": 1610, |
| "valid_targets_mean": 4732.7, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 3.588888888888889, |
| "grad_norm": 0.5352167184955361, |
| "learning_rate": 2.2618763607898666e-05, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1996089518070221, |
| "step": 1615, |
| "valid_targets_mean": 4169.6, |
| "valid_targets_min": 391 |
| }, |
| { |
| "epoch": 3.6, |
| "grad_norm": 0.533764539999318, |
| "learning_rate": 2.250886347088707e-05, |
| "loss": 0.1992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1746983379125595, |
| "step": 1620, |
| "valid_targets_mean": 4142.2, |
| "valid_targets_min": 402 |
| }, |
| { |
| "epoch": 3.611111111111111, |
| "grad_norm": 0.510040722808607, |
| "learning_rate": 2.2398886312805996e-05, |
| "loss": 0.1865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19001047313213348, |
| "step": 1625, |
| "valid_targets_mean": 5082.9, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 3.6222222222222222, |
| "grad_norm": 0.5755748579267672, |
| "learning_rate": 2.228883550990864e-05, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21132859587669373, |
| "step": 1630, |
| "valid_targets_mean": 4745.2, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 3.6333333333333333, |
| "grad_norm": 0.4921775589074553, |
| "learning_rate": 2.2178714440709084e-05, |
| "loss": 0.203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1739899069070816, |
| "step": 1635, |
| "valid_targets_mean": 4681.7, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.6444444444444444, |
| "grad_norm": 0.4640557234030302, |
| "learning_rate": 2.206852648587853e-05, |
| "loss": 0.2106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20348605513572693, |
| "step": 1640, |
| "valid_targets_mean": 5669.5, |
| "valid_targets_min": 932 |
| }, |
| { |
| "epoch": 3.6555555555555554, |
| "grad_norm": 0.5916842012997149, |
| "learning_rate": 2.1958275028141566e-05, |
| "loss": 0.2239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27221259474754333, |
| "step": 1645, |
| "valid_targets_mean": 4139.3, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 3.6666666666666665, |
| "grad_norm": 0.5390040585860258, |
| "learning_rate": 2.1847963452172283e-05, |
| "loss": 0.192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1900901198387146, |
| "step": 1650, |
| "valid_targets_mean": 3726.5, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 3.677777777777778, |
| "grad_norm": 0.5164729678261945, |
| "learning_rate": 2.173759514449037e-05, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19901810586452484, |
| "step": 1655, |
| "valid_targets_mean": 4287.4, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 3.688888888888889, |
| "grad_norm": 0.5897377625071923, |
| "learning_rate": 2.1627173493357167e-05, |
| "loss": 0.1981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2279503494501114, |
| "step": 1660, |
| "valid_targets_mean": 4376.0, |
| "valid_targets_min": 460 |
| }, |
| { |
| "epoch": 3.7, |
| "grad_norm": 0.5386462237457673, |
| "learning_rate": 2.1516701888671633e-05, |
| "loss": 0.2009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19399359822273254, |
| "step": 1665, |
| "valid_targets_mean": 4516.8, |
| "valid_targets_min": 1662 |
| }, |
| { |
| "epoch": 3.7111111111111112, |
| "grad_norm": 0.6495411852106558, |
| "learning_rate": 2.1406183721866274e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21747617423534393, |
| "step": 1670, |
| "valid_targets_mean": 3540.1, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 3.7222222222222223, |
| "grad_norm": 0.6306749469465672, |
| "learning_rate": 2.1295622385803036e-05, |
| "loss": 0.2024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2108190804719925, |
| "step": 1675, |
| "valid_targets_mean": 3204.0, |
| "valid_targets_min": 394 |
| }, |
| { |
| "epoch": 3.7333333333333334, |
| "grad_norm": 0.5431455240184233, |
| "learning_rate": 2.118502127466916e-05, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17692044377326965, |
| "step": 1680, |
| "valid_targets_mean": 4319.1, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 3.7444444444444445, |
| "grad_norm": 0.6628241987227439, |
| "learning_rate": 2.1074383783872932e-05, |
| "loss": 0.198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21650046110153198, |
| "step": 1685, |
| "valid_targets_mean": 4163.4, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 3.7555555555555555, |
| "grad_norm": 0.5030160452803907, |
| "learning_rate": 2.0963713309939516e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18289291858673096, |
| "step": 1690, |
| "valid_targets_mean": 4629.3, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 3.7666666666666666, |
| "grad_norm": 0.4851965144847549, |
| "learning_rate": 2.0853013250406616e-05, |
| "loss": 0.2008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18697203695774078, |
| "step": 1695, |
| "valid_targets_mean": 4800.1, |
| "valid_targets_min": 449 |
| }, |
| { |
| "epoch": 3.7777777777777777, |
| "grad_norm": 0.5785969302326881, |
| "learning_rate": 2.0742287003720207e-05, |
| "loss": 0.2006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21332597732543945, |
| "step": 1700, |
| "valid_targets_mean": 3694.1, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 3.7888888888888888, |
| "grad_norm": 0.5232277659642465, |
| "learning_rate": 2.063153796913022e-05, |
| "loss": 0.1906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18892058730125427, |
| "step": 1705, |
| "valid_targets_mean": 4132.3, |
| "valid_targets_min": 915 |
| }, |
| { |
| "epoch": 3.8, |
| "grad_norm": 0.4794174421487984, |
| "learning_rate": 2.0520769546586133e-05, |
| "loss": 0.2013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17793911695480347, |
| "step": 1710, |
| "valid_targets_mean": 4531.4, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 3.811111111111111, |
| "grad_norm": 0.6049071480792642, |
| "learning_rate": 2.040998513663265e-05, |
| "loss": 0.2127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1857706606388092, |
| "step": 1715, |
| "valid_targets_mean": 3913.2, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 3.822222222222222, |
| "grad_norm": 0.5173798800043088, |
| "learning_rate": 2.0299188140305276e-05, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23684772849082947, |
| "step": 1720, |
| "valid_targets_mean": 4988.8, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 3.8333333333333335, |
| "grad_norm": 0.475948457370568, |
| "learning_rate": 2.0188381959025905e-05, |
| "loss": 0.2102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21646377444267273, |
| "step": 1725, |
| "valid_targets_mean": 5030.8, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 3.8444444444444446, |
| "grad_norm": 0.5604528558221183, |
| "learning_rate": 2.007756999449841e-05, |
| "loss": 0.2154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21436989307403564, |
| "step": 1730, |
| "valid_targets_mean": 4397.3, |
| "valid_targets_min": 436 |
| }, |
| { |
| "epoch": 3.8555555555555556, |
| "grad_norm": 0.5570797649957374, |
| "learning_rate": 1.9966755648604214e-05, |
| "loss": 0.2082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24257858097553253, |
| "step": 1735, |
| "valid_targets_mean": 4071.1, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 3.8666666666666667, |
| "grad_norm": 0.46080018957317304, |
| "learning_rate": 1.985594232329783e-05, |
| "loss": 0.1974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18925702571868896, |
| "step": 1740, |
| "valid_targets_mean": 5059.1, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 3.8777777777777778, |
| "grad_norm": 0.4812829548781769, |
| "learning_rate": 1.9745133420502465e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1966492235660553, |
| "step": 1745, |
| "valid_targets_mean": 5313.2, |
| "valid_targets_min": 356 |
| }, |
| { |
| "epoch": 3.888888888888889, |
| "grad_norm": 0.5203906670242995, |
| "learning_rate": 1.963433234200553e-05, |
| "loss": 0.2074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21304510533809662, |
| "step": 1750, |
| "valid_targets_mean": 5512.0, |
| "valid_targets_min": 2531 |
| }, |
| { |
| "epoch": 3.9, |
| "grad_norm": 0.6126769424919433, |
| "learning_rate": 1.9523542489354256e-05, |
| "loss": 0.2047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22729770839214325, |
| "step": 1755, |
| "valid_targets_mean": 5147.4, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 3.911111111111111, |
| "grad_norm": 0.7274046140099543, |
| "learning_rate": 1.941276726375122e-05, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21173256635665894, |
| "step": 1760, |
| "valid_targets_mean": 3680.5, |
| "valid_targets_min": 341 |
| }, |
| { |
| "epoch": 3.9222222222222225, |
| "grad_norm": 0.5066040807104453, |
| "learning_rate": 1.930201006594999e-05, |
| "loss": 0.2063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1861998438835144, |
| "step": 1765, |
| "valid_targets_mean": 4067.4, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 3.9333333333333336, |
| "grad_norm": 0.5122320443909304, |
| "learning_rate": 1.9191274296150636e-05, |
| "loss": 0.1942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1726941615343094, |
| "step": 1770, |
| "valid_targets_mean": 5269.1, |
| "valid_targets_min": 2317 |
| }, |
| { |
| "epoch": 3.9444444444444446, |
| "grad_norm": 0.49916849396763285, |
| "learning_rate": 1.9080563353895468e-05, |
| "loss": 0.2072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22421357035636902, |
| "step": 1775, |
| "valid_targets_mean": 5178.7, |
| "valid_targets_min": 1286 |
| }, |
| { |
| "epoch": 3.9555555555555557, |
| "grad_norm": 0.5416199282424495, |
| "learning_rate": 1.8969880637964523e-05, |
| "loss": 0.2059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20803487300872803, |
| "step": 1780, |
| "valid_targets_mean": 4335.1, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 3.966666666666667, |
| "grad_norm": 0.5193931663669582, |
| "learning_rate": 1.885922954627137e-05, |
| "loss": 0.1871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.189504474401474, |
| "step": 1785, |
| "valid_targets_mean": 4079.9, |
| "valid_targets_min": 238 |
| }, |
| { |
| "epoch": 3.977777777777778, |
| "grad_norm": 0.5499095062300164, |
| "learning_rate": 1.874861347575867e-05, |
| "loss": 0.1983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20028920471668243, |
| "step": 1790, |
| "valid_targets_mean": 3822.6, |
| "valid_targets_min": 289 |
| }, |
| { |
| "epoch": 3.988888888888889, |
| "grad_norm": 0.8033600112574325, |
| "learning_rate": 1.8638035822294e-05, |
| "loss": 0.2081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1908196657896042, |
| "step": 1795, |
| "valid_targets_mean": 3417.7, |
| "valid_targets_min": 579 |
| }, |
| { |
| "epoch": 4.0, |
| "grad_norm": 0.5699774855020878, |
| "learning_rate": 1.8527499980565505e-05, |
| "loss": 0.21, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20389728248119354, |
| "step": 1800, |
| "valid_targets_mean": 3703.6, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 4.011111111111111, |
| "grad_norm": 0.5684718820432649, |
| "learning_rate": 1.841700934397776e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16114360094070435, |
| "step": 1805, |
| "valid_targets_mean": 4019.9, |
| "valid_targets_min": 359 |
| }, |
| { |
| "epoch": 4.022222222222222, |
| "grad_norm": 0.8806388269505611, |
| "learning_rate": 1.8306567304547537e-05, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19996638596057892, |
| "step": 1810, |
| "valid_targets_mean": 4715.6, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 4.033333333333333, |
| "grad_norm": 0.51053756371864, |
| "learning_rate": 1.8196177252799715e-05, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17319592833518982, |
| "step": 1815, |
| "valid_targets_mean": 4569.9, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 4.044444444444444, |
| "grad_norm": 0.5334838424279315, |
| "learning_rate": 1.8085842577663152e-05, |
| "loss": 0.1887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17766398191452026, |
| "step": 1820, |
| "valid_targets_mean": 4956.6, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 4.055555555555555, |
| "grad_norm": 0.5972352034988178, |
| "learning_rate": 1.797556666636669e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21527108550071716, |
| "step": 1825, |
| "valid_targets_mean": 4466.4, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 4.066666666666666, |
| "grad_norm": 0.6680425414614198, |
| "learning_rate": 1.786535290433512e-05, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18751859664916992, |
| "step": 1830, |
| "valid_targets_mean": 3271.0, |
| "valid_targets_min": 257 |
| }, |
| { |
| "epoch": 4.0777777777777775, |
| "grad_norm": 0.6531224124175032, |
| "learning_rate": 1.775520467508531e-05, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17578667402267456, |
| "step": 1835, |
| "valid_targets_mean": 4452.1, |
| "valid_targets_min": 272 |
| }, |
| { |
| "epoch": 4.088888888888889, |
| "grad_norm": 0.5260657108991496, |
| "learning_rate": 1.7645125360122254e-05, |
| "loss": 0.1968, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1891654133796692, |
| "step": 1840, |
| "valid_targets_mean": 4629.7, |
| "valid_targets_min": 449 |
| }, |
| { |
| "epoch": 4.1, |
| "grad_norm": 0.6623628808793622, |
| "learning_rate": 1.7535118338835358e-05, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20977142453193665, |
| "step": 1845, |
| "valid_targets_mean": 4678.6, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 4.111111111111111, |
| "grad_norm": 0.49817831354909214, |
| "learning_rate": 1.7425186988394586e-05, |
| "loss": 0.1687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15036168694496155, |
| "step": 1850, |
| "valid_targets_mean": 4100.6, |
| "valid_targets_min": 460 |
| }, |
| { |
| "epoch": 4.122222222222222, |
| "grad_norm": 0.7692282976104367, |
| "learning_rate": 1.7315334683646898e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2357831746339798, |
| "step": 1855, |
| "valid_targets_mean": 3612.0, |
| "valid_targets_min": 469 |
| }, |
| { |
| "epoch": 4.133333333333334, |
| "grad_norm": 0.7604226917728939, |
| "learning_rate": 1.7205564797012523e-05, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18661850690841675, |
| "step": 1860, |
| "valid_targets_mean": 2620.3, |
| "valid_targets_min": 350 |
| }, |
| { |
| "epoch": 4.144444444444445, |
| "grad_norm": 2.0101196160603068, |
| "learning_rate": 1.709588069838154e-05, |
| "loss": 0.1809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1724318563938141, |
| "step": 1865, |
| "valid_targets_mean": 5017.0, |
| "valid_targets_min": 1569 |
| }, |
| { |
| "epoch": 4.155555555555556, |
| "grad_norm": 0.5176081748220945, |
| "learning_rate": 1.698628575501034e-05, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19876284897327423, |
| "step": 1870, |
| "valid_targets_mean": 5018.9, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 4.166666666666667, |
| "grad_norm": 0.9808635975742276, |
| "learning_rate": 1.6876783331418298e-05, |
| "loss": 0.1717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1666911095380783, |
| "step": 1875, |
| "valid_targets_mean": 4702.4, |
| "valid_targets_min": 407 |
| }, |
| { |
| "epoch": 4.177777777777778, |
| "grad_norm": 0.5808524542461861, |
| "learning_rate": 1.6767376789284463e-05, |
| "loss": 0.1774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1758621335029602, |
| "step": 1880, |
| "valid_targets_mean": 4182.8, |
| "valid_targets_min": 784 |
| }, |
| { |
| "epoch": 4.188888888888889, |
| "grad_norm": 0.6204999195476525, |
| "learning_rate": 1.6658069487344375e-05, |
| "loss": 0.1899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2005249559879303, |
| "step": 1885, |
| "valid_targets_mean": 3792.5, |
| "valid_targets_min": 494 |
| }, |
| { |
| "epoch": 4.2, |
| "grad_norm": 0.5137903997287736, |
| "learning_rate": 1.6548864781286922e-05, |
| "loss": 0.1972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2340593785047531, |
| "step": 1890, |
| "valid_targets_mean": 5812.1, |
| "valid_targets_min": 524 |
| }, |
| { |
| "epoch": 4.211111111111111, |
| "grad_norm": 0.6084912042277302, |
| "learning_rate": 1.643976602365136e-05, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16975033283233643, |
| "step": 1895, |
| "valid_targets_mean": 4331.1, |
| "valid_targets_min": 331 |
| }, |
| { |
| "epoch": 4.222222222222222, |
| "grad_norm": 0.6075386711012212, |
| "learning_rate": 1.6330776563724354e-05, |
| "loss": 0.185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22459827363491058, |
| "step": 1900, |
| "valid_targets_mean": 4126.8, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 4.233333333333333, |
| "grad_norm": 0.5755129056791891, |
| "learning_rate": 1.62218997474372e-05, |
| "loss": 0.1838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21275658905506134, |
| "step": 1905, |
| "valid_targets_mean": 4578.6, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 4.2444444444444445, |
| "grad_norm": 0.48496618553325505, |
| "learning_rate": 1.6113138917263048e-05, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19767220318317413, |
| "step": 1910, |
| "valid_targets_mean": 5804.9, |
| "valid_targets_min": 2846 |
| }, |
| { |
| "epoch": 4.2555555555555555, |
| "grad_norm": 0.4549668072241525, |
| "learning_rate": 1.6004497412114354e-05, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17819060385227203, |
| "step": 1915, |
| "valid_targets_mean": 5614.6, |
| "valid_targets_min": 1831 |
| }, |
| { |
| "epoch": 4.266666666666667, |
| "grad_norm": 0.6183406372685394, |
| "learning_rate": 1.5895978567240314e-05, |
| "loss": 0.1749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15784139931201935, |
| "step": 1920, |
| "valid_targets_mean": 4810.9, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 4.277777777777778, |
| "grad_norm": 0.8322895904947307, |
| "learning_rate": 1.578758571412455e-05, |
| "loss": 0.1762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18652507662773132, |
| "step": 1925, |
| "valid_targets_mean": 4329.2, |
| "valid_targets_min": 386 |
| }, |
| { |
| "epoch": 4.288888888888889, |
| "grad_norm": 0.5770135845347438, |
| "learning_rate": 1.5679322180382725e-05, |
| "loss": 0.1811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16608160734176636, |
| "step": 1930, |
| "valid_targets_mean": 4621.5, |
| "valid_targets_min": 311 |
| }, |
| { |
| "epoch": 4.3, |
| "grad_norm": 0.5340562181628422, |
| "learning_rate": 1.5571191289660517e-05, |
| "loss": 0.1788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19259527325630188, |
| "step": 1935, |
| "valid_targets_mean": 4542.4, |
| "valid_targets_min": 260 |
| }, |
| { |
| "epoch": 4.311111111111111, |
| "grad_norm": 0.5261906980551986, |
| "learning_rate": 1.5463196361531463e-05, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1652071177959442, |
| "step": 1940, |
| "valid_targets_mean": 4197.6, |
| "valid_targets_min": 351 |
| }, |
| { |
| "epoch": 4.322222222222222, |
| "grad_norm": 0.592935992602908, |
| "learning_rate": 1.5355340711395154e-05, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.173154816031456, |
| "step": 1945, |
| "valid_targets_mean": 3825.3, |
| "valid_targets_min": 362 |
| }, |
| { |
| "epoch": 4.333333333333333, |
| "grad_norm": 0.6272334939060681, |
| "learning_rate": 1.5247627650375356e-05, |
| "loss": 0.1931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2008039653301239, |
| "step": 1950, |
| "valid_targets_mean": 3113.1, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 4.344444444444444, |
| "grad_norm": 0.555228561708398, |
| "learning_rate": 1.5140060485218448e-05, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21200916171073914, |
| "step": 1955, |
| "valid_targets_mean": 4375.6, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 4.355555555555555, |
| "grad_norm": 0.6835598461585742, |
| "learning_rate": 1.5032642518191842e-05, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14425814151763916, |
| "step": 1960, |
| "valid_targets_mean": 3954.5, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 4.366666666666666, |
| "grad_norm": 0.6035952467820439, |
| "learning_rate": 1.4925377046982642e-05, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21049894392490387, |
| "step": 1965, |
| "valid_targets_mean": 4949.8, |
| "valid_targets_min": 355 |
| }, |
| { |
| "epoch": 4.377777777777778, |
| "grad_norm": 0.5857625986334895, |
| "learning_rate": 1.4818267364596382e-05, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18046881258487701, |
| "step": 1970, |
| "valid_targets_mean": 4697.1, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 4.388888888888889, |
| "grad_norm": 0.5718012391776226, |
| "learning_rate": 1.4711316759255963e-05, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1622503101825714, |
| "step": 1975, |
| "valid_targets_mean": 3431.1, |
| "valid_targets_min": 354 |
| }, |
| { |
| "epoch": 4.4, |
| "grad_norm": 0.43582007281524776, |
| "learning_rate": 1.4604528514300657e-05, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15850958228111267, |
| "step": 1980, |
| "valid_targets_mean": 5733.1, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 4.411111111111111, |
| "grad_norm": 0.49374637349645484, |
| "learning_rate": 1.449790590808537e-05, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18013733625411987, |
| "step": 1985, |
| "valid_targets_mean": 5131.2, |
| "valid_targets_min": 337 |
| }, |
| { |
| "epoch": 4.4222222222222225, |
| "grad_norm": 0.572851756273217, |
| "learning_rate": 1.4391452213879949e-05, |
| "loss": 0.193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20474226772785187, |
| "step": 1990, |
| "valid_targets_mean": 4462.7, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 4.433333333333334, |
| "grad_norm": 0.5793355474922025, |
| "learning_rate": 1.428517069976872e-05, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16491413116455078, |
| "step": 1995, |
| "valid_targets_mean": 3528.5, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 4.444444444444445, |
| "grad_norm": 0.5903074938236061, |
| "learning_rate": 1.4179064628550139e-05, |
| "loss": 0.1935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1816416233778, |
| "step": 2000, |
| "valid_targets_mean": 3910.4, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 4.455555555555556, |
| "grad_norm": 0.6305819902409494, |
| "learning_rate": 1.4073137257636664e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19318446516990662, |
| "step": 2005, |
| "valid_targets_mean": 3550.6, |
| "valid_targets_min": 302 |
| }, |
| { |
| "epoch": 4.466666666666667, |
| "grad_norm": 0.4779759860608762, |
| "learning_rate": 1.3967391838954692e-05, |
| "loss": 0.1843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18327465653419495, |
| "step": 2010, |
| "valid_targets_mean": 5106.4, |
| "valid_targets_min": 500 |
| }, |
| { |
| "epoch": 4.477777777777778, |
| "grad_norm": 0.5305939803137136, |
| "learning_rate": 1.3861831618844797e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1693880707025528, |
| "step": 2015, |
| "valid_targets_mean": 4351.6, |
| "valid_targets_min": 229 |
| }, |
| { |
| "epoch": 4.488888888888889, |
| "grad_norm": 0.556324424618143, |
| "learning_rate": 1.3756459837962006e-05, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20899684727191925, |
| "step": 2020, |
| "valid_targets_mean": 4319.3, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 4.5, |
| "grad_norm": 0.511876429216537, |
| "learning_rate": 1.3651279731176364e-05, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17796722054481506, |
| "step": 2025, |
| "valid_targets_mean": 4701.2, |
| "valid_targets_min": 288 |
| }, |
| { |
| "epoch": 4.511111111111111, |
| "grad_norm": 0.483714945780867, |
| "learning_rate": 1.354629452747357e-05, |
| "loss": 0.1912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20415997505187988, |
| "step": 2030, |
| "valid_targets_mean": 5413.3, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 4.522222222222222, |
| "grad_norm": 0.550003762747203, |
| "learning_rate": 1.3441507449855914e-05, |
| "loss": 0.1752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19250717759132385, |
| "step": 2035, |
| "valid_targets_mean": 4369.6, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 4.533333333333333, |
| "grad_norm": 0.6783462987349089, |
| "learning_rate": 1.3336921715243269e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19246190786361694, |
| "step": 2040, |
| "valid_targets_mean": 3528.1, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 4.544444444444444, |
| "grad_norm": 0.5408235091774686, |
| "learning_rate": 1.323254053437438e-05, |
| "loss": 0.1904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17241522669792175, |
| "step": 2045, |
| "valid_targets_mean": 4255.3, |
| "valid_targets_min": 369 |
| }, |
| { |
| "epoch": 4.555555555555555, |
| "grad_norm": 0.6039322559430673, |
| "learning_rate": 1.3128367111708263e-05, |
| "loss": 0.1996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2341468334197998, |
| "step": 2050, |
| "valid_targets_mean": 3956.6, |
| "valid_targets_min": 394 |
| }, |
| { |
| "epoch": 4.566666666666666, |
| "grad_norm": 0.5210903518867492, |
| "learning_rate": 1.3024404645325852e-05, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15793342888355255, |
| "step": 2055, |
| "valid_targets_mean": 4055.9, |
| "valid_targets_min": 445 |
| }, |
| { |
| "epoch": 4.5777777777777775, |
| "grad_norm": 0.5833872344585873, |
| "learning_rate": 1.2920656326831802e-05, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1832209825515747, |
| "step": 2060, |
| "valid_targets_mean": 4347.2, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 4.588888888888889, |
| "grad_norm": 0.6031674137203222, |
| "learning_rate": 1.2817125341256533e-05, |
| "loss": 0.1744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1834879219532013, |
| "step": 2065, |
| "valid_targets_mean": 4529.2, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 4.6, |
| "grad_norm": 0.5606753056516752, |
| "learning_rate": 1.271381486695841e-05, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19605132937431335, |
| "step": 2070, |
| "valid_targets_mean": 4212.9, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 4.611111111111111, |
| "grad_norm": 0.5776621511116948, |
| "learning_rate": 1.2610728075526226e-05, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18587753176689148, |
| "step": 2075, |
| "valid_targets_mean": 4053.1, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 4.622222222222222, |
| "grad_norm": 0.5798129503418713, |
| "learning_rate": 1.250786813168176e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20402874052524567, |
| "step": 2080, |
| "valid_targets_mean": 3672.6, |
| "valid_targets_min": 344 |
| }, |
| { |
| "epoch": 4.633333333333333, |
| "grad_norm": 0.6919963067401517, |
| "learning_rate": 1.2405238193182711e-05, |
| "loss": 0.1854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17745724320411682, |
| "step": 2085, |
| "valid_targets_mean": 4872.3, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 4.644444444444445, |
| "grad_norm": 0.5410119427822812, |
| "learning_rate": 1.2302841410725664e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15331071615219116, |
| "step": 2090, |
| "valid_targets_mean": 3988.9, |
| "valid_targets_min": 428 |
| }, |
| { |
| "epoch": 4.655555555555556, |
| "grad_norm": 0.7216545479667651, |
| "learning_rate": 1.2200680927849447e-05, |
| "loss": 0.1981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1797543466091156, |
| "step": 2095, |
| "valid_targets_mean": 2614.6, |
| "valid_targets_min": 251 |
| }, |
| { |
| "epoch": 4.666666666666667, |
| "grad_norm": 0.5002180832671941, |
| "learning_rate": 1.2098759880838562e-05, |
| "loss": 0.1958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18461236357688904, |
| "step": 2100, |
| "valid_targets_mean": 4813.4, |
| "valid_targets_min": 435 |
| }, |
| { |
| "epoch": 4.677777777777778, |
| "grad_norm": 0.6182929611883429, |
| "learning_rate": 1.1997081398626951e-05, |
| "loss": 0.1859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2105226218700409, |
| "step": 2105, |
| "valid_targets_mean": 4094.2, |
| "valid_targets_min": 323 |
| }, |
| { |
| "epoch": 4.688888888888889, |
| "grad_norm": 0.4881507674799763, |
| "learning_rate": 1.18956486027019e-05, |
| "loss": 0.1842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19194287061691284, |
| "step": 2110, |
| "valid_targets_mean": 5929.9, |
| "valid_targets_min": 393 |
| }, |
| { |
| "epoch": 4.7, |
| "grad_norm": 0.5040091679866664, |
| "learning_rate": 1.179446460700824e-05, |
| "loss": 0.1725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16895370185375214, |
| "step": 2115, |
| "valid_targets_mean": 4929.5, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 4.711111111111111, |
| "grad_norm": 0.6224311426866647, |
| "learning_rate": 1.1693532517852723e-05, |
| "loss": 0.1854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19463957846164703, |
| "step": 2120, |
| "valid_targets_mean": 3470.4, |
| "valid_targets_min": 274 |
| }, |
| { |
| "epoch": 4.722222222222222, |
| "grad_norm": 0.5006685355462409, |
| "learning_rate": 1.1592855433808694e-05, |
| "loss": 0.1834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18951840698719025, |
| "step": 2125, |
| "valid_targets_mean": 4650.5, |
| "valid_targets_min": 472 |
| }, |
| { |
| "epoch": 4.733333333333333, |
| "grad_norm": 0.5583432290318547, |
| "learning_rate": 1.1492436445620925e-05, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2058507204055786, |
| "step": 2130, |
| "valid_targets_mean": 4445.6, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 4.7444444444444445, |
| "grad_norm": 0.6115562244324856, |
| "learning_rate": 1.1392278636110779e-05, |
| "loss": 0.1792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1816525161266327, |
| "step": 2135, |
| "valid_targets_mean": 3926.6, |
| "valid_targets_min": 317 |
| }, |
| { |
| "epoch": 4.7555555555555555, |
| "grad_norm": 0.6799289643246074, |
| "learning_rate": 1.1292385080081517e-05, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18920482695102692, |
| "step": 2140, |
| "valid_targets_mean": 3852.1, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 4.766666666666667, |
| "grad_norm": 0.5372580596002592, |
| "learning_rate": 1.1192758844223936e-05, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19938793778419495, |
| "step": 2145, |
| "valid_targets_mean": 4286.1, |
| "valid_targets_min": 1315 |
| }, |
| { |
| "epoch": 4.777777777777778, |
| "grad_norm": 0.6680811833814686, |
| "learning_rate": 1.1093402987022213e-05, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1695014089345932, |
| "step": 2150, |
| "valid_targets_mean": 3701.4, |
| "valid_targets_min": 490 |
| }, |
| { |
| "epoch": 4.788888888888889, |
| "grad_norm": 0.532047483958881, |
| "learning_rate": 1.0994320558660027e-05, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17513462901115417, |
| "step": 2155, |
| "valid_targets_mean": 4425.6, |
| "valid_targets_min": 433 |
| }, |
| { |
| "epoch": 4.8, |
| "grad_norm": 0.48955367777151076, |
| "learning_rate": 1.0895514600926885e-05, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17399895191192627, |
| "step": 2160, |
| "valid_targets_mean": 5218.5, |
| "valid_targets_min": 214 |
| }, |
| { |
| "epoch": 4.811111111111111, |
| "grad_norm": 0.5389514735096081, |
| "learning_rate": 1.0796988147124767e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17753294110298157, |
| "step": 2165, |
| "valid_targets_mean": 4527.4, |
| "valid_targets_min": 503 |
| }, |
| { |
| "epoch": 4.822222222222222, |
| "grad_norm": 0.9507144410317093, |
| "learning_rate": 1.0698744221974992e-05, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16774040460586548, |
| "step": 2170, |
| "valid_targets_mean": 4067.5, |
| "valid_targets_min": 326 |
| }, |
| { |
| "epoch": 4.833333333333333, |
| "grad_norm": 0.7577965149578579, |
| "learning_rate": 1.0600785841525387e-05, |
| "loss": 0.1856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.171237975358963, |
| "step": 2175, |
| "valid_targets_mean": 2212.1, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 4.844444444444444, |
| "grad_norm": 0.6346378233034229, |
| "learning_rate": 1.050311601305765e-05, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19538968801498413, |
| "step": 2180, |
| "valid_targets_mean": 3583.8, |
| "valid_targets_min": 516 |
| }, |
| { |
| "epoch": 4.855555555555555, |
| "grad_norm": 0.4998326129850529, |
| "learning_rate": 1.0405737734995083e-05, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18201160430908203, |
| "step": 2185, |
| "valid_targets_mean": 5208.7, |
| "valid_targets_min": 532 |
| }, |
| { |
| "epoch": 4.866666666666667, |
| "grad_norm": 0.4912406558278592, |
| "learning_rate": 1.0308653996810464e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1872013956308365, |
| "step": 2190, |
| "valid_targets_mean": 5092.2, |
| "valid_targets_min": 425 |
| }, |
| { |
| "epoch": 4.877777777777778, |
| "grad_norm": 0.49376056988072214, |
| "learning_rate": 1.0211867778934367e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1690564602613449, |
| "step": 2195, |
| "valid_targets_mean": 4442.9, |
| "valid_targets_min": 429 |
| }, |
| { |
| "epoch": 4.888888888888889, |
| "grad_norm": 0.508817245830961, |
| "learning_rate": 1.0115382052663585e-05, |
| "loss": 0.1694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18353170156478882, |
| "step": 2200, |
| "valid_targets_mean": 4733.5, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 4.9, |
| "grad_norm": 0.6203985436463371, |
| "learning_rate": 1.0019199780069964e-05, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.186293363571167, |
| "step": 2205, |
| "valid_targets_mean": 5280.8, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 4.911111111111111, |
| "grad_norm": 0.5435822402870782, |
| "learning_rate": 9.923323913909432e-06, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16027119755744934, |
| "step": 2210, |
| "valid_targets_mean": 4576.7, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 4.9222222222222225, |
| "grad_norm": 0.4813208514339158, |
| "learning_rate": 9.827757397531373e-06, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18010596930980682, |
| "step": 2215, |
| "valid_targets_mean": 4874.1, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 4.933333333333334, |
| "grad_norm": 0.47571932658220617, |
| "learning_rate": 9.732503164788251e-06, |
| "loss": 0.1855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2023318111896515, |
| "step": 2220, |
| "valid_targets_mean": 5265.2, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 4.944444444444445, |
| "grad_norm": 0.5094329037736811, |
| "learning_rate": 9.637564139945576e-06, |
| "loss": 0.1875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17661988735198975, |
| "step": 2225, |
| "valid_targets_mean": 4558.8, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 4.955555555555556, |
| "grad_norm": 0.4793807998595178, |
| "learning_rate": 9.542943237592087e-06, |
| "loss": 0.1849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16008728742599487, |
| "step": 2230, |
| "valid_targets_mean": 4763.2, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 4.966666666666667, |
| "grad_norm": 0.5198576392426981, |
| "learning_rate": 9.448643362550289e-06, |
| "loss": 0.1765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1592457890510559, |
| "step": 2235, |
| "valid_targets_mean": 4264.2, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 4.977777777777778, |
| "grad_norm": 0.6619815493156004, |
| "learning_rate": 9.354667409787293e-06, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2216649353504181, |
| "step": 2240, |
| "valid_targets_mean": 3992.6, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 4.988888888888889, |
| "grad_norm": 0.6140070608373793, |
| "learning_rate": 9.261018264325934e-06, |
| "loss": 0.1891, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19572074711322784, |
| "step": 2245, |
| "valid_targets_mean": 4591.1, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.501892983243998, |
| "learning_rate": 9.16769880115619e-06, |
| "loss": 0.1883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1657697856426239, |
| "step": 2250, |
| "valid_targets_mean": 4708.9, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 5.011111111111111, |
| "grad_norm": 0.5678698075193299, |
| "learning_rate": 9.074711885146928e-06, |
| "loss": 0.1815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18971869349479675, |
| "step": 2255, |
| "valid_targets_mean": 4164.5, |
| "valid_targets_min": 473 |
| }, |
| { |
| "epoch": 5.022222222222222, |
| "grad_norm": 0.4976115195176415, |
| "learning_rate": 8.982060370957953e-06, |
| "loss": 0.1665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1750781536102295, |
| "step": 2260, |
| "valid_targets_mean": 5020.1, |
| "valid_targets_min": 290 |
| }, |
| { |
| "epoch": 5.033333333333333, |
| "grad_norm": 0.684873203009687, |
| "learning_rate": 8.889747102952388e-06, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18005429208278656, |
| "step": 2265, |
| "valid_targets_mean": 3440.0, |
| "valid_targets_min": 307 |
| }, |
| { |
| "epoch": 5.044444444444444, |
| "grad_norm": 0.5033230409129855, |
| "learning_rate": 8.79777491510932e-06, |
| "loss": 0.1776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18455460667610168, |
| "step": 2270, |
| "valid_targets_mean": 5328.9, |
| "valid_targets_min": 247 |
| }, |
| { |
| "epoch": 5.055555555555555, |
| "grad_norm": 0.5173477816105783, |
| "learning_rate": 8.706146630936833e-06, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16611988842487335, |
| "step": 2275, |
| "valid_targets_mean": 4557.4, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 5.066666666666666, |
| "grad_norm": 0.6042166823752133, |
| "learning_rate": 8.6148650633853e-06, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16022253036499023, |
| "step": 2280, |
| "valid_targets_mean": 4060.4, |
| "valid_targets_min": 406 |
| }, |
| { |
| "epoch": 5.0777777777777775, |
| "grad_norm": 0.6312726838673673, |
| "learning_rate": 8.523933014761038e-06, |
| "loss": 0.1669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1730879247188568, |
| "step": 2285, |
| "valid_targets_mean": 3444.7, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 5.088888888888889, |
| "grad_norm": 0.5063988724236291, |
| "learning_rate": 8.43335327664027e-06, |
| "loss": 0.1639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17903856933116913, |
| "step": 2290, |
| "valid_targets_mean": 4995.8, |
| "valid_targets_min": 362 |
| }, |
| { |
| "epoch": 5.1, |
| "grad_norm": 0.596851968168963, |
| "learning_rate": 8.343128629783457e-06, |
| "loss": 0.1781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1816779375076294, |
| "step": 2295, |
| "valid_targets_mean": 5093.5, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 5.111111111111111, |
| "grad_norm": 0.5710225280632183, |
| "learning_rate": 8.253261844049883e-06, |
| "loss": 0.1854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.168840691447258, |
| "step": 2300, |
| "valid_targets_mean": 4315.1, |
| "valid_targets_min": 404 |
| }, |
| { |
| "epoch": 5.122222222222222, |
| "grad_norm": 0.4748229596313232, |
| "learning_rate": 8.163755678312651e-06, |
| "loss": 0.1897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2132357954978943, |
| "step": 2305, |
| "valid_targets_mean": 5789.9, |
| "valid_targets_min": 283 |
| }, |
| { |
| "epoch": 5.133333333333334, |
| "grad_norm": 0.5287110732175844, |
| "learning_rate": 8.074612880373972e-06, |
| "loss": 0.156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1418144404888153, |
| "step": 2310, |
| "valid_targets_mean": 4440.9, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 5.144444444444445, |
| "grad_norm": 0.5936650959791397, |
| "learning_rate": 7.985836186880836e-06, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1570664495229721, |
| "step": 2315, |
| "valid_targets_mean": 4190.9, |
| "valid_targets_min": 335 |
| }, |
| { |
| "epoch": 5.155555555555556, |
| "grad_norm": 0.5901961361581314, |
| "learning_rate": 7.897428323240961e-06, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14300040900707245, |
| "step": 2320, |
| "valid_targets_mean": 4530.4, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 5.166666666666667, |
| "grad_norm": 0.6401412212898742, |
| "learning_rate": 7.809392003539142e-06, |
| "loss": 0.1821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18366971611976624, |
| "step": 2325, |
| "valid_targets_mean": 4497.3, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 5.177777777777778, |
| "grad_norm": 0.5870360837488321, |
| "learning_rate": 7.72172993045393e-06, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19780203700065613, |
| "step": 2330, |
| "valid_targets_mean": 4467.4, |
| "valid_targets_min": 229 |
| }, |
| { |
| "epoch": 5.188888888888889, |
| "grad_norm": 0.6222022824851804, |
| "learning_rate": 7.634444795174671e-06, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1735324114561081, |
| "step": 2335, |
| "valid_targets_mean": 3150.3, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 5.2, |
| "grad_norm": 0.612607191802424, |
| "learning_rate": 7.547539277318861e-06, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17350366711616516, |
| "step": 2340, |
| "valid_targets_mean": 4619.4, |
| "valid_targets_min": 2673 |
| }, |
| { |
| "epoch": 5.211111111111111, |
| "grad_norm": 0.7049036474479938, |
| "learning_rate": 7.461016044849918e-06, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1929350346326828, |
| "step": 2345, |
| "valid_targets_mean": 3115.6, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 5.222222222222222, |
| "grad_norm": 0.5410958789958754, |
| "learning_rate": 7.374877753995224e-06, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1535416543483734, |
| "step": 2350, |
| "valid_targets_mean": 4524.3, |
| "valid_targets_min": 270 |
| }, |
| { |
| "epoch": 5.233333333333333, |
| "grad_norm": 0.6124896649786123, |
| "learning_rate": 7.289127049164648e-06, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19674161076545715, |
| "step": 2355, |
| "valid_targets_mean": 4170.1, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 5.2444444444444445, |
| "grad_norm": 0.4994651140821769, |
| "learning_rate": 7.203766562869303e-06, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17009888589382172, |
| "step": 2360, |
| "valid_targets_mean": 5436.4, |
| "valid_targets_min": 231 |
| }, |
| { |
| "epoch": 5.2555555555555555, |
| "grad_norm": 0.6480412371115537, |
| "learning_rate": 7.118798915640779e-06, |
| "loss": 0.1703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17472770810127258, |
| "step": 2365, |
| "valid_targets_mean": 3678.0, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 5.266666666666667, |
| "grad_norm": 1.0624757859362757, |
| "learning_rate": 7.03422671595065e-06, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1649678647518158, |
| "step": 2370, |
| "valid_targets_mean": 4187.2, |
| "valid_targets_min": 576 |
| }, |
| { |
| "epoch": 5.277777777777778, |
| "grad_norm": 0.5370386672344407, |
| "learning_rate": 6.950052560130414e-06, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16847020387649536, |
| "step": 2375, |
| "valid_targets_mean": 4683.0, |
| "valid_targets_min": 347 |
| }, |
| { |
| "epoch": 5.288888888888889, |
| "grad_norm": 0.6286328398732474, |
| "learning_rate": 6.866279032291792e-06, |
| "loss": 0.1574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15064719319343567, |
| "step": 2380, |
| "valid_targets_mean": 3968.8, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 5.3, |
| "grad_norm": 0.5874233077841997, |
| "learning_rate": 6.782908704247404e-06, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1599939465522766, |
| "step": 2385, |
| "valid_targets_mean": 4385.2, |
| "valid_targets_min": 489 |
| }, |
| { |
| "epoch": 5.311111111111111, |
| "grad_norm": 1.3591182836953655, |
| "learning_rate": 6.699944135431788e-06, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15932810306549072, |
| "step": 2390, |
| "valid_targets_mean": 3961.2, |
| "valid_targets_min": 312 |
| }, |
| { |
| "epoch": 5.322222222222222, |
| "grad_norm": 0.5070411136628474, |
| "learning_rate": 6.617387872822842e-06, |
| "loss": 0.1614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17544835805892944, |
| "step": 2395, |
| "valid_targets_mean": 5117.5, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 5.333333333333333, |
| "grad_norm": 0.53150416040399, |
| "learning_rate": 6.535242450863632e-06, |
| "loss": 0.1807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18131661415100098, |
| "step": 2400, |
| "valid_targets_mean": 4886.9, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 5.344444444444444, |
| "grad_norm": 0.5740042351970523, |
| "learning_rate": 6.453510391384606e-06, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17442232370376587, |
| "step": 2405, |
| "valid_targets_mean": 3791.2, |
| "valid_targets_min": 423 |
| }, |
| { |
| "epoch": 5.355555555555555, |
| "grad_norm": 0.46895250507011754, |
| "learning_rate": 6.372194203526121e-06, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1439400017261505, |
| "step": 2410, |
| "valid_targets_mean": 5206.1, |
| "valid_targets_min": 546 |
| }, |
| { |
| "epoch": 5.366666666666666, |
| "grad_norm": 0.6356884401904439, |
| "learning_rate": 6.2912963836614916e-06, |
| "loss": 0.178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20238983631134033, |
| "step": 2415, |
| "valid_targets_mean": 3916.1, |
| "valid_targets_min": 259 |
| }, |
| { |
| "epoch": 5.377777777777778, |
| "grad_norm": 0.6215829652547431, |
| "learning_rate": 6.210819415320253e-06, |
| "loss": 0.1758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14836809039115906, |
| "step": 2420, |
| "valid_targets_mean": 4363.0, |
| "valid_targets_min": 1439 |
| }, |
| { |
| "epoch": 5.388888888888889, |
| "grad_norm": 0.5563038744061828, |
| "learning_rate": 6.130765769112024e-06, |
| "loss": 0.1663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17539286613464355, |
| "step": 2425, |
| "valid_targets_mean": 4587.9, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 5.4, |
| "grad_norm": 0.5854838140260286, |
| "learning_rate": 6.051137902650575e-06, |
| "loss": 0.18, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1495419442653656, |
| "step": 2430, |
| "valid_targets_mean": 5041.7, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 5.411111111111111, |
| "grad_norm": 0.5363335763908142, |
| "learning_rate": 5.9719382604784405e-06, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16383875906467438, |
| "step": 2435, |
| "valid_targets_mean": 4707.6, |
| "valid_targets_min": 403 |
| }, |
| { |
| "epoch": 5.4222222222222225, |
| "grad_norm": 0.6920747040184556, |
| "learning_rate": 5.893169273991825e-06, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20277723670005798, |
| "step": 2440, |
| "valid_targets_mean": 3596.3, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 5.433333333333334, |
| "grad_norm": 0.5506429671164328, |
| "learning_rate": 5.8148333613659945e-06, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16613167524337769, |
| "step": 2445, |
| "valid_targets_mean": 4807.0, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 5.444444444444445, |
| "grad_norm": 0.5643735346992593, |
| "learning_rate": 5.736932927481016e-06, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1531161069869995, |
| "step": 2450, |
| "valid_targets_mean": 4414.6, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 5.455555555555556, |
| "grad_norm": 0.4966057762741589, |
| "learning_rate": 5.659470363847956e-06, |
| "loss": 0.1701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15961554646492004, |
| "step": 2455, |
| "valid_targets_mean": 5181.2, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 5.466666666666667, |
| "grad_norm": 0.597256774781567, |
| "learning_rate": 5.5824480485354315e-06, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19598601758480072, |
| "step": 2460, |
| "valid_targets_mean": 5393.7, |
| "valid_targets_min": 377 |
| }, |
| { |
| "epoch": 5.477777777777778, |
| "grad_norm": 0.47416903570786223, |
| "learning_rate": 5.505868346096623e-06, |
| "loss": 0.1842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17863276600837708, |
| "step": 2465, |
| "valid_targets_mean": 5649.1, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 5.488888888888889, |
| "grad_norm": 0.656500574854733, |
| "learning_rate": 5.429733607496674e-06, |
| "loss": 0.161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15013918280601501, |
| "step": 2470, |
| "valid_targets_mean": 3773.6, |
| "valid_targets_min": 442 |
| }, |
| { |
| "epoch": 5.5, |
| "grad_norm": 0.5765586477143745, |
| "learning_rate": 5.354046170040537e-06, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18464767932891846, |
| "step": 2475, |
| "valid_targets_mean": 4310.9, |
| "valid_targets_min": 359 |
| }, |
| { |
| "epoch": 5.511111111111111, |
| "grad_norm": 0.513219195279251, |
| "learning_rate": 5.278808357301186e-06, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16760313510894775, |
| "step": 2480, |
| "valid_targets_mean": 4913.3, |
| "valid_targets_min": 259 |
| }, |
| { |
| "epoch": 5.522222222222222, |
| "grad_norm": 0.6307469353575386, |
| "learning_rate": 5.204022479048325e-06, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18006855249404907, |
| "step": 2485, |
| "valid_targets_mean": 3771.8, |
| "valid_targets_min": 419 |
| }, |
| { |
| "epoch": 5.533333333333333, |
| "grad_norm": 0.6063474311283815, |
| "learning_rate": 5.129690831177425e-06, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1837840974330902, |
| "step": 2490, |
| "valid_targets_mean": 3647.8, |
| "valid_targets_min": 524 |
| }, |
| { |
| "epoch": 5.544444444444444, |
| "grad_norm": 0.5318846921681258, |
| "learning_rate": 5.055815695639303e-06, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1946224868297577, |
| "step": 2495, |
| "valid_targets_mean": 4591.3, |
| "valid_targets_min": 433 |
| }, |
| { |
| "epoch": 5.555555555555555, |
| "grad_norm": 0.593321647760732, |
| "learning_rate": 4.982399340370017e-06, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18851664662361145, |
| "step": 2500, |
| "valid_targets_mean": 4363.1, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 5.566666666666666, |
| "grad_norm": 0.5435021274855566, |
| "learning_rate": 4.909444019221274e-06, |
| "loss": 0.1647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1688232570886612, |
| "step": 2505, |
| "valid_targets_mean": 4495.8, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 5.5777777777777775, |
| "grad_norm": 0.4945201322111143, |
| "learning_rate": 4.836951971891215e-06, |
| "loss": 0.1613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14214378595352173, |
| "step": 2510, |
| "valid_targets_mean": 5189.9, |
| "valid_targets_min": 1223 |
| }, |
| { |
| "epoch": 5.588888888888889, |
| "grad_norm": 0.5455726240398745, |
| "learning_rate": 4.764925423855669e-06, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1754768192768097, |
| "step": 2515, |
| "valid_targets_mean": 4304.2, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 5.6, |
| "grad_norm": 0.6294730140787744, |
| "learning_rate": 4.693366586299824e-06, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15617169439792633, |
| "step": 2520, |
| "valid_targets_mean": 3736.4, |
| "valid_targets_min": 218 |
| }, |
| { |
| "epoch": 5.611111111111111, |
| "grad_norm": 0.5250062129007003, |
| "learning_rate": 4.622277656050369e-06, |
| "loss": 0.1782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17956486344337463, |
| "step": 2525, |
| "valid_targets_mean": 5230.8, |
| "valid_targets_min": 2431 |
| }, |
| { |
| "epoch": 5.622222222222222, |
| "grad_norm": 0.7086051651918763, |
| "learning_rate": 4.551660815508012e-06, |
| "loss": 0.1786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1606767177581787, |
| "step": 2530, |
| "valid_targets_mean": 4573.8, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 5.633333333333333, |
| "grad_norm": 0.48064688634395325, |
| "learning_rate": 4.481518232580515e-06, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1643509864807129, |
| "step": 2535, |
| "valid_targets_mean": 5939.2, |
| "valid_targets_min": 2884 |
| }, |
| { |
| "epoch": 5.644444444444445, |
| "grad_norm": 0.5324700467948121, |
| "learning_rate": 4.411852060616115e-06, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1770201474428177, |
| "step": 2540, |
| "valid_targets_mean": 5397.2, |
| "valid_targets_min": 283 |
| }, |
| { |
| "epoch": 5.655555555555556, |
| "grad_norm": 0.5436206325195655, |
| "learning_rate": 4.342664438337447e-06, |
| "loss": 0.1792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14190086722373962, |
| "step": 2545, |
| "valid_targets_mean": 4431.3, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 5.666666666666667, |
| "grad_norm": 0.4773318240610541, |
| "learning_rate": 4.273957489775862e-06, |
| "loss": 0.1726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15811610221862793, |
| "step": 2550, |
| "valid_targets_mean": 4552.0, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 5.677777777777778, |
| "grad_norm": 0.5208734691655355, |
| "learning_rate": 4.205733324206216e-06, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16764241456985474, |
| "step": 2555, |
| "valid_targets_mean": 4251.2, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 5.688888888888889, |
| "grad_norm": 0.4928403449962443, |
| "learning_rate": 4.137994036082138e-06, |
| "loss": 0.1731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.175938218832016, |
| "step": 2560, |
| "valid_targets_mean": 5055.7, |
| "valid_targets_min": 365 |
| }, |
| { |
| "epoch": 5.7, |
| "grad_norm": 0.5244262215031825, |
| "learning_rate": 4.070741704971726e-06, |
| "loss": 0.1744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2002006471157074, |
| "step": 2565, |
| "valid_targets_mean": 4992.8, |
| "valid_targets_min": 377 |
| }, |
| { |
| "epoch": 5.711111111111111, |
| "grad_norm": 0.661490029880272, |
| "learning_rate": 4.003978395493682e-06, |
| "loss": 0.1849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1974271535873413, |
| "step": 2570, |
| "valid_targets_mean": 3547.4, |
| "valid_targets_min": 490 |
| }, |
| { |
| "epoch": 5.722222222222222, |
| "grad_norm": 1.7114236198419897, |
| "learning_rate": 3.937706157253971e-06, |
| "loss": 0.1776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20456838607788086, |
| "step": 2575, |
| "valid_targets_mean": 3842.5, |
| "valid_targets_min": 206 |
| }, |
| { |
| "epoch": 5.733333333333333, |
| "grad_norm": 0.6837291674161498, |
| "learning_rate": 3.871927024782838e-06, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14637309312820435, |
| "step": 2580, |
| "valid_targets_mean": 4026.7, |
| "valid_targets_min": 469 |
| }, |
| { |
| "epoch": 5.7444444444444445, |
| "grad_norm": 0.7514815970637514, |
| "learning_rate": 3.80664301747242e-06, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18412163853645325, |
| "step": 2585, |
| "valid_targets_mean": 2986.9, |
| "valid_targets_min": 295 |
| }, |
| { |
| "epoch": 5.7555555555555555, |
| "grad_norm": 0.5388048398379085, |
| "learning_rate": 3.741856139514706e-06, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16334733366966248, |
| "step": 2590, |
| "valid_targets_mean": 4902.1, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 5.766666666666667, |
| "grad_norm": 0.5233222496715474, |
| "learning_rate": 3.677568379840011e-06, |
| "loss": 0.1621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16272562742233276, |
| "step": 2595, |
| "valid_targets_mean": 4434.1, |
| "valid_targets_min": 462 |
| }, |
| { |
| "epoch": 5.777777777777778, |
| "grad_norm": 0.5705709741002777, |
| "learning_rate": 3.613781712055935e-06, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17690132558345795, |
| "step": 2600, |
| "valid_targets_mean": 4264.3, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 5.788888888888889, |
| "grad_norm": 0.5479756129178118, |
| "learning_rate": 3.5504980943867538e-06, |
| "loss": 0.1806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16624002158641815, |
| "step": 2605, |
| "valid_targets_mean": 5080.0, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 5.8, |
| "grad_norm": 0.6635653151891525, |
| "learning_rate": 3.487719469613331e-06, |
| "loss": 0.1811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2028333991765976, |
| "step": 2610, |
| "valid_targets_mean": 3572.5, |
| "valid_targets_min": 367 |
| }, |
| { |
| "epoch": 5.811111111111111, |
| "grad_norm": 0.44665022968089857, |
| "learning_rate": 3.4254477650134367e-06, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1494394838809967, |
| "step": 2615, |
| "valid_targets_mean": 5941.5, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 5.822222222222222, |
| "grad_norm": 0.661754201811149, |
| "learning_rate": 3.3636848923026257e-06, |
| "loss": 0.17, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18834251165390015, |
| "step": 2620, |
| "valid_targets_mean": 2994.5, |
| "valid_targets_min": 393 |
| }, |
| { |
| "epoch": 5.833333333333333, |
| "grad_norm": 0.6849647049787121, |
| "learning_rate": 3.30243274757549e-06, |
| "loss": 0.1702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16348251700401306, |
| "step": 2625, |
| "valid_targets_mean": 2972.6, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 5.844444444444444, |
| "grad_norm": 0.6231070446255984, |
| "learning_rate": 3.2416932112475207e-06, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15320156514644623, |
| "step": 2630, |
| "valid_targets_mean": 4418.4, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 5.855555555555555, |
| "grad_norm": 0.5713999743603262, |
| "learning_rate": 3.1814681479973154e-06, |
| "loss": 0.1538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16935516893863678, |
| "step": 2635, |
| "valid_targets_mean": 4568.5, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 5.866666666666667, |
| "grad_norm": 1.2779543648973395, |
| "learning_rate": 3.121759406709386e-06, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18024687469005585, |
| "step": 2640, |
| "valid_targets_mean": 4624.9, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 5.877777777777778, |
| "grad_norm": 0.527748772279261, |
| "learning_rate": 3.062568820417353e-06, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19535987079143524, |
| "step": 2645, |
| "valid_targets_mean": 5047.5, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 5.888888888888889, |
| "grad_norm": 0.5667121076341758, |
| "learning_rate": 3.003898206247704e-06, |
| "loss": 0.1781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1724199652671814, |
| "step": 2650, |
| "valid_targets_mean": 4225.3, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 5.9, |
| "grad_norm": 0.5448499086146226, |
| "learning_rate": 2.9457493653639856e-06, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16028910875320435, |
| "step": 2655, |
| "valid_targets_mean": 4420.4, |
| "valid_targets_min": 2211 |
| }, |
| { |
| "epoch": 5.911111111111111, |
| "grad_norm": 0.5833160229189241, |
| "learning_rate": 2.8881240829115453e-06, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.173763245344162, |
| "step": 2660, |
| "valid_targets_mean": 3861.1, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 5.9222222222222225, |
| "grad_norm": 0.5633050658584287, |
| "learning_rate": 2.8310241279626784e-06, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18552720546722412, |
| "step": 2665, |
| "valid_targets_mean": 4328.1, |
| "valid_targets_min": 406 |
| }, |
| { |
| "epoch": 5.933333333333334, |
| "grad_norm": 0.6139575137201317, |
| "learning_rate": 2.774451253462356e-06, |
| "loss": 0.1904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17860981822013855, |
| "step": 2670, |
| "valid_targets_mean": 3716.5, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 5.944444444444445, |
| "grad_norm": 0.5214170522074714, |
| "learning_rate": 2.718407196174391e-06, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18364687263965607, |
| "step": 2675, |
| "valid_targets_mean": 5053.6, |
| "valid_targets_min": 238 |
| }, |
| { |
| "epoch": 5.955555555555556, |
| "grad_norm": 0.6469395857790785, |
| "learning_rate": 2.6628936766281375e-06, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19230781495571136, |
| "step": 2680, |
| "valid_targets_mean": 3862.8, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 5.966666666666667, |
| "grad_norm": 0.5114626457093362, |
| "learning_rate": 2.607912399065646e-06, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1596902310848236, |
| "step": 2685, |
| "valid_targets_mean": 5641.2, |
| "valid_targets_min": 306 |
| }, |
| { |
| "epoch": 5.977777777777778, |
| "grad_norm": 0.5327080602996671, |
| "learning_rate": 2.5534650513893787e-06, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14958997070789337, |
| "step": 2690, |
| "valid_targets_mean": 5039.9, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 5.988888888888889, |
| "grad_norm": 0.6076035884975858, |
| "learning_rate": 2.4995533051103448e-06, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15890420973300934, |
| "step": 2695, |
| "valid_targets_mean": 3991.2, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 6.0, |
| "grad_norm": 0.5398509197397203, |
| "learning_rate": 2.446178815296838e-06, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.159483402967453, |
| "step": 2700, |
| "valid_targets_mean": 4043.2, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 6.011111111111111, |
| "grad_norm": 0.5913571273369431, |
| "learning_rate": 2.393343220523581e-06, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17935341596603394, |
| "step": 2705, |
| "valid_targets_mean": 4581.9, |
| "valid_targets_min": 1063 |
| }, |
| { |
| "epoch": 6.022222222222222, |
| "grad_norm": 0.66752029438305, |
| "learning_rate": 2.3410481428214602e-06, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1461348831653595, |
| "step": 2710, |
| "valid_targets_mean": 3675.8, |
| "valid_targets_min": 489 |
| }, |
| { |
| "epoch": 6.033333333333333, |
| "grad_norm": 0.5056815928149037, |
| "learning_rate": 2.2892951876276983e-06, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17451688647270203, |
| "step": 2715, |
| "valid_targets_mean": 4982.4, |
| "valid_targets_min": 193 |
| }, |
| { |
| "epoch": 6.044444444444444, |
| "grad_norm": 0.5787722267858811, |
| "learning_rate": 2.2380859437365855e-06, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1561371088027954, |
| "step": 2720, |
| "valid_targets_mean": 4155.3, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 6.055555555555555, |
| "grad_norm": 0.5915320981288767, |
| "learning_rate": 2.187421983250695e-06, |
| "loss": 0.1584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16373848915100098, |
| "step": 2725, |
| "valid_targets_mean": 3869.1, |
| "valid_targets_min": 291 |
| }, |
| { |
| "epoch": 6.066666666666666, |
| "grad_norm": 0.6317568161952004, |
| "learning_rate": 2.1373048615326385e-06, |
| "loss": 0.156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1501501202583313, |
| "step": 2730, |
| "valid_targets_mean": 3157.3, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 6.0777777777777775, |
| "grad_norm": 0.5928916539006913, |
| "learning_rate": 2.0877361171572953e-06, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16607831418514252, |
| "step": 2735, |
| "valid_targets_mean": 5381.1, |
| "valid_targets_min": 366 |
| }, |
| { |
| "epoch": 6.088888888888889, |
| "grad_norm": 0.5449211144644974, |
| "learning_rate": 2.0387172718645853e-06, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14824213087558746, |
| "step": 2740, |
| "valid_targets_mean": 4073.2, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 6.1, |
| "grad_norm": 0.5683455633442686, |
| "learning_rate": 1.990249830512756e-06, |
| "loss": 0.153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16184581816196442, |
| "step": 2745, |
| "valid_targets_mean": 4750.2, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 6.111111111111111, |
| "grad_norm": 0.42667335878897045, |
| "learning_rate": 1.942335281032188e-06, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12961864471435547, |
| "step": 2750, |
| "valid_targets_mean": 6349.4, |
| "valid_targets_min": 2625 |
| }, |
| { |
| "epoch": 6.122222222222222, |
| "grad_norm": 0.5436823867806183, |
| "learning_rate": 1.8949750943797051e-06, |
| "loss": 0.1562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14522790908813477, |
| "step": 2755, |
| "valid_targets_mean": 4269.0, |
| "valid_targets_min": 324 |
| }, |
| { |
| "epoch": 6.133333333333334, |
| "grad_norm": 0.6448799255936731, |
| "learning_rate": 1.8481707244934232e-06, |
| "loss": 0.1582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15584322810173035, |
| "step": 2760, |
| "valid_targets_mean": 4016.6, |
| "valid_targets_min": 445 |
| }, |
| { |
| "epoch": 6.144444444444445, |
| "grad_norm": 0.5421598615393723, |
| "learning_rate": 1.8019236082481063e-06, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1767968237400055, |
| "step": 2765, |
| "valid_targets_mean": 4966.3, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 6.155555555555556, |
| "grad_norm": 0.5685111593837506, |
| "learning_rate": 1.7562351654110776e-06, |
| "loss": 0.1602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1697826236486435, |
| "step": 2770, |
| "valid_targets_mean": 4455.9, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 6.166666666666667, |
| "grad_norm": 0.5013193289509864, |
| "learning_rate": 1.711106798598603e-06, |
| "loss": 0.1553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14647771418094635, |
| "step": 2775, |
| "valid_targets_mean": 4696.4, |
| "valid_targets_min": 1329 |
| }, |
| { |
| "epoch": 6.177777777777778, |
| "grad_norm": 0.5765680957861777, |
| "learning_rate": 1.6665398932328615e-06, |
| "loss": 0.1843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21099118888378143, |
| "step": 2780, |
| "valid_targets_mean": 4673.8, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 6.188888888888889, |
| "grad_norm": 0.6071624204964592, |
| "learning_rate": 1.6225358174993866e-06, |
| "loss": 0.1653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15273860096931458, |
| "step": 2785, |
| "valid_targets_mean": 4286.6, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 6.2, |
| "grad_norm": 0.6182352698209433, |
| "learning_rate": 1.5790959223050761e-06, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19237971305847168, |
| "step": 2790, |
| "valid_targets_mean": 3695.6, |
| "valid_targets_min": 344 |
| }, |
| { |
| "epoch": 6.211111111111111, |
| "grad_norm": 0.588213406617714, |
| "learning_rate": 1.5362215412367198e-06, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15135380625724792, |
| "step": 2795, |
| "valid_targets_mean": 3756.7, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 6.222222222222222, |
| "grad_norm": 0.6346814814248117, |
| "learning_rate": 1.493913990520066e-06, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20901688933372498, |
| "step": 2800, |
| "valid_targets_mean": 4734.8, |
| "valid_targets_min": 360 |
| }, |
| { |
| "epoch": 6.233333333333333, |
| "grad_norm": 0.6257271615557687, |
| "learning_rate": 1.4521745689793942e-06, |
| "loss": 0.1676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15938270092010498, |
| "step": 2805, |
| "valid_targets_mean": 5421.2, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 6.2444444444444445, |
| "grad_norm": 0.559553595120576, |
| "learning_rate": 1.4110045579976638e-06, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16130048036575317, |
| "step": 2810, |
| "valid_targets_mean": 4333.5, |
| "valid_targets_min": 586 |
| }, |
| { |
| "epoch": 6.2555555555555555, |
| "grad_norm": 0.5866773758858824, |
| "learning_rate": 1.3704052214771513e-06, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20442438125610352, |
| "step": 2815, |
| "valid_targets_mean": 4559.4, |
| "valid_targets_min": 491 |
| }, |
| { |
| "epoch": 6.266666666666667, |
| "grad_norm": 0.5344071459257823, |
| "learning_rate": 1.3303778058006844e-06, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1532367765903473, |
| "step": 2820, |
| "valid_targets_mean": 4964.8, |
| "valid_targets_min": 1225 |
| }, |
| { |
| "epoch": 6.277777777777778, |
| "grad_norm": 0.4690750876544389, |
| "learning_rate": 1.2909235397933429e-06, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18918469548225403, |
| "step": 2825, |
| "valid_targets_mean": 6092.4, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 6.288888888888889, |
| "grad_norm": 0.5452380646504179, |
| "learning_rate": 1.2520436346847498e-06, |
| "loss": 0.1513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1750721037387848, |
| "step": 2830, |
| "valid_targets_mean": 4615.1, |
| "valid_targets_min": 231 |
| }, |
| { |
| "epoch": 6.3, |
| "grad_norm": 0.7863745243804952, |
| "learning_rate": 1.213739284071891e-06, |
| "loss": 0.158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1903843879699707, |
| "step": 2835, |
| "valid_targets_mean": 3657.9, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 6.311111111111111, |
| "grad_norm": 0.5931382218715537, |
| "learning_rate": 1.176011663882466e-06, |
| "loss": 0.1702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17225001752376556, |
| "step": 2840, |
| "valid_targets_mean": 3728.6, |
| "valid_targets_min": 394 |
| }, |
| { |
| "epoch": 6.322222222222222, |
| "grad_norm": 0.5189346871656337, |
| "learning_rate": 1.1388619323387884e-06, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17915725708007812, |
| "step": 2845, |
| "valid_targets_mean": 5191.2, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 6.333333333333333, |
| "grad_norm": 0.5685337335007038, |
| "learning_rate": 1.1022912299222387e-06, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16851413249969482, |
| "step": 2850, |
| "valid_targets_mean": 4485.8, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 6.344444444444444, |
| "grad_norm": 0.7195861370160256, |
| "learning_rate": 1.0663006793382214e-06, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1574927270412445, |
| "step": 2855, |
| "valid_targets_mean": 3559.8, |
| "valid_targets_min": 576 |
| }, |
| { |
| "epoch": 6.355555555555555, |
| "grad_norm": 0.5762158096256034, |
| "learning_rate": 1.0308913854817425e-06, |
| "loss": 0.1641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1543298363685608, |
| "step": 2860, |
| "valid_targets_mean": 4227.9, |
| "valid_targets_min": 450 |
| }, |
| { |
| "epoch": 6.366666666666666, |
| "grad_norm": 0.581243646224178, |
| "learning_rate": 9.960644354034544e-07, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16603925824165344, |
| "step": 2865, |
| "valid_targets_mean": 3848.9, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 6.377777777777778, |
| "grad_norm": 0.5860189314743979, |
| "learning_rate": 9.618208982763045e-07, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17424118518829346, |
| "step": 2870, |
| "valid_targets_mean": 4603.6, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 6.388888888888889, |
| "grad_norm": 0.5260553051504206, |
| "learning_rate": 9.281618253626967e-07, |
| "loss": 0.1904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1587425321340561, |
| "step": 2875, |
| "valid_targets_mean": 4868.8, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 6.4, |
| "grad_norm": 0.5709882539258184, |
| "learning_rate": 8.950882499822322e-07, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18391573429107666, |
| "step": 2880, |
| "valid_targets_mean": 4826.9, |
| "valid_targets_min": 955 |
| }, |
| { |
| "epoch": 6.411111111111111, |
| "grad_norm": 0.5644788262306717, |
| "learning_rate": 8.626011874799723e-07, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18057206273078918, |
| "step": 2885, |
| "valid_targets_mean": 4512.6, |
| "valid_targets_min": 219 |
| }, |
| { |
| "epoch": 6.4222222222222225, |
| "grad_norm": 0.576346831291659, |
| "learning_rate": 8.307016351952857e-07, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.166375070810318, |
| "step": 2890, |
| "valid_targets_mean": 4210.4, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 6.433333333333334, |
| "grad_norm": 0.5757462663579878, |
| "learning_rate": 7.993905724312156e-07, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1599673181772232, |
| "step": 2895, |
| "valid_targets_mean": 4139.4, |
| "valid_targets_min": 566 |
| }, |
| { |
| "epoch": 6.444444444444445, |
| "grad_norm": 0.5623689294928453, |
| "learning_rate": 7.686689604244191e-07, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19040706753730774, |
| "step": 2900, |
| "valid_targets_mean": 4728.7, |
| "valid_targets_min": 992 |
| }, |
| { |
| "epoch": 6.455555555555556, |
| "grad_norm": 0.598246014236927, |
| "learning_rate": 7.385377423156592e-07, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1700592339038849, |
| "step": 2905, |
| "valid_targets_mean": 3927.4, |
| "valid_targets_min": 507 |
| }, |
| { |
| "epoch": 6.466666666666667, |
| "grad_norm": 0.6203480477245517, |
| "learning_rate": 7.0899784312086e-07, |
| "loss": 0.1654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1759098470211029, |
| "step": 2910, |
| "valid_targets_mean": 3698.8, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 6.477777777777778, |
| "grad_norm": 0.7017472734434613, |
| "learning_rate": 6.800501697026817e-07, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1844363808631897, |
| "step": 2915, |
| "valid_targets_mean": 3652.4, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 6.488888888888889, |
| "grad_norm": 0.8080719060022912, |
| "learning_rate": 6.516956107427241e-07, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1818864643573761, |
| "step": 2920, |
| "valid_targets_mean": 3598.4, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 6.5, |
| "grad_norm": 0.6080050661997464, |
| "learning_rate": 6.239350367141872e-07, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1631316989660263, |
| "step": 2925, |
| "valid_targets_mean": 3850.2, |
| "valid_targets_min": 577 |
| }, |
| { |
| "epoch": 6.511111111111111, |
| "grad_norm": 0.5218209158596074, |
| "learning_rate": 5.967692998552088e-07, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1616230010986328, |
| "step": 2930, |
| "valid_targets_mean": 4195.7, |
| "valid_targets_min": 214 |
| }, |
| { |
| "epoch": 6.522222222222222, |
| "grad_norm": 0.583948409979544, |
| "learning_rate": 5.701992341426499e-07, |
| "loss": 0.1708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16667166352272034, |
| "step": 2935, |
| "valid_targets_mean": 4227.6, |
| "valid_targets_min": 443 |
| }, |
| { |
| "epoch": 6.533333333333333, |
| "grad_norm": 0.6357686417725928, |
| "learning_rate": 5.442256552665326e-07, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1789218783378601, |
| "step": 2940, |
| "valid_targets_mean": 4223.6, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 6.544444444444444, |
| "grad_norm": 0.5545850268570705, |
| "learning_rate": 5.188493606049672e-07, |
| "loss": 0.15, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16391915082931519, |
| "step": 2945, |
| "valid_targets_mean": 4468.6, |
| "valid_targets_min": 306 |
| }, |
| { |
| "epoch": 6.555555555555555, |
| "grad_norm": 0.5370700566695868, |
| "learning_rate": 4.940711291996891e-07, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1655001938343048, |
| "step": 2950, |
| "valid_targets_mean": 4653.1, |
| "valid_targets_min": 524 |
| }, |
| { |
| "epoch": 6.566666666666666, |
| "grad_norm": 0.5816674164537832, |
| "learning_rate": 4.698917217321408e-07, |
| "loss": 0.1593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16322006285190582, |
| "step": 2955, |
| "valid_targets_mean": 4279.8, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 6.5777777777777775, |
| "grad_norm": 0.591268448436149, |
| "learning_rate": 4.4631188050011654e-07, |
| "loss": 0.1577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15823054313659668, |
| "step": 2960, |
| "valid_targets_mean": 4439.2, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 6.588888888888889, |
| "grad_norm": 0.5923470499206334, |
| "learning_rate": 4.2333232939498094e-07, |
| "loss": 0.163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15806478261947632, |
| "step": 2965, |
| "valid_targets_mean": 4299.8, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 6.6, |
| "grad_norm": 0.604171037099629, |
| "learning_rate": 4.009537738794289e-07, |
| "loss": 0.1624, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18534332513809204, |
| "step": 2970, |
| "valid_targets_mean": 3794.3, |
| "valid_targets_min": 1163 |
| }, |
| { |
| "epoch": 6.611111111111111, |
| "grad_norm": 0.5959118836475591, |
| "learning_rate": 3.791769009658497e-07, |
| "loss": 0.1744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17430004477500916, |
| "step": 2975, |
| "valid_targets_mean": 4548.9, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 6.622222222222222, |
| "grad_norm": 0.7602527640872502, |
| "learning_rate": 3.5800237919522363e-07, |
| "loss": 0.1696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1884760558605194, |
| "step": 2980, |
| "valid_targets_mean": 4584.7, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 6.633333333333333, |
| "grad_norm": 0.5214769514587413, |
| "learning_rate": 3.3743085861659643e-07, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16529062390327454, |
| "step": 2985, |
| "valid_targets_mean": 4972.1, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 6.644444444444445, |
| "grad_norm": 0.5344722245636476, |
| "learning_rate": 3.1746297076713504e-07, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14969675242900848, |
| "step": 2990, |
| "valid_targets_mean": 4986.3, |
| "valid_targets_min": 1685 |
| }, |
| { |
| "epoch": 6.655555555555556, |
| "grad_norm": 0.5351628577936627, |
| "learning_rate": 2.9809932865271893e-07, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16871917247772217, |
| "step": 2995, |
| "valid_targets_mean": 4784.9, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 6.666666666666667, |
| "grad_norm": 0.5030921817708136, |
| "learning_rate": 2.793405267291505e-07, |
| "loss": 0.1637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15890008211135864, |
| "step": 3000, |
| "valid_targets_mean": 5473.4, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 6.677777777777778, |
| "grad_norm": 0.6571885910780609, |
| "learning_rate": 2.6118714088386954e-07, |
| "loss": 0.168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18136438727378845, |
| "step": 3005, |
| "valid_targets_mean": 3401.2, |
| "valid_targets_min": 257 |
| }, |
| { |
| "epoch": 6.688888888888889, |
| "grad_norm": 0.6046227631736789, |
| "learning_rate": 2.436397284183123e-07, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1641228199005127, |
| "step": 3010, |
| "valid_targets_mean": 3765.2, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 6.7, |
| "grad_norm": 0.5844047544930174, |
| "learning_rate": 2.2669882803076916e-07, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15143552422523499, |
| "step": 3015, |
| "valid_targets_mean": 4498.2, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 6.711111111111111, |
| "grad_norm": 0.6149713586123504, |
| "learning_rate": 2.1036495979986692e-07, |
| "loss": 0.158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15604856610298157, |
| "step": 3020, |
| "valid_targets_mean": 3861.8, |
| "valid_targets_min": 225 |
| }, |
| { |
| "epoch": 6.722222222222222, |
| "grad_norm": 0.5723560396309636, |
| "learning_rate": 1.9463862516859277e-07, |
| "loss": 0.1565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12534162402153015, |
| "step": 3025, |
| "valid_targets_mean": 3602.2, |
| "valid_targets_min": 401 |
| }, |
| { |
| "epoch": 6.733333333333333, |
| "grad_norm": 0.4850032616094909, |
| "learning_rate": 1.7952030692891086e-07, |
| "loss": 0.165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1640266627073288, |
| "step": 3030, |
| "valid_targets_mean": 4796.8, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 6.7444444444444445, |
| "grad_norm": 0.5571942927801525, |
| "learning_rate": 1.6501046920692986e-07, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18630409240722656, |
| "step": 3035, |
| "valid_targets_mean": 4979.9, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 6.7555555555555555, |
| "grad_norm": 0.6261160646072778, |
| "learning_rate": 1.511095574486543e-07, |
| "loss": 0.1509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13854405283927917, |
| "step": 3040, |
| "valid_targets_mean": 3824.3, |
| "valid_targets_min": 449 |
| }, |
| { |
| "epoch": 6.766666666666667, |
| "grad_norm": 0.6318415495546549, |
| "learning_rate": 1.378179984063177e-07, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.186091810464859, |
| "step": 3045, |
| "valid_targets_mean": 4292.3, |
| "valid_targets_min": 389 |
| }, |
| { |
| "epoch": 6.777777777777778, |
| "grad_norm": 0.6057679446128716, |
| "learning_rate": 1.2513620012528427e-07, |
| "loss": 0.1819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18621055781841278, |
| "step": 3050, |
| "valid_targets_mean": 4053.4, |
| "valid_targets_min": 289 |
| }, |
| { |
| "epoch": 6.788888888888889, |
| "grad_norm": 0.8744644549026661, |
| "learning_rate": 1.1306455193150323e-07, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20955529808998108, |
| "step": 3055, |
| "valid_targets_mean": 3671.4, |
| "valid_targets_min": 482 |
| }, |
| { |
| "epoch": 6.8, |
| "grad_norm": 0.6599223412568986, |
| "learning_rate": 1.0160342441957626e-07, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19978420436382294, |
| "step": 3060, |
| "valid_targets_mean": 3478.9, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 6.811111111111111, |
| "grad_norm": 0.5322339408865758, |
| "learning_rate": 9.07531694413688e-08, |
| "loss": 0.1676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14194843173027039, |
| "step": 3065, |
| "valid_targets_mean": 5484.3, |
| "valid_targets_min": 2467 |
| }, |
| { |
| "epoch": 6.822222222222222, |
| "grad_norm": 0.5448297735203173, |
| "learning_rate": 8.051412009521864e-08, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15910744667053223, |
| "step": 3070, |
| "valid_targets_mean": 4950.7, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 6.833333333333333, |
| "grad_norm": 0.5207228811956566, |
| "learning_rate": 7.08865907156997e-08, |
| "loss": 0.165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15996085107326508, |
| "step": 3075, |
| "valid_targets_mean": 5696.6, |
| "valid_targets_min": 1801 |
| }, |
| { |
| "epoch": 6.844444444444444, |
| "grad_norm": 0.588737424620841, |
| "learning_rate": 6.187087686397641e-08, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16847629845142365, |
| "step": 3080, |
| "valid_targets_mean": 3962.7, |
| "valid_targets_min": 243 |
| }, |
| { |
| "epoch": 6.855555555555555, |
| "grad_norm": 0.8953529078704728, |
| "learning_rate": 5.3467255318726544e-08, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1842920035123825, |
| "step": 3085, |
| "valid_targets_mean": 3766.0, |
| "valid_targets_min": 436 |
| }, |
| { |
| "epoch": 6.866666666666667, |
| "grad_norm": 0.6312232512655556, |
| "learning_rate": 4.567598406765461e-08, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14916302263736725, |
| "step": 3090, |
| "valid_targets_mean": 4468.3, |
| "valid_targets_min": 292 |
| }, |
| { |
| "epoch": 6.877777777777778, |
| "grad_norm": 0.5616637532565867, |
| "learning_rate": 3.84973022995605e-08, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13993391394615173, |
| "step": 3095, |
| "valid_targets_mean": 4598.1, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 6.888888888888889, |
| "grad_norm": 0.5833668585034318, |
| "learning_rate": 3.193143039700086e-08, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1864895224571228, |
| "step": 3100, |
| "valid_targets_mean": 4208.8, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 6.9, |
| "grad_norm": 0.571580775093832, |
| "learning_rate": 2.597856992952341e-08, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16089646518230438, |
| "step": 3105, |
| "valid_targets_mean": 5259.4, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 6.911111111111111, |
| "grad_norm": 0.5133595187461827, |
| "learning_rate": 2.063890364748078e-08, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1508500874042511, |
| "step": 3110, |
| "valid_targets_mean": 5170.9, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 6.9222222222222225, |
| "grad_norm": 0.5585279295675786, |
| "learning_rate": 1.5912595476414993e-08, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17111481726169586, |
| "step": 3115, |
| "valid_targets_mean": 4617.8, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 6.933333333333334, |
| "grad_norm": 0.5333435138003515, |
| "learning_rate": 1.1799790512030395e-08, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14488770067691803, |
| "step": 3120, |
| "valid_targets_mean": 4679.4, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 6.944444444444445, |
| "grad_norm": 0.5560785893229921, |
| "learning_rate": 8.300615015734981e-09, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14593376219272614, |
| "step": 3125, |
| "valid_targets_mean": 4246.2, |
| "valid_targets_min": 616 |
| }, |
| { |
| "epoch": 6.955555555555556, |
| "grad_norm": 0.7126140858082262, |
| "learning_rate": 5.415176410765721e-09, |
| "loss": 0.1727, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18622633814811707, |
| "step": 3130, |
| "valid_targets_mean": 3116.1, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 6.966666666666667, |
| "grad_norm": 0.5293643056538982, |
| "learning_rate": 3.1435632788956448e-09, |
| "loss": 0.1711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14810457825660706, |
| "step": 3135, |
| "valid_targets_mean": 4385.9, |
| "valid_targets_min": 369 |
| }, |
| { |
| "epoch": 6.977777777777778, |
| "grad_norm": 0.6565261395938169, |
| "learning_rate": 1.4858453577071275e-09, |
| "loss": 0.1593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16837093234062195, |
| "step": 3140, |
| "valid_targets_mean": 3301.8, |
| "valid_targets_min": 361 |
| }, |
| { |
| "epoch": 6.988888888888889, |
| "grad_norm": 0.53850752681232, |
| "learning_rate": 4.4207353845360234e-10, |
| "loss": 0.1676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17763689160346985, |
| "step": 3145, |
| "valid_targets_mean": 5262.4, |
| "valid_targets_min": 2341 |
| }, |
| { |
| "epoch": 7.0, |
| "grad_norm": 0.6203043399932429, |
| "learning_rate": 1.2279864494146865e-11, |
| "loss": 0.1667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19432786107063293, |
| "step": 3150, |
| "valid_targets_mean": 4280.6, |
| "valid_targets_min": 315 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19432786107063293, |
| "step": 3150, |
| "total_flos": 1055465597173760.0, |
| "train_loss": 0.21853318925887819, |
| "train_runtime": 17876.6321, |
| "train_samples_per_second": 2.818, |
| "train_steps_per_second": 0.176, |
| "valid_targets_mean": 4280.6, |
| "valid_targets_min": 315 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 3150, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1055465597173760.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|