exp_tas_temp_0_5_traces / trainer_state.json
penfever's picture
End of training
417dcb5 verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4410,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.007936507936507936,
"grad_norm": 7.791894551319325,
"learning_rate": 3.6281179138322e-07,
"loss": 0.7972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3812609314918518,
"step": 5,
"valid_targets_mean": 2755.6,
"valid_targets_min": 1231
},
{
"epoch": 0.015873015873015872,
"grad_norm": 7.455912538367786,
"learning_rate": 8.163265306122449e-07,
"loss": 0.8212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37411224842071533,
"step": 10,
"valid_targets_mean": 3696.9,
"valid_targets_min": 1315
},
{
"epoch": 0.023809523809523808,
"grad_norm": 7.4947876547841865,
"learning_rate": 1.26984126984127e-06,
"loss": 0.798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37891465425491333,
"step": 15,
"valid_targets_mean": 3647.1,
"valid_targets_min": 1396
},
{
"epoch": 0.031746031746031744,
"grad_norm": 5.997591663796195,
"learning_rate": 1.723356009070295e-06,
"loss": 0.7689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33539754152297974,
"step": 20,
"valid_targets_mean": 2617.8,
"valid_targets_min": 1177
},
{
"epoch": 0.03968253968253968,
"grad_norm": 4.498581839487113,
"learning_rate": 2.17687074829932e-06,
"loss": 0.7181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38529515266418457,
"step": 25,
"valid_targets_mean": 3182.4,
"valid_targets_min": 2220
},
{
"epoch": 0.047619047619047616,
"grad_norm": 3.279401177139959,
"learning_rate": 2.6303854875283447e-06,
"loss": 0.6841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3477422297000885,
"step": 30,
"valid_targets_mean": 3296.5,
"valid_targets_min": 1629
},
{
"epoch": 0.05555555555555555,
"grad_norm": 2.65642172394517,
"learning_rate": 3.08390022675737e-06,
"loss": 0.697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3257293105125427,
"step": 35,
"valid_targets_mean": 3436.6,
"valid_targets_min": 1517
},
{
"epoch": 0.06349206349206349,
"grad_norm": 2.141011741114798,
"learning_rate": 3.537414965986395e-06,
"loss": 0.6551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3501768410205841,
"step": 40,
"valid_targets_mean": 3314.8,
"valid_targets_min": 615
},
{
"epoch": 0.07142857142857142,
"grad_norm": 1.4253116818930238,
"learning_rate": 3.99092970521542e-06,
"loss": 0.6421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22955095767974854,
"step": 45,
"valid_targets_mean": 2430.1,
"valid_targets_min": 1407
},
{
"epoch": 0.07936507936507936,
"grad_norm": 1.144109550309547,
"learning_rate": 4.444444444444444e-06,
"loss": 0.6267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2753365933895111,
"step": 50,
"valid_targets_mean": 3324.9,
"valid_targets_min": 1255
},
{
"epoch": 0.0873015873015873,
"grad_norm": 1.0559927514309588,
"learning_rate": 4.897959183673469e-06,
"loss": 0.5787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3343765139579773,
"step": 55,
"valid_targets_mean": 3959.4,
"valid_targets_min": 1390
},
{
"epoch": 0.09523809523809523,
"grad_norm": 1.089174983738798,
"learning_rate": 5.3514739229024945e-06,
"loss": 0.5769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2921941876411438,
"step": 60,
"valid_targets_mean": 2628.2,
"valid_targets_min": 1050
},
{
"epoch": 0.10317460317460317,
"grad_norm": 0.9352039163105647,
"learning_rate": 5.80498866213152e-06,
"loss": 0.5802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31847676634788513,
"step": 65,
"valid_targets_mean": 5229.6,
"valid_targets_min": 2258
},
{
"epoch": 0.1111111111111111,
"grad_norm": 0.7821250269316058,
"learning_rate": 6.258503401360545e-06,
"loss": 0.5822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24337267875671387,
"step": 70,
"valid_targets_mean": 3637.1,
"valid_targets_min": 731
},
{
"epoch": 0.11904761904761904,
"grad_norm": 0.8049140841034186,
"learning_rate": 6.71201814058957e-06,
"loss": 0.5711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31313028931617737,
"step": 75,
"valid_targets_mean": 3684.1,
"valid_targets_min": 1474
},
{
"epoch": 0.12698412698412698,
"grad_norm": 0.9345065106303573,
"learning_rate": 7.165532879818595e-06,
"loss": 0.5511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2718881070613861,
"step": 80,
"valid_targets_mean": 2535.2,
"valid_targets_min": 1217
},
{
"epoch": 0.1349206349206349,
"grad_norm": 0.7003907932134493,
"learning_rate": 7.61904761904762e-06,
"loss": 0.5241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26534807682037354,
"step": 85,
"valid_targets_mean": 4012.6,
"valid_targets_min": 2198
},
{
"epoch": 0.14285714285714285,
"grad_norm": 0.7511620568435198,
"learning_rate": 8.072562358276645e-06,
"loss": 0.5339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23427170515060425,
"step": 90,
"valid_targets_mean": 2802.2,
"valid_targets_min": 1022
},
{
"epoch": 0.15079365079365079,
"grad_norm": 0.8328109025616128,
"learning_rate": 8.52607709750567e-06,
"loss": 0.5245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2510078549385071,
"step": 95,
"valid_targets_mean": 2489.6,
"valid_targets_min": 1273
},
{
"epoch": 0.15873015873015872,
"grad_norm": 0.7816118772554373,
"learning_rate": 8.979591836734695e-06,
"loss": 0.4958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29513928294181824,
"step": 100,
"valid_targets_mean": 3522.4,
"valid_targets_min": 649
},
{
"epoch": 0.16666666666666666,
"grad_norm": 0.7279446724813006,
"learning_rate": 9.43310657596372e-06,
"loss": 0.5014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23042386770248413,
"step": 105,
"valid_targets_mean": 3128.6,
"valid_targets_min": 1456
},
{
"epoch": 0.1746031746031746,
"grad_norm": 0.5890418553585118,
"learning_rate": 9.886621315192746e-06,
"loss": 0.4927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21733567118644714,
"step": 110,
"valid_targets_mean": 4134.9,
"valid_targets_min": 1335
},
{
"epoch": 0.18253968253968253,
"grad_norm": 0.7116158842930445,
"learning_rate": 1.034013605442177e-05,
"loss": 0.4823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22764775156974792,
"step": 115,
"valid_targets_mean": 4014.4,
"valid_targets_min": 1400
},
{
"epoch": 0.19047619047619047,
"grad_norm": 0.8008016401079758,
"learning_rate": 1.0793650793650794e-05,
"loss": 0.4857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24580729007720947,
"step": 120,
"valid_targets_mean": 2738.6,
"valid_targets_min": 838
},
{
"epoch": 0.1984126984126984,
"grad_norm": 0.6667752435108454,
"learning_rate": 1.124716553287982e-05,
"loss": 0.4606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22335901856422424,
"step": 125,
"valid_targets_mean": 5113.5,
"valid_targets_min": 1774
},
{
"epoch": 0.20634920634920634,
"grad_norm": 0.7810365614559169,
"learning_rate": 1.1700680272108845e-05,
"loss": 0.4855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30480098724365234,
"step": 130,
"valid_targets_mean": 4073.2,
"valid_targets_min": 1473
},
{
"epoch": 0.21428571428571427,
"grad_norm": 0.5971746973534208,
"learning_rate": 1.215419501133787e-05,
"loss": 0.4614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14763841032981873,
"step": 135,
"valid_targets_mean": 3988.2,
"valid_targets_min": 824
},
{
"epoch": 0.2222222222222222,
"grad_norm": 0.6922843878731343,
"learning_rate": 1.2607709750566895e-05,
"loss": 0.4444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2036367654800415,
"step": 140,
"valid_targets_mean": 3281.9,
"valid_targets_min": 1672
},
{
"epoch": 0.23015873015873015,
"grad_norm": 0.6226231983750194,
"learning_rate": 1.3061224489795918e-05,
"loss": 0.4632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24707484245300293,
"step": 145,
"valid_targets_mean": 4809.4,
"valid_targets_min": 1577
},
{
"epoch": 0.23809523809523808,
"grad_norm": 0.8326186713780263,
"learning_rate": 1.3514739229024945e-05,
"loss": 0.4941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23414701223373413,
"step": 150,
"valid_targets_mean": 3326.1,
"valid_targets_min": 1153
},
{
"epoch": 0.24603174603174602,
"grad_norm": 0.6395050003229518,
"learning_rate": 1.3968253968253968e-05,
"loss": 0.444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22398585081100464,
"step": 155,
"valid_targets_mean": 3925.0,
"valid_targets_min": 486
},
{
"epoch": 0.25396825396825395,
"grad_norm": 0.9256622944985334,
"learning_rate": 1.4421768707482994e-05,
"loss": 0.4619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29537683725357056,
"step": 160,
"valid_targets_mean": 2947.2,
"valid_targets_min": 801
},
{
"epoch": 0.2619047619047619,
"grad_norm": 0.7551814432848716,
"learning_rate": 1.4875283446712018e-05,
"loss": 0.463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23746734857559204,
"step": 165,
"valid_targets_mean": 3384.1,
"valid_targets_min": 958
},
{
"epoch": 0.2698412698412698,
"grad_norm": 0.7006392151761067,
"learning_rate": 1.5328798185941044e-05,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23496189713478088,
"step": 170,
"valid_targets_mean": 3901.6,
"valid_targets_min": 1496
},
{
"epoch": 0.2777777777777778,
"grad_norm": 0.6782345715181035,
"learning_rate": 1.578231292517007e-05,
"loss": 0.4643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2183074653148651,
"step": 175,
"valid_targets_mean": 3844.2,
"valid_targets_min": 780
},
{
"epoch": 0.2857142857142857,
"grad_norm": 0.7454470024354803,
"learning_rate": 1.6235827664399097e-05,
"loss": 0.4341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22839799523353577,
"step": 180,
"valid_targets_mean": 3672.9,
"valid_targets_min": 741
},
{
"epoch": 0.29365079365079366,
"grad_norm": 0.7104945798231723,
"learning_rate": 1.668934240362812e-05,
"loss": 0.4184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20457884669303894,
"step": 185,
"valid_targets_mean": 3345.2,
"valid_targets_min": 1448
},
{
"epoch": 0.30158730158730157,
"grad_norm": 0.8232451122305295,
"learning_rate": 1.7142857142857142e-05,
"loss": 0.4329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19103802740573883,
"step": 190,
"valid_targets_mean": 2470.0,
"valid_targets_min": 694
},
{
"epoch": 0.30952380952380953,
"grad_norm": 0.7204209957946106,
"learning_rate": 1.759637188208617e-05,
"loss": 0.455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24723023176193237,
"step": 195,
"valid_targets_mean": 3233.0,
"valid_targets_min": 1414
},
{
"epoch": 0.31746031746031744,
"grad_norm": 0.7248505685281441,
"learning_rate": 1.8049886621315194e-05,
"loss": 0.4606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18277300894260406,
"step": 200,
"valid_targets_mean": 2704.4,
"valid_targets_min": 988
},
{
"epoch": 0.3253968253968254,
"grad_norm": 0.8433557218499257,
"learning_rate": 1.8503401360544218e-05,
"loss": 0.4426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20108163356781006,
"step": 205,
"valid_targets_mean": 2836.4,
"valid_targets_min": 874
},
{
"epoch": 0.3333333333333333,
"grad_norm": 0.7780860618594482,
"learning_rate": 1.8956916099773243e-05,
"loss": 0.4492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2229580283164978,
"step": 210,
"valid_targets_mean": 3097.6,
"valid_targets_min": 1283
},
{
"epoch": 0.3412698412698413,
"grad_norm": 0.7441717737312311,
"learning_rate": 1.941043083900227e-05,
"loss": 0.4214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16947849094867706,
"step": 215,
"valid_targets_mean": 2817.4,
"valid_targets_min": 1820
},
{
"epoch": 0.3492063492063492,
"grad_norm": 0.9092379058979357,
"learning_rate": 1.9863945578231295e-05,
"loss": 0.4468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2582654356956482,
"step": 220,
"valid_targets_mean": 2500.8,
"valid_targets_min": 949
},
{
"epoch": 0.35714285714285715,
"grad_norm": 0.6589744304007081,
"learning_rate": 2.031746031746032e-05,
"loss": 0.4167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21442869305610657,
"step": 225,
"valid_targets_mean": 4276.1,
"valid_targets_min": 1357
},
{
"epoch": 0.36507936507936506,
"grad_norm": 0.6323891462731305,
"learning_rate": 2.0770975056689343e-05,
"loss": 0.4101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1991756558418274,
"step": 230,
"valid_targets_mean": 4364.2,
"valid_targets_min": 1985
},
{
"epoch": 0.373015873015873,
"grad_norm": 0.6300499913534073,
"learning_rate": 2.122448979591837e-05,
"loss": 0.4235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1824556291103363,
"step": 235,
"valid_targets_mean": 4333.2,
"valid_targets_min": 1767
},
{
"epoch": 0.38095238095238093,
"grad_norm": 0.7575279487592979,
"learning_rate": 2.1678004535147395e-05,
"loss": 0.4325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17709918320178986,
"step": 240,
"valid_targets_mean": 2336.2,
"valid_targets_min": 563
},
{
"epoch": 0.3888888888888889,
"grad_norm": 0.7262739017659442,
"learning_rate": 2.213151927437642e-05,
"loss": 0.4123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2349386066198349,
"step": 245,
"valid_targets_mean": 3695.9,
"valid_targets_min": 820
},
{
"epoch": 0.3968253968253968,
"grad_norm": 0.6666197654683886,
"learning_rate": 2.2585034013605444e-05,
"loss": 0.4219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19883863627910614,
"step": 250,
"valid_targets_mean": 3917.5,
"valid_targets_min": 1650
},
{
"epoch": 0.40476190476190477,
"grad_norm": 0.8818322001559287,
"learning_rate": 2.3038548752834472e-05,
"loss": 0.4031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2325284481048584,
"step": 255,
"valid_targets_mean": 4317.1,
"valid_targets_min": 1046
},
{
"epoch": 0.4126984126984127,
"grad_norm": 0.8421416866948682,
"learning_rate": 2.3492063492063496e-05,
"loss": 0.4295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28885674476623535,
"step": 260,
"valid_targets_mean": 3573.9,
"valid_targets_min": 1326
},
{
"epoch": 0.42063492063492064,
"grad_norm": 0.5853157764437146,
"learning_rate": 2.394557823129252e-05,
"loss": 0.4161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15830400586128235,
"step": 265,
"valid_targets_mean": 3754.9,
"valid_targets_min": 1835
},
{
"epoch": 0.42857142857142855,
"grad_norm": 0.8503179082208167,
"learning_rate": 2.439909297052154e-05,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22213050723075867,
"step": 270,
"valid_targets_mean": 2988.8,
"valid_targets_min": 1303
},
{
"epoch": 0.4365079365079365,
"grad_norm": 0.7148417560197586,
"learning_rate": 2.4852607709750566e-05,
"loss": 0.4223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17101828753948212,
"step": 275,
"valid_targets_mean": 2654.6,
"valid_targets_min": 993
},
{
"epoch": 0.4444444444444444,
"grad_norm": 0.7488294120655374,
"learning_rate": 2.5306122448979597e-05,
"loss": 0.4057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22752045094966888,
"step": 280,
"valid_targets_mean": 3658.4,
"valid_targets_min": 628
},
{
"epoch": 0.4523809523809524,
"grad_norm": 0.819013125702064,
"learning_rate": 2.5759637188208618e-05,
"loss": 0.389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18698972463607788,
"step": 285,
"valid_targets_mean": 3620.4,
"valid_targets_min": 338
},
{
"epoch": 0.4603174603174603,
"grad_norm": 0.8764147766183873,
"learning_rate": 2.6213151927437642e-05,
"loss": 0.4258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2131589949131012,
"step": 290,
"valid_targets_mean": 2699.6,
"valid_targets_min": 998
},
{
"epoch": 0.46825396825396826,
"grad_norm": 0.7879977167108214,
"learning_rate": 2.6666666666666667e-05,
"loss": 0.4163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1819707751274109,
"step": 295,
"valid_targets_mean": 2660.6,
"valid_targets_min": 810
},
{
"epoch": 0.47619047619047616,
"grad_norm": 0.7627064380571622,
"learning_rate": 2.7120181405895694e-05,
"loss": 0.3933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2631428837776184,
"step": 300,
"valid_targets_mean": 4265.4,
"valid_targets_min": 1689
},
{
"epoch": 0.48412698412698413,
"grad_norm": 0.8689936550923171,
"learning_rate": 2.757369614512472e-05,
"loss": 0.396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1952773928642273,
"step": 305,
"valid_targets_mean": 3231.6,
"valid_targets_min": 848
},
{
"epoch": 0.49206349206349204,
"grad_norm": 0.6751339015061344,
"learning_rate": 2.8027210884353743e-05,
"loss": 0.4131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20138613879680634,
"step": 310,
"valid_targets_mean": 3902.9,
"valid_targets_min": 1826
},
{
"epoch": 0.5,
"grad_norm": 0.8543806139476121,
"learning_rate": 2.8480725623582767e-05,
"loss": 0.4131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23939643800258636,
"step": 315,
"valid_targets_mean": 3292.4,
"valid_targets_min": 1588
},
{
"epoch": 0.5079365079365079,
"grad_norm": 0.7658147806021045,
"learning_rate": 2.893424036281179e-05,
"loss": 0.4181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23602905869483948,
"step": 320,
"valid_targets_mean": 4239.2,
"valid_targets_min": 1031
},
{
"epoch": 0.5158730158730159,
"grad_norm": 0.6595384619915944,
"learning_rate": 2.938775510204082e-05,
"loss": 0.383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23135556280612946,
"step": 325,
"valid_targets_mean": 4404.8,
"valid_targets_min": 1369
},
{
"epoch": 0.5238095238095238,
"grad_norm": 0.7133459488389239,
"learning_rate": 2.9841269841269844e-05,
"loss": 0.3921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19045504927635193,
"step": 330,
"valid_targets_mean": 3302.9,
"valid_targets_min": 881
},
{
"epoch": 0.5317460317460317,
"grad_norm": 0.816501934646045,
"learning_rate": 3.0294784580498868e-05,
"loss": 0.3857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21776193380355835,
"step": 335,
"valid_targets_mean": 3168.0,
"valid_targets_min": 877
},
{
"epoch": 0.5396825396825397,
"grad_norm": 0.7547862179719467,
"learning_rate": 3.074829931972789e-05,
"loss": 0.3946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25766003131866455,
"step": 340,
"valid_targets_mean": 3334.1,
"valid_targets_min": 1054
},
{
"epoch": 0.5476190476190477,
"grad_norm": 0.7456441513111814,
"learning_rate": 3.1201814058956924e-05,
"loss": 0.3904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2486940622329712,
"step": 345,
"valid_targets_mean": 4429.5,
"valid_targets_min": 990
},
{
"epoch": 0.5555555555555556,
"grad_norm": 0.7657984461471989,
"learning_rate": 3.1655328798185945e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2721412479877472,
"step": 350,
"valid_targets_mean": 4107.6,
"valid_targets_min": 762
},
{
"epoch": 0.5634920634920635,
"grad_norm": 0.7508109310293009,
"learning_rate": 3.2108843537414965e-05,
"loss": 0.4011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2144778072834015,
"step": 355,
"valid_targets_mean": 3111.6,
"valid_targets_min": 1302
},
{
"epoch": 0.5714285714285714,
"grad_norm": 0.7203641872399225,
"learning_rate": 3.256235827664399e-05,
"loss": 0.4204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1992923766374588,
"step": 360,
"valid_targets_mean": 3283.1,
"valid_targets_min": 955
},
{
"epoch": 0.5793650793650794,
"grad_norm": 0.8767754163538739,
"learning_rate": 3.3015873015873014e-05,
"loss": 0.3836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18871556222438812,
"step": 365,
"valid_targets_mean": 2312.6,
"valid_targets_min": 1135
},
{
"epoch": 0.5873015873015873,
"grad_norm": 0.7936761727417533,
"learning_rate": 3.346938775510204e-05,
"loss": 0.4144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2474576234817505,
"step": 370,
"valid_targets_mean": 3684.5,
"valid_targets_min": 1271
},
{
"epoch": 0.5952380952380952,
"grad_norm": 0.7531283113396905,
"learning_rate": 3.392290249433107e-05,
"loss": 0.4006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2062309980392456,
"step": 375,
"valid_targets_mean": 3048.8,
"valid_targets_min": 1440
},
{
"epoch": 0.6031746031746031,
"grad_norm": 0.75475705688863,
"learning_rate": 3.437641723356009e-05,
"loss": 0.3928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1992933750152588,
"step": 380,
"valid_targets_mean": 3318.6,
"valid_targets_min": 1709
},
{
"epoch": 0.6111111111111112,
"grad_norm": 0.6780236377117146,
"learning_rate": 3.482993197278912e-05,
"loss": 0.3817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2662087678909302,
"step": 385,
"valid_targets_mean": 4945.2,
"valid_targets_min": 2317
},
{
"epoch": 0.6190476190476191,
"grad_norm": 0.7877440224609804,
"learning_rate": 3.5283446712018146e-05,
"loss": 0.3818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17678651213645935,
"step": 390,
"valid_targets_mean": 3275.4,
"valid_targets_min": 1605
},
{
"epoch": 0.626984126984127,
"grad_norm": 0.7191554661780377,
"learning_rate": 3.573696145124717e-05,
"loss": 0.3738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25680381059646606,
"step": 395,
"valid_targets_mean": 4801.4,
"valid_targets_min": 2557
},
{
"epoch": 0.6349206349206349,
"grad_norm": 0.7021848250259723,
"learning_rate": 3.6190476190476195e-05,
"loss": 0.3862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.181675523519516,
"step": 400,
"valid_targets_mean": 3404.2,
"valid_targets_min": 1675
},
{
"epoch": 0.6428571428571429,
"grad_norm": 0.7099201322215687,
"learning_rate": 3.6643990929705216e-05,
"loss": 0.3986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1909167766571045,
"step": 405,
"valid_targets_mean": 3180.8,
"valid_targets_min": 1215
},
{
"epoch": 0.6507936507936508,
"grad_norm": 0.6475933862451292,
"learning_rate": 3.7097505668934243e-05,
"loss": 0.3621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15484705567359924,
"step": 410,
"valid_targets_mean": 3154.2,
"valid_targets_min": 1356
},
{
"epoch": 0.6587301587301587,
"grad_norm": 0.7601788500031307,
"learning_rate": 3.755102040816327e-05,
"loss": 0.3862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19706499576568604,
"step": 415,
"valid_targets_mean": 3226.2,
"valid_targets_min": 959
},
{
"epoch": 0.6666666666666666,
"grad_norm": 0.7989603824606386,
"learning_rate": 3.800453514739229e-05,
"loss": 0.3795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20341980457305908,
"step": 420,
"valid_targets_mean": 2154.1,
"valid_targets_min": 1042
},
{
"epoch": 0.6746031746031746,
"grad_norm": 0.8589861103070494,
"learning_rate": 3.845804988662132e-05,
"loss": 0.4057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2528594732284546,
"step": 425,
"valid_targets_mean": 3353.6,
"valid_targets_min": 891
},
{
"epoch": 0.6825396825396826,
"grad_norm": 0.6923698776091382,
"learning_rate": 3.891156462585034e-05,
"loss": 0.3722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22147980332374573,
"step": 430,
"valid_targets_mean": 4294.6,
"valid_targets_min": 1399
},
{
"epoch": 0.6904761904761905,
"grad_norm": 0.6835864581969211,
"learning_rate": 3.936507936507937e-05,
"loss": 0.3824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19371160864830017,
"step": 435,
"valid_targets_mean": 3578.5,
"valid_targets_min": 1759
},
{
"epoch": 0.6984126984126984,
"grad_norm": 0.6628481402738557,
"learning_rate": 3.9818594104308396e-05,
"loss": 0.3852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1930302232503891,
"step": 440,
"valid_targets_mean": 3477.0,
"valid_targets_min": 1703
},
{
"epoch": 0.7063492063492064,
"grad_norm": 0.6502431105225167,
"learning_rate": 3.999994361288785e-05,
"loss": 0.378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16785907745361328,
"step": 445,
"valid_targets_mean": 3585.5,
"valid_targets_min": 1717
},
{
"epoch": 0.7142857142857143,
"grad_norm": 0.7344445982650616,
"learning_rate": 3.9999599026131644e-05,
"loss": 0.4005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26353609561920166,
"step": 450,
"valid_targets_mean": 3787.4,
"valid_targets_min": 1206
},
{
"epoch": 0.7222222222222222,
"grad_norm": 0.7393938445809128,
"learning_rate": 3.999894118418342e-05,
"loss": 0.3823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2211625725030899,
"step": 455,
"valid_targets_mean": 2948.5,
"valid_targets_min": 1663
},
{
"epoch": 0.7301587301587301,
"grad_norm": 0.6960634624059825,
"learning_rate": 3.999797009734697e-05,
"loss": 0.3951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21404457092285156,
"step": 460,
"valid_targets_mean": 3528.6,
"valid_targets_min": 1449
},
{
"epoch": 0.7380952380952381,
"grad_norm": 0.7184877621518291,
"learning_rate": 3.999668578083253e-05,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20007619261741638,
"step": 465,
"valid_targets_mean": 4320.4,
"valid_targets_min": 1497
},
{
"epoch": 0.746031746031746,
"grad_norm": 0.5728045234335117,
"learning_rate": 3.9995088254756434e-05,
"loss": 0.3815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16080446541309357,
"step": 470,
"valid_targets_mean": 4607.4,
"valid_targets_min": 1481
},
{
"epoch": 0.753968253968254,
"grad_norm": 0.6475372333254459,
"learning_rate": 3.999317754414084e-05,
"loss": 0.3492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24191340804100037,
"step": 475,
"valid_targets_mean": 4953.6,
"valid_targets_min": 586
},
{
"epoch": 0.7619047619047619,
"grad_norm": 0.6843058759524845,
"learning_rate": 3.999095367891337e-05,
"loss": 0.3727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1674070954322815,
"step": 480,
"valid_targets_mean": 3345.8,
"valid_targets_min": 1521
},
{
"epoch": 0.7698412698412699,
"grad_norm": 0.7811323772346972,
"learning_rate": 3.9988416693906563e-05,
"loss": 0.3567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17297232151031494,
"step": 485,
"valid_targets_mean": 2783.2,
"valid_targets_min": 1135
},
{
"epoch": 0.7777777777777778,
"grad_norm": 0.6346318209661107,
"learning_rate": 3.9985566628857425e-05,
"loss": 0.3618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2082044929265976,
"step": 490,
"valid_targets_mean": 3855.1,
"valid_targets_min": 2018
},
{
"epoch": 0.7857142857142857,
"grad_norm": 0.636191038245321,
"learning_rate": 3.998240352840672e-05,
"loss": 0.3734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16644376516342163,
"step": 495,
"valid_targets_mean": 3555.9,
"valid_targets_min": 1613
},
{
"epoch": 0.7936507936507936,
"grad_norm": 0.7677265538591346,
"learning_rate": 3.997892744209833e-05,
"loss": 0.382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19620782136917114,
"step": 500,
"valid_targets_mean": 3067.5,
"valid_targets_min": 755
},
{
"epoch": 0.8015873015873016,
"grad_norm": 0.6946489087789731,
"learning_rate": 3.997513842437845e-05,
"loss": 0.3817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1887287199497223,
"step": 505,
"valid_targets_mean": 3885.8,
"valid_targets_min": 1515
},
{
"epoch": 0.8095238095238095,
"grad_norm": 0.6017170952436831,
"learning_rate": 3.997103653459475e-05,
"loss": 0.3623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1097162514925003,
"step": 510,
"valid_targets_mean": 2377.0,
"valid_targets_min": 997
},
{
"epoch": 0.8174603174603174,
"grad_norm": 0.8117871434459484,
"learning_rate": 3.996662183699541e-05,
"loss": 0.3789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2122984677553177,
"step": 515,
"valid_targets_mean": 2203.6,
"valid_targets_min": 1206
},
{
"epoch": 0.8253968253968254,
"grad_norm": 1.099868973186974,
"learning_rate": 3.996189440072818e-05,
"loss": 0.3733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2121431827545166,
"step": 520,
"valid_targets_mean": 1926.2,
"valid_targets_min": 1015
},
{
"epoch": 0.8333333333333334,
"grad_norm": 0.7894079145469358,
"learning_rate": 3.9956854299839246e-05,
"loss": 0.3726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19006070494651794,
"step": 525,
"valid_targets_mean": 2125.8,
"valid_targets_min": 1140
},
{
"epoch": 0.8412698412698413,
"grad_norm": 0.5713509671754762,
"learning_rate": 3.9951501613272076e-05,
"loss": 0.3877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13354474306106567,
"step": 530,
"valid_targets_mean": 3074.2,
"valid_targets_min": 1520
},
{
"epoch": 0.8492063492063492,
"grad_norm": 0.6881625716625266,
"learning_rate": 3.994583642486618e-05,
"loss": 0.3482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1768343448638916,
"step": 535,
"valid_targets_mean": 3562.4,
"valid_targets_min": 2059
},
{
"epoch": 0.8571428571428571,
"grad_norm": 0.899503970041781,
"learning_rate": 3.993985882335584e-05,
"loss": 0.3879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21532076597213745,
"step": 540,
"valid_targets_mean": 2230.4,
"valid_targets_min": 1046
},
{
"epoch": 0.8650793650793651,
"grad_norm": 0.7723136033497726,
"learning_rate": 3.993356890236866e-05,
"loss": 0.3727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16664713621139526,
"step": 545,
"valid_targets_mean": 3265.4,
"valid_targets_min": 1553
},
{
"epoch": 0.873015873015873,
"grad_norm": 0.6301346388180525,
"learning_rate": 3.992696676042414e-05,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10019686818122864,
"step": 550,
"valid_targets_mean": 2215.4,
"valid_targets_min": 1273
},
{
"epoch": 0.8809523809523809,
"grad_norm": 0.6543508925534741,
"learning_rate": 3.992005250093211e-05,
"loss": 0.3598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17179307341575623,
"step": 555,
"valid_targets_mean": 3047.4,
"valid_targets_min": 485
},
{
"epoch": 0.8888888888888888,
"grad_norm": 0.8123556394552758,
"learning_rate": 3.991282623219113e-05,
"loss": 0.3666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1461830735206604,
"step": 560,
"valid_targets_mean": 2082.2,
"valid_targets_min": 781
},
{
"epoch": 0.8968253968253969,
"grad_norm": 0.7331475325077027,
"learning_rate": 3.9905288067386776e-05,
"loss": 0.3681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19923052191734314,
"step": 565,
"valid_targets_mean": 3274.1,
"valid_targets_min": 1872
},
{
"epoch": 0.9047619047619048,
"grad_norm": 0.7153118596407079,
"learning_rate": 3.989743812458987e-05,
"loss": 0.3826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14115799963474274,
"step": 570,
"valid_targets_mean": 2320.8,
"valid_targets_min": 693
},
{
"epoch": 0.9126984126984127,
"grad_norm": 0.7016335318916914,
"learning_rate": 3.9889276526754664e-05,
"loss": 0.3382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16912700235843658,
"step": 575,
"valid_targets_mean": 2482.8,
"valid_targets_min": 538
},
{
"epoch": 0.9206349206349206,
"grad_norm": 0.7194115163831962,
"learning_rate": 3.988080340171685e-05,
"loss": 0.3746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13386040925979614,
"step": 580,
"valid_targets_mean": 2249.6,
"valid_targets_min": 1316
},
{
"epoch": 0.9285714285714286,
"grad_norm": 0.6158476314889361,
"learning_rate": 3.987201888219161e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1599443256855011,
"step": 585,
"valid_targets_mean": 3076.1,
"valid_targets_min": 1577
},
{
"epoch": 0.9365079365079365,
"grad_norm": 0.6585146139697904,
"learning_rate": 3.986292310577153e-05,
"loss": 0.3422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14659200608730316,
"step": 590,
"valid_targets_mean": 3358.4,
"valid_targets_min": 648
},
{
"epoch": 0.9444444444444444,
"grad_norm": 0.6835718384960962,
"learning_rate": 3.9853516214924416e-05,
"loss": 0.3721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13478732109069824,
"step": 595,
"valid_targets_mean": 2055.1,
"valid_targets_min": 1013
},
{
"epoch": 0.9523809523809523,
"grad_norm": 0.6959839449645118,
"learning_rate": 3.9843798356991096e-05,
"loss": 0.3685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.176021009683609,
"step": 600,
"valid_targets_mean": 3608.4,
"valid_targets_min": 1354
},
{
"epoch": 0.9603174603174603,
"grad_norm": 0.6388041844606942,
"learning_rate": 3.9833769684183104e-05,
"loss": 0.354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1868162751197815,
"step": 605,
"valid_targets_mean": 4381.1,
"valid_targets_min": 1644
},
{
"epoch": 0.9682539682539683,
"grad_norm": 0.589355661451599,
"learning_rate": 3.982343035358026e-05,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1337076723575592,
"step": 610,
"valid_targets_mean": 4026.0,
"valid_targets_min": 1246
},
{
"epoch": 0.9761904761904762,
"grad_norm": 0.7138102765349207,
"learning_rate": 3.981278052712827e-05,
"loss": 0.3765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21860548853874207,
"step": 615,
"valid_targets_mean": 3400.8,
"valid_targets_min": 1221
},
{
"epoch": 0.9841269841269841,
"grad_norm": 0.7189437980532786,
"learning_rate": 3.9801820371636157e-05,
"loss": 0.3613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14498873054981232,
"step": 620,
"valid_targets_mean": 2650.0,
"valid_targets_min": 948
},
{
"epoch": 0.9920634920634921,
"grad_norm": 0.7615356151418823,
"learning_rate": 3.979055005877364e-05,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15953488647937775,
"step": 625,
"valid_targets_mean": 2240.5,
"valid_targets_min": 663
},
{
"epoch": 1.0,
"grad_norm": 0.6621991671174888,
"learning_rate": 3.977896976506845e-05,
"loss": 0.3623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1603941172361374,
"step": 630,
"valid_targets_mean": 3363.9,
"valid_targets_min": 1638
},
{
"epoch": 1.007936507936508,
"grad_norm": 0.6550331659262137,
"learning_rate": 3.976707967190358e-05,
"loss": 0.3327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17896458506584167,
"step": 635,
"valid_targets_mean": 4749.9,
"valid_targets_min": 1178
},
{
"epoch": 1.0158730158730158,
"grad_norm": 1.4617398692123404,
"learning_rate": 3.9754879965514456e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17083466053009033,
"step": 640,
"valid_targets_mean": 2990.1,
"valid_targets_min": 1347
},
{
"epoch": 1.0238095238095237,
"grad_norm": 0.6853201850501975,
"learning_rate": 3.9742370836985956e-05,
"loss": 0.3462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18801261484622955,
"step": 645,
"valid_targets_mean": 3202.0,
"valid_targets_min": 1392
},
{
"epoch": 1.0317460317460316,
"grad_norm": 0.7335116899022144,
"learning_rate": 3.972955248224949e-05,
"loss": 0.3272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14001566171646118,
"step": 650,
"valid_targets_mean": 2526.6,
"valid_targets_min": 879
},
{
"epoch": 1.0396825396825398,
"grad_norm": 0.7803286501692405,
"learning_rate": 3.971642510207989e-05,
"loss": 0.3406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11908479779958725,
"step": 655,
"valid_targets_mean": 2010.4,
"valid_targets_min": 834
},
{
"epoch": 1.0476190476190477,
"grad_norm": 0.669641003705267,
"learning_rate": 3.9702988902092274e-05,
"loss": 0.3404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1486767828464508,
"step": 660,
"valid_targets_mean": 3876.1,
"valid_targets_min": 1169
},
{
"epoch": 1.0555555555555556,
"grad_norm": 0.7374591920294192,
"learning_rate": 3.968924409273884e-05,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1979072391986847,
"step": 665,
"valid_targets_mean": 3748.1,
"valid_targets_min": 806
},
{
"epoch": 1.0634920634920635,
"grad_norm": 0.7083687479977528,
"learning_rate": 3.9675190889305545e-05,
"loss": 0.3417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19211263954639435,
"step": 670,
"valid_targets_mean": 4064.2,
"valid_targets_min": 1686
},
{
"epoch": 1.0714285714285714,
"grad_norm": 0.8099558494020401,
"learning_rate": 3.966082951190874e-05,
"loss": 0.3503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15523111820220947,
"step": 675,
"valid_targets_mean": 2294.0,
"valid_targets_min": 1479
},
{
"epoch": 1.0793650793650793,
"grad_norm": 0.8193510612362526,
"learning_rate": 3.9646160185491756e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16692380607128143,
"step": 680,
"valid_targets_mean": 2352.2,
"valid_targets_min": 1492
},
{
"epoch": 1.0873015873015872,
"grad_norm": 0.6631812506670042,
"learning_rate": 3.963118313982131e-05,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16724464297294617,
"step": 685,
"valid_targets_mean": 3532.9,
"valid_targets_min": 1559
},
{
"epoch": 1.0952380952380953,
"grad_norm": 0.6330184363082058,
"learning_rate": 3.961589860948399e-05,
"loss": 0.3341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13762444257736206,
"step": 690,
"valid_targets_mean": 3628.2,
"valid_targets_min": 1599
},
{
"epoch": 1.1031746031746033,
"grad_norm": 0.7395137202968401,
"learning_rate": 3.960030683388251e-05,
"loss": 0.3298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1789383590221405,
"step": 695,
"valid_targets_mean": 2894.2,
"valid_targets_min": 659
},
{
"epoch": 1.1111111111111112,
"grad_norm": 0.7567445910162289,
"learning_rate": 3.9584408057232e-05,
"loss": 0.3277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13180208206176758,
"step": 700,
"valid_targets_mean": 2321.5,
"valid_targets_min": 1053
},
{
"epoch": 1.119047619047619,
"grad_norm": 0.7029746538069985,
"learning_rate": 3.956820252855618e-05,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23373830318450928,
"step": 705,
"valid_targets_mean": 3848.2,
"valid_targets_min": 698
},
{
"epoch": 1.126984126984127,
"grad_norm": 0.8217697460107479,
"learning_rate": 3.955169050168343e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11867678910493851,
"step": 710,
"valid_targets_mean": 1995.0,
"valid_targets_min": 700
},
{
"epoch": 1.1349206349206349,
"grad_norm": 0.6237928838837601,
"learning_rate": 3.953487223524283e-05,
"loss": 0.3413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20738816261291504,
"step": 715,
"valid_targets_mean": 4893.6,
"valid_targets_min": 791
},
{
"epoch": 1.1428571428571428,
"grad_norm": 0.6340353953231894,
"learning_rate": 3.951774799266014e-05,
"loss": 0.3248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17009267210960388,
"step": 720,
"valid_targets_mean": 3876.5,
"valid_targets_min": 836
},
{
"epoch": 1.1507936507936507,
"grad_norm": 0.7509419852778023,
"learning_rate": 3.950031804215364e-05,
"loss": 0.3542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22996996343135834,
"step": 725,
"valid_targets_mean": 4188.8,
"valid_targets_min": 1473
},
{
"epoch": 1.1587301587301586,
"grad_norm": 0.6070513438056959,
"learning_rate": 3.948258265672991e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12374967336654663,
"step": 730,
"valid_targets_mean": 3161.9,
"valid_targets_min": 715
},
{
"epoch": 1.1666666666666667,
"grad_norm": 0.8005848521113644,
"learning_rate": 3.946454211417961e-05,
"loss": 0.34,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19525708258152008,
"step": 735,
"valid_targets_mean": 2452.2,
"valid_targets_min": 851
},
{
"epoch": 1.1746031746031746,
"grad_norm": 0.7223216527088103,
"learning_rate": 3.944619669707309e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19071514904499054,
"step": 740,
"valid_targets_mean": 2636.9,
"valid_targets_min": 1016
},
{
"epoch": 1.1825396825396826,
"grad_norm": 0.769530384992589,
"learning_rate": 3.9427546692755946e-05,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15291930735111237,
"step": 745,
"valid_targets_mean": 1790.5,
"valid_targets_min": 680
},
{
"epoch": 1.1904761904761905,
"grad_norm": 0.8609161127919669,
"learning_rate": 3.9408592393344596e-05,
"loss": 0.3333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18366797268390656,
"step": 750,
"valid_targets_mean": 2313.8,
"valid_targets_min": 888
},
{
"epoch": 1.1984126984126984,
"grad_norm": 0.7460458484078427,
"learning_rate": 3.9389334095721606e-05,
"loss": 0.3435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18691663444042206,
"step": 755,
"valid_targets_mean": 2993.1,
"valid_targets_min": 1669
},
{
"epoch": 1.2063492063492063,
"grad_norm": 0.6569460078100842,
"learning_rate": 3.936977210153113e-05,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1891995668411255,
"step": 760,
"valid_targets_mean": 4634.4,
"valid_targets_min": 1431
},
{
"epoch": 1.2142857142857142,
"grad_norm": 0.8065057390599204,
"learning_rate": 3.93499067171741e-05,
"loss": 0.321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16406933963298798,
"step": 765,
"valid_targets_mean": 2047.8,
"valid_targets_min": 611
},
{
"epoch": 1.2222222222222223,
"grad_norm": 0.6735826463574247,
"learning_rate": 3.932973825380351e-05,
"loss": 0.3341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1321011185646057,
"step": 770,
"valid_targets_mean": 3697.6,
"valid_targets_min": 1243
},
{
"epoch": 1.2301587301587302,
"grad_norm": 0.6532987965485518,
"learning_rate": 3.9309267027319485e-05,
"loss": 0.3284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20019066333770752,
"step": 775,
"valid_targets_mean": 5117.1,
"valid_targets_min": 923
},
{
"epoch": 1.2380952380952381,
"grad_norm": 0.6721008291547677,
"learning_rate": 3.928849335836435e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16830293834209442,
"step": 780,
"valid_targets_mean": 3834.2,
"valid_targets_min": 707
},
{
"epoch": 1.246031746031746,
"grad_norm": 0.672719770061112,
"learning_rate": 3.926741757231761e-05,
"loss": 0.3179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14843882620334625,
"step": 785,
"valid_targets_mean": 2557.2,
"valid_targets_min": 1395
},
{
"epoch": 1.253968253968254,
"grad_norm": 0.6540553828853359,
"learning_rate": 3.924603999929086e-05,
"loss": 0.3359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2036338448524475,
"step": 790,
"valid_targets_mean": 4443.6,
"valid_targets_min": 905
},
{
"epoch": 1.2619047619047619,
"grad_norm": 0.6995738559163635,
"learning_rate": 3.9224360974122584e-05,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15793496370315552,
"step": 795,
"valid_targets_mean": 2658.4,
"valid_targets_min": 682
},
{
"epoch": 1.2698412698412698,
"grad_norm": 0.6963704328628288,
"learning_rate": 3.920238083637297e-05,
"loss": 0.322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15149086713790894,
"step": 800,
"valid_targets_mean": 2722.5,
"valid_targets_min": 848
},
{
"epoch": 1.2777777777777777,
"grad_norm": 0.5568936443457445,
"learning_rate": 3.9180099930318524e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1571732759475708,
"step": 805,
"valid_targets_mean": 4953.6,
"valid_targets_min": 782
},
{
"epoch": 1.2857142857142856,
"grad_norm": 0.7021372758165298,
"learning_rate": 3.915751860494672e-05,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1892794370651245,
"step": 810,
"valid_targets_mean": 3306.2,
"valid_targets_min": 993
},
{
"epoch": 1.2936507936507937,
"grad_norm": 0.7165579981094458,
"learning_rate": 3.913463721395051e-05,
"loss": 0.3397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1962992250919342,
"step": 815,
"valid_targets_mean": 3322.0,
"valid_targets_min": 1297
},
{
"epoch": 1.3015873015873016,
"grad_norm": 0.6672225363936888,
"learning_rate": 3.911145611572282e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13479071855545044,
"step": 820,
"valid_targets_mean": 2435.1,
"valid_targets_min": 971
},
{
"epoch": 1.3095238095238095,
"grad_norm": 0.6373647212783545,
"learning_rate": 3.908797567335089e-05,
"loss": 0.3476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14948585629463196,
"step": 825,
"valid_targets_mean": 2808.1,
"valid_targets_min": 907
},
{
"epoch": 1.3174603174603174,
"grad_norm": 1.153607480771756,
"learning_rate": 3.906419625461062e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14141523838043213,
"step": 830,
"valid_targets_mean": 1876.9,
"valid_targets_min": 900
},
{
"epoch": 1.3253968253968254,
"grad_norm": 0.6466191823091932,
"learning_rate": 3.90401182319608e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16680654883384705,
"step": 835,
"valid_targets_mean": 3402.9,
"valid_targets_min": 1345
},
{
"epoch": 1.3333333333333333,
"grad_norm": 0.762601991381067,
"learning_rate": 3.9015741982537265e-05,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18606701493263245,
"step": 840,
"valid_targets_mean": 3056.8,
"valid_targets_min": 957
},
{
"epoch": 1.3412698412698414,
"grad_norm": 0.5962344088673996,
"learning_rate": 3.899106788814701e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1680346578359604,
"step": 845,
"valid_targets_mean": 3557.2,
"valid_targets_min": 1508
},
{
"epoch": 1.3492063492063493,
"grad_norm": 0.6079281739641783,
"learning_rate": 3.896609633526219e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18283489346504211,
"step": 850,
"valid_targets_mean": 4741.0,
"valid_targets_min": 2597
},
{
"epoch": 1.3571428571428572,
"grad_norm": 0.6433520532374093,
"learning_rate": 3.894082771501407e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.224579855799675,
"step": 855,
"valid_targets_mean": 5688.9,
"valid_targets_min": 2441
},
{
"epoch": 1.3650793650793651,
"grad_norm": 0.6236488281351981,
"learning_rate": 3.891526242318692e-05,
"loss": 0.3213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12770557403564453,
"step": 860,
"valid_targets_mean": 2938.4,
"valid_targets_min": 1391
},
{
"epoch": 1.373015873015873,
"grad_norm": 0.6758191068090547,
"learning_rate": 3.8889400860211785e-05,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1711861491203308,
"step": 865,
"valid_targets_mean": 4322.4,
"valid_targets_min": 1282
},
{
"epoch": 1.380952380952381,
"grad_norm": 0.7829861176740196,
"learning_rate": 3.886324343116023e-05,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14786922931671143,
"step": 870,
"valid_targets_mean": 2398.6,
"valid_targets_min": 1527
},
{
"epoch": 1.3888888888888888,
"grad_norm": 0.6137417239069314,
"learning_rate": 3.883679054573799e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12261499464511871,
"step": 875,
"valid_targets_mean": 3248.4,
"valid_targets_min": 1341
},
{
"epoch": 1.3968253968253967,
"grad_norm": 0.7275067900304849,
"learning_rate": 3.881004261827856e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13986937701702118,
"step": 880,
"valid_targets_mean": 2470.4,
"valid_targets_min": 939
},
{
"epoch": 1.4047619047619047,
"grad_norm": 0.573567853532649,
"learning_rate": 3.878300006773669e-05,
"loss": 0.3188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11593329906463623,
"step": 885,
"valid_targets_mean": 3373.0,
"valid_targets_min": 1433
},
{
"epoch": 1.4126984126984126,
"grad_norm": 0.6421889204633251,
"learning_rate": 3.875566331768184e-05,
"loss": 0.327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16899876296520233,
"step": 890,
"valid_targets_mean": 3735.2,
"valid_targets_min": 1422
},
{
"epoch": 1.4206349206349207,
"grad_norm": 0.636113488826798,
"learning_rate": 3.872803279629155e-05,
"loss": 0.3247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18453936278820038,
"step": 895,
"valid_targets_mean": 4604.8,
"valid_targets_min": 1210
},
{
"epoch": 1.4285714285714286,
"grad_norm": 0.8348881833927589,
"learning_rate": 3.8700108936344705e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15507002174854279,
"step": 900,
"valid_targets_mean": 4224.5,
"valid_targets_min": 1205
},
{
"epoch": 1.4365079365079365,
"grad_norm": 0.6263889168583548,
"learning_rate": 3.867189217521477e-05,
"loss": 0.329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17729918658733368,
"step": 905,
"valid_targets_mean": 4577.2,
"valid_targets_min": 1831
},
{
"epoch": 1.4444444444444444,
"grad_norm": 0.6333671939834843,
"learning_rate": 3.864338295486297e-05,
"loss": 0.3216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.230592280626297,
"step": 910,
"valid_targets_mean": 4192.1,
"valid_targets_min": 1671
},
{
"epoch": 1.4523809523809523,
"grad_norm": 0.7922900343139502,
"learning_rate": 3.8614581721831316e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1534234583377838,
"step": 915,
"valid_targets_mean": 2057.8,
"valid_targets_min": 938
},
{
"epoch": 1.4603174603174602,
"grad_norm": 0.6383017464464749,
"learning_rate": 3.858548892723563e-05,
"loss": 0.3535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13009271025657654,
"step": 920,
"valid_targets_mean": 3326.5,
"valid_targets_min": 1077
},
{
"epoch": 1.4682539682539684,
"grad_norm": 0.651551125180835,
"learning_rate": 3.855610502675851e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22951310873031616,
"step": 925,
"valid_targets_mean": 4700.6,
"valid_targets_min": 1678
},
{
"epoch": 1.4761904761904763,
"grad_norm": 0.6753131034311983,
"learning_rate": 3.852643048064215e-05,
"loss": 0.3219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15419398248195648,
"step": 930,
"valid_targets_mean": 3162.8,
"valid_targets_min": 1095
},
{
"epoch": 1.4841269841269842,
"grad_norm": 0.6537814645059444,
"learning_rate": 3.8496465753681145e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15850700438022614,
"step": 935,
"valid_targets_mean": 3159.0,
"valid_targets_min": 1387
},
{
"epoch": 1.492063492063492,
"grad_norm": 0.6873845352603423,
"learning_rate": 3.846621131521522e-05,
"loss": 0.3314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22871655225753784,
"step": 940,
"valid_targets_mean": 3588.6,
"valid_targets_min": 859
},
{
"epoch": 1.5,
"grad_norm": 0.5815861421834687,
"learning_rate": 3.843566763912187e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1536579430103302,
"step": 945,
"valid_targets_mean": 4438.8,
"valid_targets_min": 1272
},
{
"epoch": 1.507936507936508,
"grad_norm": 0.6185343070978655,
"learning_rate": 3.840483520380896e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11785129457712173,
"step": 950,
"valid_targets_mean": 3136.1,
"valid_targets_min": 1054
},
{
"epoch": 1.5158730158730158,
"grad_norm": 0.7109509570702359,
"learning_rate": 3.837371449220717e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18690654635429382,
"step": 955,
"valid_targets_mean": 3742.0,
"valid_targets_min": 1121
},
{
"epoch": 1.5238095238095237,
"grad_norm": 0.7752023546341235,
"learning_rate": 3.834230599176251e-05,
"loss": 0.3319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1134377121925354,
"step": 960,
"valid_targets_mean": 1666.9,
"valid_targets_min": 567
},
{
"epoch": 1.5317460317460316,
"grad_norm": 0.642223551798259,
"learning_rate": 3.831061019442864e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1406305432319641,
"step": 965,
"valid_targets_mean": 3459.5,
"valid_targets_min": 944
},
{
"epoch": 1.5396825396825395,
"grad_norm": 0.7389463906485425,
"learning_rate": 3.827862759665916e-05,
"loss": 0.3307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17435957491397858,
"step": 970,
"valid_targets_mean": 2838.5,
"valid_targets_min": 752
},
{
"epoch": 1.5476190476190477,
"grad_norm": 0.9324752016602136,
"learning_rate": 3.8246358699399853e-05,
"loss": 0.327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16448692977428436,
"step": 975,
"valid_targets_mean": 2016.4,
"valid_targets_min": 1003
},
{
"epoch": 1.5555555555555556,
"grad_norm": 0.7164291842449987,
"learning_rate": 3.8213804008080824e-05,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21906238794326782,
"step": 980,
"valid_targets_mean": 4072.2,
"valid_targets_min": 1473
},
{
"epoch": 1.5634920634920635,
"grad_norm": 0.6920532471489735,
"learning_rate": 3.818096403260862e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18423213064670563,
"step": 985,
"valid_targets_mean": 3113.2,
"valid_targets_min": 636
},
{
"epoch": 1.5714285714285714,
"grad_norm": 0.5959713542415751,
"learning_rate": 3.8147839287358185e-05,
"loss": 0.3235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15230652689933777,
"step": 990,
"valid_targets_mean": 3757.6,
"valid_targets_min": 1066
},
{
"epoch": 1.5793650793650795,
"grad_norm": 0.823279374199861,
"learning_rate": 3.8114430291164836e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13656845688819885,
"step": 995,
"valid_targets_mean": 1662.8,
"valid_targets_min": 875
},
{
"epoch": 1.5873015873015874,
"grad_norm": 0.6873357420736661,
"learning_rate": 3.808073756731615e-05,
"loss": 0.318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15334893763065338,
"step": 1000,
"valid_targets_mean": 3311.2,
"valid_targets_min": 1291
},
{
"epoch": 1.5952380952380953,
"grad_norm": 0.6484825809948287,
"learning_rate": 3.8046761643543734e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1463339626789093,
"step": 1005,
"valid_targets_mean": 4150.1,
"valid_targets_min": 1798
},
{
"epoch": 1.6031746031746033,
"grad_norm": 0.6817054528039794,
"learning_rate": 3.8012503052014996e-05,
"loss": 0.3656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17801718413829803,
"step": 1010,
"valid_targets_mean": 3748.4,
"valid_targets_min": 1955
},
{
"epoch": 1.6111111111111112,
"grad_norm": 0.7872906055674049,
"learning_rate": 3.797796232932476e-05,
"loss": 0.3287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1268722265958786,
"step": 1015,
"valid_targets_mean": 2023.8,
"valid_targets_min": 1156
},
{
"epoch": 1.619047619047619,
"grad_norm": 0.651529600042665,
"learning_rate": 3.794314001648692e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14170636236667633,
"step": 1020,
"valid_targets_mean": 2843.0,
"valid_targets_min": 922
},
{
"epoch": 1.626984126984127,
"grad_norm": 0.6171435300769704,
"learning_rate": 3.7908036658925926e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16796676814556122,
"step": 1025,
"valid_targets_mean": 2937.6,
"valid_targets_min": 750
},
{
"epoch": 1.6349206349206349,
"grad_norm": 0.7476071653963485,
"learning_rate": 3.787265280646825e-05,
"loss": 0.3161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16783180832862854,
"step": 1030,
"valid_targets_mean": 2927.6,
"valid_targets_min": 726
},
{
"epoch": 1.6428571428571428,
"grad_norm": 0.6644484494281356,
"learning_rate": 3.7836989013333776e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13871848583221436,
"step": 1035,
"valid_targets_mean": 3492.8,
"valid_targets_min": 1748
},
{
"epoch": 1.6507936507936507,
"grad_norm": 0.5725806618836755,
"learning_rate": 3.780104583812712e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16656331717967987,
"step": 1040,
"valid_targets_mean": 4105.2,
"valid_targets_min": 908
},
{
"epoch": 1.6587301587301586,
"grad_norm": 0.7354883976199714,
"learning_rate": 3.7764823843828883e-05,
"loss": 0.3321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18832966685295105,
"step": 1045,
"valid_targets_mean": 3323.4,
"valid_targets_min": 1571
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.6548011282202095,
"learning_rate": 3.7728323597786834e-05,
"loss": 0.3087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11662226915359497,
"step": 1050,
"valid_targets_mean": 2727.0,
"valid_targets_min": 1221
},
{
"epoch": 1.6746031746031746,
"grad_norm": 0.7662281834478178,
"learning_rate": 3.7691545671707007e-05,
"loss": 0.3448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16389185190200806,
"step": 1055,
"valid_targets_mean": 2433.9,
"valid_targets_min": 1068
},
{
"epoch": 1.6825396825396826,
"grad_norm": 0.6191057387381401,
"learning_rate": 3.765449064164477e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09424316883087158,
"step": 1060,
"valid_targets_mean": 2522.8,
"valid_targets_min": 1517
},
{
"epoch": 1.6904761904761905,
"grad_norm": 0.7089163950388633,
"learning_rate": 3.7617159087995784e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16477319598197937,
"step": 1065,
"valid_targets_mean": 4247.1,
"valid_targets_min": 808
},
{
"epoch": 1.6984126984126984,
"grad_norm": 0.7336010684393983,
"learning_rate": 3.757955159548693e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1567060947418213,
"step": 1070,
"valid_targets_mean": 2002.9,
"valid_targets_min": 819
},
{
"epoch": 1.7063492063492065,
"grad_norm": 0.5551974094945166,
"learning_rate": 3.754166875316713e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18975624442100525,
"step": 1075,
"valid_targets_mean": 5140.1,
"valid_targets_min": 1990
},
{
"epoch": 1.7142857142857144,
"grad_norm": 0.7790486862381991,
"learning_rate": 3.750351115439812e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16643652319908142,
"step": 1080,
"valid_targets_mean": 3622.6,
"valid_targets_min": 1729
},
{
"epoch": 1.7222222222222223,
"grad_norm": 0.6895583697751339,
"learning_rate": 3.746507939684519e-05,
"loss": 0.3126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1543181836605072,
"step": 1085,
"valid_targets_mean": 2840.0,
"valid_targets_min": 1084
},
{
"epoch": 1.7301587301587302,
"grad_norm": 0.6649886180118483,
"learning_rate": 3.742637408246779e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20172613859176636,
"step": 1090,
"valid_targets_mean": 4078.4,
"valid_targets_min": 702
},
{
"epoch": 1.7380952380952381,
"grad_norm": 0.6986475804737025,
"learning_rate": 3.73873958175101e-05,
"loss": 0.3242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1479484736919403,
"step": 1095,
"valid_targets_mean": 3294.2,
"valid_targets_min": 671
},
{
"epoch": 1.746031746031746,
"grad_norm": 0.7108510865696669,
"learning_rate": 3.734814521249156e-05,
"loss": 0.3307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1519460678100586,
"step": 1100,
"valid_targets_mean": 3030.0,
"valid_targets_min": 1151
},
{
"epoch": 1.753968253968254,
"grad_norm": 0.780130184905361,
"learning_rate": 3.7308622882197294e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11438941955566406,
"step": 1105,
"valid_targets_mean": 2342.4,
"valid_targets_min": 968
},
{
"epoch": 1.7619047619047619,
"grad_norm": 0.6919296705990884,
"learning_rate": 3.7268829445668456e-05,
"loss": 0.3304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1509092152118683,
"step": 1110,
"valid_targets_mean": 2715.0,
"valid_targets_min": 1656
},
{
"epoch": 1.7698412698412698,
"grad_norm": 0.7095337197458086,
"learning_rate": 3.722876552619257e-05,
"loss": 0.3329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1642485111951828,
"step": 1115,
"valid_targets_mean": 3003.0,
"valid_targets_min": 1832
},
{
"epoch": 1.7777777777777777,
"grad_norm": 0.6623605599103729,
"learning_rate": 3.718843175129378e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1656493842601776,
"step": 1120,
"valid_targets_mean": 3344.5,
"valid_targets_min": 1639
},
{
"epoch": 1.7857142857142856,
"grad_norm": 0.6509353975185467,
"learning_rate": 3.7147828752722944e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16948366165161133,
"step": 1125,
"valid_targets_mean": 3909.0,
"valid_targets_min": 2076
},
{
"epoch": 1.7936507936507935,
"grad_norm": 0.7055857265594317,
"learning_rate": 3.7106957166447834e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.182726189494133,
"step": 1130,
"valid_targets_mean": 3147.1,
"valid_targets_min": 719
},
{
"epoch": 1.8015873015873016,
"grad_norm": 0.5821370256541043,
"learning_rate": 3.7065817632643115e-05,
"loss": 0.3083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20441317558288574,
"step": 1135,
"valid_targets_mean": 6269.5,
"valid_targets_min": 2700
},
{
"epoch": 1.8095238095238095,
"grad_norm": 0.6271222096362784,
"learning_rate": 3.7024410795680326e-05,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14290623366832733,
"step": 1140,
"valid_targets_mean": 3049.8,
"valid_targets_min": 671
},
{
"epoch": 1.8174603174603174,
"grad_norm": 0.5742957360318593,
"learning_rate": 3.698273730411782e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1737782061100006,
"step": 1145,
"valid_targets_mean": 4881.1,
"valid_targets_min": 1050
},
{
"epoch": 1.8253968253968254,
"grad_norm": 0.7237896853510777,
"learning_rate": 3.694079781069053e-05,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1605367660522461,
"step": 1150,
"valid_targets_mean": 2798.1,
"valid_targets_min": 1461
},
{
"epoch": 1.8333333333333335,
"grad_norm": 0.7796561546026146,
"learning_rate": 3.6898592972299875e-05,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14959201216697693,
"step": 1155,
"valid_targets_mean": 2855.1,
"valid_targets_min": 1206
},
{
"epoch": 1.8412698412698414,
"grad_norm": 0.7814814222422569,
"learning_rate": 3.6856123450003306e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18412166833877563,
"step": 1160,
"valid_targets_mean": 3015.8,
"valid_targets_min": 994
},
{
"epoch": 1.8492063492063493,
"grad_norm": 0.6571893565564805,
"learning_rate": 3.68133899090041e-05,
"loss": 0.3197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12655168771743774,
"step": 1165,
"valid_targets_mean": 2925.4,
"valid_targets_min": 1490
},
{
"epoch": 1.8571428571428572,
"grad_norm": 0.5625971515672297,
"learning_rate": 3.677039301864085e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15519466996192932,
"step": 1170,
"valid_targets_mean": 3959.8,
"valid_targets_min": 978
},
{
"epoch": 1.8650793650793651,
"grad_norm": 0.7022395536958516,
"learning_rate": 3.672713345237701e-05,
"loss": 0.3228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12823298573493958,
"step": 1175,
"valid_targets_mean": 2513.6,
"valid_targets_min": 1325
},
{
"epoch": 1.873015873015873,
"grad_norm": 0.7382776756172028,
"learning_rate": 3.6683611887790356e-05,
"loss": 0.3195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2348577082157135,
"step": 1180,
"valid_targets_mean": 3610.5,
"valid_targets_min": 1258
},
{
"epoch": 1.880952380952381,
"grad_norm": 0.6379811831724779,
"learning_rate": 3.663982900656236e-05,
"loss": 0.3279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1788225919008255,
"step": 1185,
"valid_targets_mean": 3843.0,
"valid_targets_min": 1043
},
{
"epoch": 1.8888888888888888,
"grad_norm": 0.6677114190374929,
"learning_rate": 3.6595785494467516e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1895446628332138,
"step": 1190,
"valid_targets_mean": 4057.9,
"valid_targets_min": 493
},
{
"epoch": 1.8968253968253967,
"grad_norm": 0.554324996485495,
"learning_rate": 3.655148204136259e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1370246708393097,
"step": 1195,
"valid_targets_mean": 4461.0,
"valid_targets_min": 1147
},
{
"epoch": 1.9047619047619047,
"grad_norm": 0.5714890741512307,
"learning_rate": 3.650691934117584e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1589963287115097,
"step": 1200,
"valid_targets_mean": 4565.9,
"valid_targets_min": 1407
},
{
"epoch": 1.9126984126984126,
"grad_norm": 0.7448282050971057,
"learning_rate": 3.646209809189611e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20559057593345642,
"step": 1205,
"valid_targets_mean": 3693.9,
"valid_targets_min": 1229
},
{
"epoch": 1.9206349206349205,
"grad_norm": 0.6320209854193637,
"learning_rate": 3.641701899556192e-05,
"loss": 0.3229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24096056818962097,
"step": 1210,
"valid_targets_mean": 5899.9,
"valid_targets_min": 1722
},
{
"epoch": 1.9285714285714286,
"grad_norm": 0.5359385368169469,
"learning_rate": 3.63716827582505e-05,
"loss": 0.295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11727620661258698,
"step": 1215,
"valid_targets_mean": 2772.8,
"valid_targets_min": 1515
},
{
"epoch": 1.9365079365079365,
"grad_norm": 0.643091990151274,
"learning_rate": 3.632609009006665e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13127782940864563,
"step": 1220,
"valid_targets_mean": 3445.0,
"valid_targets_min": 1638
},
{
"epoch": 1.9444444444444444,
"grad_norm": 0.7242904191833993,
"learning_rate": 3.62802417051317e-05,
"loss": 0.3301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19884291291236877,
"step": 1225,
"valid_targets_mean": 3024.6,
"valid_targets_min": 1055
},
{
"epoch": 1.9523809523809523,
"grad_norm": 0.7142658889462979,
"learning_rate": 3.6234138321572274e-05,
"loss": 0.3239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16410435736179352,
"step": 1230,
"valid_targets_mean": 2792.0,
"valid_targets_min": 1235
},
{
"epoch": 1.9603174603174605,
"grad_norm": 0.7622407534270608,
"learning_rate": 3.6187780661509074e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13600055873394012,
"step": 1235,
"valid_targets_mean": 2606.2,
"valid_targets_min": 1292
},
{
"epoch": 1.9682539682539684,
"grad_norm": 2.0519892124143264,
"learning_rate": 3.6141169451045526e-05,
"loss": 0.3312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22042493522167206,
"step": 1240,
"valid_targets_mean": 3888.2,
"valid_targets_min": 1648
},
{
"epoch": 1.9761904761904763,
"grad_norm": 0.661985430252956,
"learning_rate": 3.609430542025646e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17805568873882294,
"step": 1245,
"valid_targets_mean": 3606.0,
"valid_targets_min": 463
},
{
"epoch": 1.9841269841269842,
"grad_norm": 0.6677192065899155,
"learning_rate": 3.604718930317664e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11548539996147156,
"step": 1250,
"valid_targets_mean": 2009.4,
"valid_targets_min": 966
},
{
"epoch": 1.992063492063492,
"grad_norm": 0.6535363195362384,
"learning_rate": 3.5999821837789275e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13011835515499115,
"step": 1255,
"valid_targets_mean": 3151.8,
"valid_targets_min": 905
},
{
"epoch": 2.0,
"grad_norm": 0.6667531440533361,
"learning_rate": 3.595220376601447e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19327494502067566,
"step": 1260,
"valid_targets_mean": 3476.6,
"valid_targets_min": 628
},
{
"epoch": 2.007936507936508,
"grad_norm": 0.6583520262553467,
"learning_rate": 3.590433583369758e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11713065207004547,
"step": 1265,
"valid_targets_mean": 3390.6,
"valid_targets_min": 319
},
{
"epoch": 2.015873015873016,
"grad_norm": 0.6184665053818716,
"learning_rate": 3.5856218790597554e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1123209297657013,
"step": 1270,
"valid_targets_mean": 3809.2,
"valid_targets_min": 1431
},
{
"epoch": 2.0238095238095237,
"grad_norm": 0.7493002816181802,
"learning_rate": 3.580785339037519e-05,
"loss": 0.2729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16529607772827148,
"step": 1275,
"valid_targets_mean": 3118.0,
"valid_targets_min": 1336
},
{
"epoch": 2.0317460317460316,
"grad_norm": 0.7741262247536087,
"learning_rate": 3.57592403905813e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12097487598657608,
"step": 1280,
"valid_targets_mean": 2530.2,
"valid_targets_min": 798
},
{
"epoch": 2.0396825396825395,
"grad_norm": 0.6230151198360837,
"learning_rate": 3.571038055264489e-05,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14992347359657288,
"step": 1285,
"valid_targets_mean": 5069.0,
"valid_targets_min": 2124
},
{
"epoch": 2.0476190476190474,
"grad_norm": 0.810562148405268,
"learning_rate": 3.566127464186119e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21131475269794464,
"step": 1290,
"valid_targets_mean": 3328.2,
"valid_targets_min": 538
},
{
"epoch": 2.0555555555555554,
"grad_norm": 0.5476942649122561,
"learning_rate": 3.56119234273797e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13968425989151,
"step": 1295,
"valid_targets_mean": 5129.4,
"valid_targets_min": 1461
},
{
"epoch": 2.0634920634920633,
"grad_norm": 0.5657998227607735,
"learning_rate": 3.5562327682192134e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20042595267295837,
"step": 1300,
"valid_targets_mean": 5548.2,
"valid_targets_min": 1233
},
{
"epoch": 2.0714285714285716,
"grad_norm": 0.6072758802013452,
"learning_rate": 3.5512488183120286e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1297391653060913,
"step": 1305,
"valid_targets_mean": 3396.8,
"valid_targets_min": 1489
},
{
"epoch": 2.0793650793650795,
"grad_norm": 0.6816298909752555,
"learning_rate": 3.54624057108039e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14064955711364746,
"step": 1310,
"valid_targets_mean": 3406.9,
"valid_targets_min": 961
},
{
"epoch": 2.0873015873015874,
"grad_norm": 0.6703325281786866,
"learning_rate": 3.5412081049688444e-05,
"loss": 0.2794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1433454304933548,
"step": 1315,
"valid_targets_mean": 3164.2,
"valid_targets_min": 1504
},
{
"epoch": 2.0952380952380953,
"grad_norm": 0.6835358753375542,
"learning_rate": 3.5361514988012774e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09970133751630783,
"step": 1320,
"valid_targets_mean": 2335.0,
"valid_targets_min": 674
},
{
"epoch": 2.1031746031746033,
"grad_norm": 0.6326834094504827,
"learning_rate": 3.5310708317796844e-05,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1121712401509285,
"step": 1325,
"valid_targets_mean": 2643.4,
"valid_targets_min": 1202
},
{
"epoch": 2.111111111111111,
"grad_norm": 3.950868272026065,
"learning_rate": 3.5259661834829266e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14811912178993225,
"step": 1330,
"valid_targets_mean": 3642.4,
"valid_targets_min": 1865
},
{
"epoch": 2.119047619047619,
"grad_norm": 0.6816657238059641,
"learning_rate": 3.5208376338654866e-05,
"loss": 0.2839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1544703096151352,
"step": 1335,
"valid_targets_mean": 3581.6,
"valid_targets_min": 791
},
{
"epoch": 2.126984126984127,
"grad_norm": 0.6047101996393489,
"learning_rate": 3.515685263256214e-05,
"loss": 0.2924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12545567750930786,
"step": 1340,
"valid_targets_mean": 3086.5,
"valid_targets_min": 1125
},
{
"epoch": 2.134920634920635,
"grad_norm": 0.7668214060032036,
"learning_rate": 3.51050915235707e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15387457609176636,
"step": 1345,
"valid_targets_mean": 2922.4,
"valid_targets_min": 1243
},
{
"epoch": 2.142857142857143,
"grad_norm": 0.6341428031092777,
"learning_rate": 3.5053093822418596e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18130765855312347,
"step": 1350,
"valid_targets_mean": 4195.0,
"valid_targets_min": 955
},
{
"epoch": 2.1507936507936507,
"grad_norm": 0.6248047434099063,
"learning_rate": 3.500086034354966e-05,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1647244542837143,
"step": 1355,
"valid_targets_mean": 4345.2,
"valid_targets_min": 1896
},
{
"epoch": 2.1587301587301586,
"grad_norm": 0.6747528154705348,
"learning_rate": 3.494839190510071e-05,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12260128557682037,
"step": 1360,
"valid_targets_mean": 2796.8,
"valid_targets_min": 1616
},
{
"epoch": 2.1666666666666665,
"grad_norm": 0.7118102595286983,
"learning_rate": 3.489568932888877e-05,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16787979006767273,
"step": 1365,
"valid_targets_mean": 2947.5,
"valid_targets_min": 1622
},
{
"epoch": 2.1746031746031744,
"grad_norm": 0.6385054350831572,
"learning_rate": 3.484275344039815e-05,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14596769213676453,
"step": 1370,
"valid_targets_mean": 3821.0,
"valid_targets_min": 1046
},
{
"epoch": 2.1825396825396823,
"grad_norm": 0.7154596844294332,
"learning_rate": 3.478958506876759e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1572347730398178,
"step": 1375,
"valid_targets_mean": 3031.8,
"valid_targets_min": 1016
},
{
"epoch": 2.1904761904761907,
"grad_norm": 0.6664826932154091,
"learning_rate": 3.47361850467772e-05,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14033150672912598,
"step": 1380,
"valid_targets_mean": 3299.4,
"valid_targets_min": 1159
},
{
"epoch": 2.1984126984126986,
"grad_norm": 0.6285119796929689,
"learning_rate": 3.468255421083546e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15819507837295532,
"step": 1385,
"valid_targets_mean": 3849.9,
"valid_targets_min": 974
},
{
"epoch": 2.2063492063492065,
"grad_norm": 0.7275694931249483,
"learning_rate": 3.46286934009661e-05,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13317999243736267,
"step": 1390,
"valid_targets_mean": 2756.9,
"valid_targets_min": 1007
},
{
"epoch": 2.2142857142857144,
"grad_norm": 0.6358951472501403,
"learning_rate": 3.457460346079495e-05,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13068701326847076,
"step": 1395,
"valid_targets_mean": 3634.2,
"valid_targets_min": 1807
},
{
"epoch": 2.2222222222222223,
"grad_norm": 2.0139879928616233,
"learning_rate": 3.452028523753673e-05,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1745387613773346,
"step": 1400,
"valid_targets_mean": 3817.2,
"valid_targets_min": 708
},
{
"epoch": 2.2301587301587302,
"grad_norm": 0.6465986757489767,
"learning_rate": 3.446573958198176e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14092761278152466,
"step": 1405,
"valid_targets_mean": 3375.8,
"valid_targets_min": 776
},
{
"epoch": 2.238095238095238,
"grad_norm": 0.7747629398813702,
"learning_rate": 3.4410967348482666e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10323482751846313,
"step": 1410,
"valid_targets_mean": 1944.0,
"valid_targets_min": 705
},
{
"epoch": 2.246031746031746,
"grad_norm": 0.597350797307689,
"learning_rate": 3.435596939494098e-05,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10818013548851013,
"step": 1415,
"valid_targets_mean": 3180.1,
"valid_targets_min": 1579
},
{
"epoch": 2.253968253968254,
"grad_norm": 0.6699385734099821,
"learning_rate": 3.430074658279369e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1064271479845047,
"step": 1420,
"valid_targets_mean": 2770.2,
"valid_targets_min": 1171
},
{
"epoch": 2.261904761904762,
"grad_norm": 0.75576808503992,
"learning_rate": 3.424529977699977e-05,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14628705382347107,
"step": 1425,
"valid_targets_mean": 2557.9,
"valid_targets_min": 1104
},
{
"epoch": 2.2698412698412698,
"grad_norm": 0.6025560694996105,
"learning_rate": 3.418962984602661e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11078731715679169,
"step": 1430,
"valid_targets_mean": 2991.8,
"valid_targets_min": 858
},
{
"epoch": 2.2777777777777777,
"grad_norm": 0.7739932318724013,
"learning_rate": 3.413373766183646e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12117686867713928,
"step": 1435,
"valid_targets_mean": 1849.1,
"valid_targets_min": 586
},
{
"epoch": 2.2857142857142856,
"grad_norm": 0.6235979138790416,
"learning_rate": 3.40776240998727e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1533014178276062,
"step": 1440,
"valid_targets_mean": 4757.4,
"valid_targets_min": 1467
},
{
"epoch": 2.2936507936507935,
"grad_norm": 0.745768264262844,
"learning_rate": 3.4021290039046184e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1377353072166443,
"step": 1445,
"valid_targets_mean": 2300.9,
"valid_targets_min": 719
},
{
"epoch": 2.3015873015873014,
"grad_norm": 0.6254453190255295,
"learning_rate": 3.396473636172146e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12696042656898499,
"step": 1450,
"valid_targets_mean": 3798.0,
"valid_targets_min": 1759
},
{
"epoch": 2.3095238095238093,
"grad_norm": 0.6457999463573912,
"learning_rate": 3.390796395370294e-05,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14060063660144806,
"step": 1455,
"valid_targets_mean": 3829.0,
"valid_targets_min": 933
},
{
"epoch": 2.317460317460317,
"grad_norm": 0.746423663933539,
"learning_rate": 3.385097370422102e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1291799396276474,
"step": 1460,
"valid_targets_mean": 2310.8,
"valid_targets_min": 1472
},
{
"epoch": 2.3253968253968256,
"grad_norm": 0.6768216692086332,
"learning_rate": 3.3793766505918185e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1252336949110031,
"step": 1465,
"valid_targets_mean": 2343.1,
"valid_targets_min": 959
},
{
"epoch": 2.3333333333333335,
"grad_norm": 0.8554015943268323,
"learning_rate": 3.3736343254834994e-05,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14149311184883118,
"step": 1470,
"valid_targets_mean": 3089.0,
"valid_targets_min": 1826
},
{
"epoch": 2.3412698412698414,
"grad_norm": 0.5699352738058534,
"learning_rate": 3.3678704850396045e-05,
"loss": 0.2713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1736626923084259,
"step": 1475,
"valid_targets_mean": 5070.6,
"valid_targets_min": 1119
},
{
"epoch": 2.3492063492063493,
"grad_norm": 0.678427343004129,
"learning_rate": 3.362085219539592e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17105717957019806,
"step": 1480,
"valid_targets_mean": 3659.2,
"valid_targets_min": 1391
},
{
"epoch": 2.357142857142857,
"grad_norm": 0.6478379778271129,
"learning_rate": 3.3562786195985025e-05,
"loss": 0.289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13324151933193207,
"step": 1485,
"valid_targets_mean": 3253.6,
"valid_targets_min": 356
},
{
"epoch": 2.365079365079365,
"grad_norm": 0.676700032911331,
"learning_rate": 3.350450776165535e-05,
"loss": 0.2684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11475967615842819,
"step": 1490,
"valid_targets_mean": 2737.2,
"valid_targets_min": 1414
},
{
"epoch": 2.373015873015873,
"grad_norm": 0.7360708037445938,
"learning_rate": 3.344601780522634e-05,
"loss": 0.2815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12047970294952393,
"step": 1495,
"valid_targets_mean": 2303.1,
"valid_targets_min": 986
},
{
"epoch": 2.380952380952381,
"grad_norm": 0.7144328682757947,
"learning_rate": 3.3387317242830466e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11342642456293106,
"step": 1500,
"valid_targets_mean": 2235.1,
"valid_targets_min": 1201
},
{
"epoch": 2.388888888888889,
"grad_norm": 0.6778072852737712,
"learning_rate": 3.332840699389897e-05,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11429885029792786,
"step": 1505,
"valid_targets_mean": 4177.8,
"valid_targets_min": 1508
},
{
"epoch": 2.3968253968253967,
"grad_norm": 0.6602113352709741,
"learning_rate": 3.32692879811474e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09258200228214264,
"step": 1510,
"valid_targets_mean": 2555.5,
"valid_targets_min": 662
},
{
"epoch": 2.4047619047619047,
"grad_norm": 0.7944569505936786,
"learning_rate": 3.320996113056123e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14962106943130493,
"step": 1515,
"valid_targets_mean": 2968.1,
"valid_targets_min": 905
},
{
"epoch": 2.4126984126984126,
"grad_norm": 0.7895832341518009,
"learning_rate": 3.315042737138128e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.128577321767807,
"step": 1520,
"valid_targets_mean": 2297.6,
"valid_targets_min": 1123
},
{
"epoch": 2.4206349206349205,
"grad_norm": 0.6113596264456261,
"learning_rate": 3.309068763608919e-05,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14215974509716034,
"step": 1525,
"valid_targets_mean": 4635.9,
"valid_targets_min": 1311
},
{
"epoch": 2.4285714285714284,
"grad_norm": 0.7606294131509589,
"learning_rate": 3.303074286039285e-05,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15265774726867676,
"step": 1530,
"valid_targets_mean": 3241.4,
"valid_targets_min": 703
},
{
"epoch": 2.4365079365079367,
"grad_norm": 0.6597348036859395,
"learning_rate": 3.2970593983211694e-05,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16022004187107086,
"step": 1535,
"valid_targets_mean": 4045.4,
"valid_targets_min": 1319
},
{
"epoch": 2.4444444444444446,
"grad_norm": 0.6418418930113634,
"learning_rate": 3.2910241946661993e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1274852603673935,
"step": 1540,
"valid_targets_mean": 3660.1,
"valid_targets_min": 1576
},
{
"epoch": 2.4523809523809526,
"grad_norm": 0.5596752424003796,
"learning_rate": 3.2849687696042165e-05,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12781956791877747,
"step": 1545,
"valid_targets_mean": 3888.6,
"valid_targets_min": 930
},
{
"epoch": 2.4603174603174605,
"grad_norm": 0.6298774595726288,
"learning_rate": 3.2788932179817886e-05,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12249404937028885,
"step": 1550,
"valid_targets_mean": 3024.8,
"valid_targets_min": 938
},
{
"epoch": 2.4682539682539684,
"grad_norm": 0.8294293286080818,
"learning_rate": 3.2727976349607276e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16689524054527283,
"step": 1555,
"valid_targets_mean": 3518.5,
"valid_targets_min": 995
},
{
"epoch": 2.4761904761904763,
"grad_norm": 0.8170059407606398,
"learning_rate": 3.266682116016599e-05,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15669232606887817,
"step": 1560,
"valid_targets_mean": 2421.6,
"valid_targets_min": 1520
},
{
"epoch": 2.484126984126984,
"grad_norm": 0.6500010061538937,
"learning_rate": 3.260546756937227e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10150349140167236,
"step": 1565,
"valid_targets_mean": 2195.6,
"valid_targets_min": 1602
},
{
"epoch": 2.492063492063492,
"grad_norm": 0.8474876828092535,
"learning_rate": 3.254391653821192e-05,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16686615347862244,
"step": 1570,
"valid_targets_mean": 2120.5,
"valid_targets_min": 1215
},
{
"epoch": 2.5,
"grad_norm": 0.6084457929463493,
"learning_rate": 3.248216903076328e-05,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11863277852535248,
"step": 1575,
"valid_targets_mean": 3777.1,
"valid_targets_min": 1557
},
{
"epoch": 2.507936507936508,
"grad_norm": 0.6549666435127953,
"learning_rate": 3.24202260141821e-05,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1478644460439682,
"step": 1580,
"valid_targets_mean": 3566.9,
"valid_targets_min": 992
},
{
"epoch": 2.515873015873016,
"grad_norm": 0.7084095804077182,
"learning_rate": 3.235808845868641e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13560350239276886,
"step": 1585,
"valid_targets_mean": 3083.1,
"valid_targets_min": 654
},
{
"epoch": 2.5238095238095237,
"grad_norm": 0.7283622693375735,
"learning_rate": 3.229575733754132e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13665327429771423,
"step": 1590,
"valid_targets_mean": 3873.9,
"valid_targets_min": 1988
},
{
"epoch": 2.5317460317460316,
"grad_norm": 0.7813924734763139,
"learning_rate": 3.2233233627043765e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18560901284217834,
"step": 1595,
"valid_targets_mean": 3023.4,
"valid_targets_min": 1717
},
{
"epoch": 2.5396825396825395,
"grad_norm": 0.7724895632284718,
"learning_rate": 3.217051830650722e-05,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13543711602687836,
"step": 1600,
"valid_targets_mean": 2324.1,
"valid_targets_min": 1243
},
{
"epoch": 2.5476190476190474,
"grad_norm": 0.631251167859757,
"learning_rate": 3.210761235824639e-05,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19025763869285583,
"step": 1605,
"valid_targets_mean": 4070.1,
"valid_targets_min": 1186
},
{
"epoch": 2.5555555555555554,
"grad_norm": 0.6693047102178958,
"learning_rate": 3.204451676756175e-05,
"loss": 0.272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13068076968193054,
"step": 1610,
"valid_targets_mean": 2703.6,
"valid_targets_min": 733
},
{
"epoch": 2.5634920634920633,
"grad_norm": 0.6793425587783933,
"learning_rate": 3.198123252272419e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15108279883861542,
"step": 1615,
"valid_targets_mean": 3861.0,
"valid_targets_min": 2115
},
{
"epoch": 2.571428571428571,
"grad_norm": 0.7533398118442075,
"learning_rate": 3.1917760614959505e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17746326327323914,
"step": 1620,
"valid_targets_mean": 3869.5,
"valid_targets_min": 2101
},
{
"epoch": 2.5793650793650795,
"grad_norm": 0.6401603357735229,
"learning_rate": 3.1854102038432856e-05,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0972735583782196,
"step": 1625,
"valid_targets_mean": 2536.4,
"valid_targets_min": 853
},
{
"epoch": 2.5873015873015874,
"grad_norm": 0.6534800131136479,
"learning_rate": 3.17902577902332e-05,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1368650197982788,
"step": 1630,
"valid_targets_mean": 3628.0,
"valid_targets_min": 1049
},
{
"epoch": 2.5952380952380953,
"grad_norm": 0.6723421200741301,
"learning_rate": 3.172622887035771e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16636143624782562,
"step": 1635,
"valid_targets_mean": 3449.6,
"valid_targets_min": 1366
},
{
"epoch": 2.6031746031746033,
"grad_norm": 0.6086043667473161,
"learning_rate": 3.1662016281696073e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1077192947268486,
"step": 1640,
"valid_targets_mean": 3127.9,
"valid_targets_min": 1693
},
{
"epoch": 2.611111111111111,
"grad_norm": 0.5976415874014748,
"learning_rate": 3.15976210300148e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08958538621664047,
"step": 1645,
"valid_targets_mean": 2533.8,
"valid_targets_min": 1440
},
{
"epoch": 2.619047619047619,
"grad_norm": 0.7581524318153838,
"learning_rate": 3.153304412394143e-05,
"loss": 0.2873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1573348343372345,
"step": 1650,
"valid_targets_mean": 2123.6,
"valid_targets_min": 1378
},
{
"epoch": 2.626984126984127,
"grad_norm": 0.754404491585718,
"learning_rate": 3.146828657494883e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14607343077659607,
"step": 1655,
"valid_targets_mean": 2874.5,
"valid_targets_min": 702
},
{
"epoch": 2.634920634920635,
"grad_norm": 0.7776622806557849,
"learning_rate": 3.140334939733924e-05,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15422557294368744,
"step": 1660,
"valid_targets_mean": 2812.4,
"valid_targets_min": 682
},
{
"epoch": 2.642857142857143,
"grad_norm": 0.7851829681510233,
"learning_rate": 3.1338233608228455e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17594920098781586,
"step": 1665,
"valid_targets_mean": 4304.4,
"valid_targets_min": 1584
},
{
"epoch": 2.6507936507936507,
"grad_norm": 0.6186866548868446,
"learning_rate": 3.127294022752988e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12931489944458008,
"step": 1670,
"valid_targets_mean": 4241.0,
"valid_targets_min": 1549
},
{
"epoch": 2.6587301587301586,
"grad_norm": 0.6404478009955566,
"learning_rate": 3.120747027793854e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1313716024160385,
"step": 1675,
"valid_targets_mean": 3436.2,
"valid_targets_min": 1122
},
{
"epoch": 2.6666666666666665,
"grad_norm": 0.6424760221978681,
"learning_rate": 3.114182478491509e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14358645677566528,
"step": 1680,
"valid_targets_mean": 3566.9,
"valid_targets_min": 1824
},
{
"epoch": 2.674603174603175,
"grad_norm": 0.6212608954505446,
"learning_rate": 3.107600477666969e-05,
"loss": 0.2689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11525902152061462,
"step": 1685,
"valid_targets_mean": 4901.4,
"valid_targets_min": 1684
},
{
"epoch": 2.682539682539683,
"grad_norm": 0.7373215482236564,
"learning_rate": 3.1010011284146004e-05,
"loss": 0.2748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15655554831027985,
"step": 1690,
"valid_targets_mean": 2539.5,
"valid_targets_min": 836
},
{
"epoch": 2.6904761904761907,
"grad_norm": 0.7711994151976389,
"learning_rate": 3.0943845341004944e-05,
"loss": 0.2856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15932291746139526,
"step": 1695,
"valid_targets_mean": 2453.8,
"valid_targets_min": 627
},
{
"epoch": 2.6984126984126986,
"grad_norm": 0.5832119782072631,
"learning_rate": 3.087750798360856e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09954415261745453,
"step": 1700,
"valid_targets_mean": 3089.4,
"valid_targets_min": 982
},
{
"epoch": 2.7063492063492065,
"grad_norm": 0.6507828484721623,
"learning_rate": 3.0811000251003774e-05,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15949490666389465,
"step": 1705,
"valid_targets_mean": 3973.5,
"valid_targets_min": 1863
},
{
"epoch": 2.7142857142857144,
"grad_norm": 0.647286678324319,
"learning_rate": 3.074432318490608e-05,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16663986444473267,
"step": 1710,
"valid_targets_mean": 3909.6,
"valid_targets_min": 1870
},
{
"epoch": 2.7222222222222223,
"grad_norm": 0.5662716434730383,
"learning_rate": 3.067747782968328e-05,
"loss": 0.2761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12369729578495026,
"step": 1715,
"valid_targets_mean": 4857.1,
"valid_targets_min": 2173
},
{
"epoch": 2.7301587301587302,
"grad_norm": 0.6836298091917609,
"learning_rate": 3.0610465232339096e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11899368464946747,
"step": 1720,
"valid_targets_mean": 3117.0,
"valid_targets_min": 899
},
{
"epoch": 2.738095238095238,
"grad_norm": 0.611020228050993,
"learning_rate": 3.054328644249677e-05,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11934395879507065,
"step": 1725,
"valid_targets_mean": 2926.1,
"valid_targets_min": 1033
},
{
"epoch": 2.746031746031746,
"grad_norm": 0.7971191409966951,
"learning_rate": 3.047594251238265e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18401601910591125,
"step": 1730,
"valid_targets_mean": 3678.5,
"valid_targets_min": 1815
},
{
"epoch": 2.753968253968254,
"grad_norm": 0.6824521691463085,
"learning_rate": 3.0408434496809643e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14168040454387665,
"step": 1735,
"valid_targets_mean": 2618.5,
"valid_targets_min": 1130
},
{
"epoch": 2.761904761904762,
"grad_norm": 0.7071997600045877,
"learning_rate": 3.034076345316079e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13625219464302063,
"step": 1740,
"valid_targets_mean": 3389.4,
"valid_targets_min": 777
},
{
"epoch": 2.7698412698412698,
"grad_norm": 0.6570185747900452,
"learning_rate": 3.0272930441372628e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12578660249710083,
"step": 1745,
"valid_targets_mean": 3387.0,
"valid_targets_min": 873
},
{
"epoch": 2.7777777777777777,
"grad_norm": 0.5756355415915643,
"learning_rate": 3.02049365239186e-05,
"loss": 0.2599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13883277773857117,
"step": 1750,
"valid_targets_mean": 4081.4,
"valid_targets_min": 984
},
{
"epoch": 2.7857142857142856,
"grad_norm": 0.6741636937753623,
"learning_rate": 3.0136782765792455e-05,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14945513010025024,
"step": 1755,
"valid_targets_mean": 3490.8,
"valid_targets_min": 824
},
{
"epoch": 2.7936507936507935,
"grad_norm": 0.6285050348403557,
"learning_rate": 3.0068470234491517e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16284587979316711,
"step": 1760,
"valid_targets_mean": 4642.1,
"valid_targets_min": 1071
},
{
"epoch": 2.8015873015873014,
"grad_norm": 0.6692873837736333,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11234371364116669,
"step": 1765,
"valid_targets_mean": 3148.2,
"valid_targets_min": 532
},
{
"epoch": 2.8095238095238093,
"grad_norm": 0.6308462732358487,
"learning_rate": 2.993137313477223e-05,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09374731779098511,
"step": 1770,
"valid_targets_mean": 2508.5,
"valid_targets_min": 1356
},
{
"epoch": 2.817460317460317,
"grad_norm": 0.7007377433335262,
"learning_rate": 2.9862590713715837e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1225220113992691,
"step": 1775,
"valid_targets_mean": 2797.4,
"valid_targets_min": 932
},
{
"epoch": 2.825396825396825,
"grad_norm": 0.6598142297768089,
"learning_rate": 2.9793653814174957e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13078439235687256,
"step": 1780,
"valid_targets_mean": 3160.2,
"valid_targets_min": 1406
},
{
"epoch": 2.8333333333333335,
"grad_norm": 0.6341362087786145,
"learning_rate": 2.9724563515913317e-05,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08914564549922943,
"step": 1785,
"valid_targets_mean": 2214.0,
"valid_targets_min": 486
},
{
"epoch": 2.8412698412698414,
"grad_norm": 0.7609575143650333,
"learning_rate": 2.9655320901097348e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15402570366859436,
"step": 1790,
"valid_targets_mean": 2849.5,
"valid_targets_min": 1404
},
{
"epoch": 2.8492063492063493,
"grad_norm": 0.6657562541253584,
"learning_rate": 2.9585927054279224e-05,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.143843412399292,
"step": 1795,
"valid_targets_mean": 3437.2,
"valid_targets_min": 1651
},
{
"epoch": 2.857142857142857,
"grad_norm": 0.6799877740404671,
"learning_rate": 2.951638306237988e-05,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15773284435272217,
"step": 1800,
"valid_targets_mean": 2877.4,
"valid_targets_min": 1139
},
{
"epoch": 2.865079365079365,
"grad_norm": 0.6865473240955069,
"learning_rate": 2.9446690014671976e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1253039836883545,
"step": 1805,
"valid_targets_mean": 2390.0,
"valid_targets_min": 997
},
{
"epoch": 2.873015873015873,
"grad_norm": 0.6534863995749159,
"learning_rate": 2.937684900276285e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11391299962997437,
"step": 1810,
"valid_targets_mean": 2806.4,
"valid_targets_min": 1592
},
{
"epoch": 2.880952380952381,
"grad_norm": 0.7567889432998731,
"learning_rate": 2.9306861120577416e-05,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11856131255626678,
"step": 1815,
"valid_targets_mean": 2440.9,
"valid_targets_min": 939
},
{
"epoch": 2.888888888888889,
"grad_norm": 0.6635665729697707,
"learning_rate": 2.923672746434103e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11890023946762085,
"step": 1820,
"valid_targets_mean": 3114.4,
"valid_targets_min": 645
},
{
"epoch": 2.8968253968253967,
"grad_norm": 0.7898960244652132,
"learning_rate": 2.9166449132562303e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2273479551076889,
"step": 1825,
"valid_targets_mean": 3445.4,
"valid_targets_min": 615
},
{
"epoch": 2.9047619047619047,
"grad_norm": 0.6221253005823774,
"learning_rate": 2.9096027226015927e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16060924530029297,
"step": 1830,
"valid_targets_mean": 3911.6,
"valid_targets_min": 1618
},
{
"epoch": 2.9126984126984126,
"grad_norm": 0.6890919052022301,
"learning_rate": 2.9025462847725405e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15114042162895203,
"step": 1835,
"valid_targets_mean": 3334.8,
"valid_targets_min": 1413
},
{
"epoch": 2.9206349206349205,
"grad_norm": 0.7151703994390879,
"learning_rate": 2.8954757102945798e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.164110004901886,
"step": 1840,
"valid_targets_mean": 3427.1,
"valid_targets_min": 1160
},
{
"epoch": 2.928571428571429,
"grad_norm": 0.6725713608557474,
"learning_rate": 2.888391109914638e-05,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17118103802204132,
"step": 1845,
"valid_targets_mean": 4161.8,
"valid_targets_min": 1537
},
{
"epoch": 2.9365079365079367,
"grad_norm": 0.6210771507140483,
"learning_rate": 2.8812925945993333e-05,
"loss": 0.2856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10453899949789047,
"step": 1850,
"valid_targets_mean": 3119.2,
"valid_targets_min": 937
},
{
"epoch": 2.9444444444444446,
"grad_norm": 0.6584848576192016,
"learning_rate": 2.8741802755332332e-05,
"loss": 0.288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15300224721431732,
"step": 1855,
"valid_targets_mean": 3997.0,
"valid_targets_min": 968
},
{
"epoch": 2.9523809523809526,
"grad_norm": 0.603729636604423,
"learning_rate": 2.8670542641171155e-05,
"loss": 0.2735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16688242554664612,
"step": 1860,
"valid_targets_mean": 3805.8,
"valid_targets_min": 1368
},
{
"epoch": 2.9603174603174605,
"grad_norm": 0.6685639760048532,
"learning_rate": 2.859914671966221e-05,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15483403205871582,
"step": 1865,
"valid_targets_mean": 3771.5,
"valid_targets_min": 2012
},
{
"epoch": 2.9682539682539684,
"grad_norm": 0.7257652525758371,
"learning_rate": 2.8527616109085082e-05,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11175280809402466,
"step": 1870,
"valid_targets_mean": 2321.2,
"valid_targets_min": 1040
},
{
"epoch": 2.9761904761904763,
"grad_norm": 0.764225120374443,
"learning_rate": 2.8455951929828977e-05,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16258296370506287,
"step": 1875,
"valid_targets_mean": 2744.0,
"valid_targets_min": 1181
},
{
"epoch": 2.984126984126984,
"grad_norm": 0.7040782057209479,
"learning_rate": 2.8384155304375223e-05,
"loss": 0.2815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2076944261789322,
"step": 1880,
"valid_targets_mean": 4440.1,
"valid_targets_min": 1859
},
{
"epoch": 2.992063492063492,
"grad_norm": 0.5526066260270843,
"learning_rate": 2.8312227357279646e-05,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1588117629289627,
"step": 1885,
"valid_targets_mean": 4321.2,
"valid_targets_min": 1174
},
{
"epoch": 3.0,
"grad_norm": 0.7083973280267318,
"learning_rate": 2.8240169215154977e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11426911503076553,
"step": 1890,
"valid_targets_mean": 2519.1,
"valid_targets_min": 1488
},
{
"epoch": 3.007936507936508,
"grad_norm": 0.6902028100549552,
"learning_rate": 2.8167982006653196e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12100070714950562,
"step": 1895,
"valid_targets_mean": 2715.6,
"valid_targets_min": 944
},
{
"epoch": 3.015873015873016,
"grad_norm": 0.7498148150106853,
"learning_rate": 2.8095666862447876e-05,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15154170989990234,
"step": 1900,
"valid_targets_mean": 3611.8,
"valid_targets_min": 1506
},
{
"epoch": 3.0238095238095237,
"grad_norm": 0.6616656629988206,
"learning_rate": 2.8023224915216442e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1271711140871048,
"step": 1905,
"valid_targets_mean": 3507.9,
"valid_targets_min": 936
},
{
"epoch": 3.0317460317460316,
"grad_norm": 0.7116856168102649,
"learning_rate": 2.795065729962244e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08189952373504639,
"step": 1910,
"valid_targets_mean": 2039.9,
"valid_targets_min": 1125
},
{
"epoch": 3.0396825396825395,
"grad_norm": 0.6876408809777227,
"learning_rate": 2.7877965152297785e-05,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10088761150836945,
"step": 1915,
"valid_targets_mean": 2376.2,
"valid_targets_min": 1454
},
{
"epoch": 3.0476190476190474,
"grad_norm": 0.6942636265425131,
"learning_rate": 2.780514961182492e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1270643174648285,
"step": 1920,
"valid_targets_mean": 3030.1,
"valid_targets_min": 1496
},
{
"epoch": 3.0555555555555554,
"grad_norm": 0.6047340947825474,
"learning_rate": 2.773221181871903e-05,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1178026869893074,
"step": 1925,
"valid_targets_mean": 4042.6,
"valid_targets_min": 1537
},
{
"epoch": 3.0634920634920633,
"grad_norm": 0.6821898699763301,
"learning_rate": 2.765915291541013e-05,
"loss": 0.2527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13922007381916046,
"step": 1930,
"valid_targets_mean": 3912.5,
"valid_targets_min": 1016
},
{
"epoch": 3.0714285714285716,
"grad_norm": 0.6551781793298332,
"learning_rate": 2.7585974046225206e-05,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14014190435409546,
"step": 1935,
"valid_targets_mean": 3799.6,
"valid_targets_min": 1019
},
{
"epoch": 3.0793650793650795,
"grad_norm": 0.7821365657217646,
"learning_rate": 2.751267635737027e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1164986789226532,
"step": 1940,
"valid_targets_mean": 2321.2,
"valid_targets_min": 846
},
{
"epoch": 3.0873015873015874,
"grad_norm": 0.6698276676313706,
"learning_rate": 2.7439260996912423e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11518267542123795,
"step": 1945,
"valid_targets_mean": 3101.5,
"valid_targets_min": 1563
},
{
"epoch": 3.0952380952380953,
"grad_norm": 0.7281910335267264,
"learning_rate": 2.7365729114761862e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1856643557548523,
"step": 1950,
"valid_targets_mean": 3758.4,
"valid_targets_min": 1446
},
{
"epoch": 3.1031746031746033,
"grad_norm": 0.8454083755018548,
"learning_rate": 2.729208186265386e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17740434408187866,
"step": 1955,
"valid_targets_mean": 3700.9,
"valid_targets_min": 836
},
{
"epoch": 3.111111111111111,
"grad_norm": 0.8235684513843857,
"learning_rate": 2.721832039413077e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12159430235624313,
"step": 1960,
"valid_targets_mean": 2358.2,
"valid_targets_min": 900
},
{
"epoch": 3.119047619047619,
"grad_norm": 0.7603822952932935,
"learning_rate": 2.7144445864523887e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11871971189975739,
"step": 1965,
"valid_targets_mean": 2330.9,
"valid_targets_min": 778
},
{
"epoch": 3.126984126984127,
"grad_norm": 0.5890854643098785,
"learning_rate": 2.7070459430935407e-05,
"loss": 0.244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11397400498390198,
"step": 1970,
"valid_targets_mean": 3696.4,
"valid_targets_min": 1454
},
{
"epoch": 3.134920634920635,
"grad_norm": 0.6251976447943539,
"learning_rate": 2.69963622522203e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10502277314662933,
"step": 1975,
"valid_targets_mean": 3759.9,
"valid_targets_min": 2157
},
{
"epoch": 3.142857142857143,
"grad_norm": 0.723522815940443,
"learning_rate": 2.6922155488968117e-05,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10363540053367615,
"step": 1980,
"valid_targets_mean": 2637.6,
"valid_targets_min": 680
},
{
"epoch": 3.1507936507936507,
"grad_norm": 0.890979704609736,
"learning_rate": 2.684784030348486e-05,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13063833117485046,
"step": 1985,
"valid_targets_mean": 2054.8,
"valid_targets_min": 1050
},
{
"epoch": 3.1587301587301586,
"grad_norm": 0.7071717645076813,
"learning_rate": 2.6773417859774755e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11484183371067047,
"step": 1990,
"valid_targets_mean": 3003.2,
"valid_targets_min": 1033
},
{
"epoch": 3.1666666666666665,
"grad_norm": 0.7255166589054973,
"learning_rate": 2.669888932352201e-05,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10529197752475739,
"step": 1995,
"valid_targets_mean": 2306.5,
"valid_targets_min": 1230
},
{
"epoch": 3.1746031746031744,
"grad_norm": 0.7002772175531771,
"learning_rate": 2.662425586207259e-05,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12117639183998108,
"step": 2000,
"valid_targets_mean": 3534.6,
"valid_targets_min": 1424
},
{
"epoch": 3.1825396825396823,
"grad_norm": 0.646490577280726,
"learning_rate": 2.6549518644415876e-05,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09091825038194656,
"step": 2005,
"valid_targets_mean": 2662.6,
"valid_targets_min": 1489
},
{
"epoch": 3.1904761904761907,
"grad_norm": 0.6342896994103852,
"learning_rate": 2.6474678841166426e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1556168496608734,
"step": 2010,
"valid_targets_mean": 4756.2,
"valid_targets_min": 1659
},
{
"epoch": 3.1984126984126986,
"grad_norm": 0.6522004622714066,
"learning_rate": 2.639973762454558e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12138301134109497,
"step": 2015,
"valid_targets_mean": 3672.4,
"valid_targets_min": 1612
},
{
"epoch": 3.2063492063492065,
"grad_norm": 0.7782670981533159,
"learning_rate": 2.6324696168363134e-05,
"loss": 0.2527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1658809781074524,
"step": 2020,
"valid_targets_mean": 3090.1,
"valid_targets_min": 1357
},
{
"epoch": 3.2142857142857144,
"grad_norm": 0.6622860830034212,
"learning_rate": 2.624955564799894e-05,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1196448802947998,
"step": 2025,
"valid_targets_mean": 3399.8,
"valid_targets_min": 706
},
{
"epoch": 3.2222222222222223,
"grad_norm": 0.693901810628061,
"learning_rate": 2.617431724038451e-05,
"loss": 0.2486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10215766727924347,
"step": 2030,
"valid_targets_mean": 2399.5,
"valid_targets_min": 551
},
{
"epoch": 3.2301587301587302,
"grad_norm": 0.5671979640230917,
"learning_rate": 2.609898212398455e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16594891250133514,
"step": 2035,
"valid_targets_mean": 5821.9,
"valid_targets_min": 1505
},
{
"epoch": 3.238095238095238,
"grad_norm": 0.6974681739689081,
"learning_rate": 2.6023551478778535e-05,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11858563125133514,
"step": 2040,
"valid_targets_mean": 2829.8,
"valid_targets_min": 773
},
{
"epoch": 3.246031746031746,
"grad_norm": 0.6882592331713957,
"learning_rate": 2.5948026486242225e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10707972943782806,
"step": 2045,
"valid_targets_mean": 3013.4,
"valid_targets_min": 1161
},
{
"epoch": 3.253968253968254,
"grad_norm": 0.6051374206215899,
"learning_rate": 2.5872408329329136e-05,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14780555665493011,
"step": 2050,
"valid_targets_mean": 6003.6,
"valid_targets_min": 2869
},
{
"epoch": 3.261904761904762,
"grad_norm": 0.8178419818692619,
"learning_rate": 2.5796698192452016e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13839825987815857,
"step": 2055,
"valid_targets_mean": 3007.5,
"valid_targets_min": 847
},
{
"epoch": 3.2698412698412698,
"grad_norm": 0.610892128183204,
"learning_rate": 2.572089726146432e-05,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.131939098238945,
"step": 2060,
"valid_targets_mean": 4979.1,
"valid_targets_min": 821
},
{
"epoch": 3.2777777777777777,
"grad_norm": 0.5925456999380748,
"learning_rate": 2.564500672364162e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08675329387187958,
"step": 2065,
"valid_targets_mean": 3128.8,
"valid_targets_min": 1033
},
{
"epoch": 3.2857142857142856,
"grad_norm": 0.7101170401554764,
"learning_rate": 2.556902776766298e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11017313599586487,
"step": 2070,
"valid_targets_mean": 2635.2,
"valid_targets_min": 1656
},
{
"epoch": 3.2936507936507935,
"grad_norm": 0.6737500763312219,
"learning_rate": 2.5492961583592397e-05,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11181756108999252,
"step": 2075,
"valid_targets_mean": 2606.4,
"valid_targets_min": 1535
},
{
"epoch": 3.3015873015873014,
"grad_norm": 0.7396901842301878,
"learning_rate": 2.5416809362860107e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13949820399284363,
"step": 2080,
"valid_targets_mean": 3067.6,
"valid_targets_min": 1132
},
{
"epoch": 3.3095238095238093,
"grad_norm": 0.6498890292466925,
"learning_rate": 2.5340572298243946e-05,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10242730379104614,
"step": 2085,
"valid_targets_mean": 2982.5,
"valid_targets_min": 1488
},
{
"epoch": 3.317460317460317,
"grad_norm": 0.7574837036969985,
"learning_rate": 2.5264251583850677e-05,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1579362004995346,
"step": 2090,
"valid_targets_mean": 3493.5,
"valid_targets_min": 1290
},
{
"epoch": 3.3253968253968256,
"grad_norm": 0.5407051448256301,
"learning_rate": 2.518784841509726e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11689899861812592,
"step": 2095,
"valid_targets_mean": 4560.6,
"valid_targets_min": 933
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.6970226932960573,
"learning_rate": 2.511136398869216e-05,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13105079531669617,
"step": 2100,
"valid_targets_mean": 3603.1,
"valid_targets_min": 331
},
{
"epoch": 3.3412698412698414,
"grad_norm": 0.7186804216812557,
"learning_rate": 2.503479950261658e-05,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13403379917144775,
"step": 2105,
"valid_targets_mean": 2903.1,
"valid_targets_min": 1096
},
{
"epoch": 3.3492063492063493,
"grad_norm": 0.6455942984531485,
"learning_rate": 2.4958156156105693e-05,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10922306776046753,
"step": 2110,
"valid_targets_mean": 3211.5,
"valid_targets_min": 2118
},
{
"epoch": 3.357142857142857,
"grad_norm": 0.6571243872308732,
"learning_rate": 2.4881435149629892e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13601714372634888,
"step": 2115,
"valid_targets_mean": 3930.4,
"valid_targets_min": 1427
},
{
"epoch": 3.365079365079365,
"grad_norm": 0.6585273608503487,
"learning_rate": 2.4804637684875937e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10247397422790527,
"step": 2120,
"valid_targets_mean": 2421.5,
"valid_targets_min": 971
},
{
"epoch": 3.373015873015873,
"grad_norm": 0.62544048579586,
"learning_rate": 2.4727764964728177e-05,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16413845121860504,
"step": 2125,
"valid_targets_mean": 4857.9,
"valid_targets_min": 1029
},
{
"epoch": 3.380952380952381,
"grad_norm": 0.6792630869673345,
"learning_rate": 2.4650818193249693e-05,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12296905368566513,
"step": 2130,
"valid_targets_mean": 3710.6,
"valid_targets_min": 1830
},
{
"epoch": 3.388888888888889,
"grad_norm": 0.6779730353915933,
"learning_rate": 2.4573798575663425e-05,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11248013377189636,
"step": 2135,
"valid_targets_mean": 2979.5,
"valid_targets_min": 701
},
{
"epoch": 3.3968253968253967,
"grad_norm": 0.9098770112161331,
"learning_rate": 2.4496707318333323e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12486522644758224,
"step": 2140,
"valid_targets_mean": 1802.4,
"valid_targets_min": 645
},
{
"epoch": 3.4047619047619047,
"grad_norm": 0.7636101057011379,
"learning_rate": 2.441954562874541e-05,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.125074565410614,
"step": 2145,
"valid_targets_mean": 2825.0,
"valid_targets_min": 1558
},
{
"epoch": 3.4126984126984126,
"grad_norm": 0.6467450666633284,
"learning_rate": 2.434231471548893e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08474473655223846,
"step": 2150,
"valid_targets_mean": 3010.1,
"valid_targets_min": 750
},
{
"epoch": 3.4206349206349205,
"grad_norm": 0.6917977015493815,
"learning_rate": 2.4265015788237348e-05,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1237451583147049,
"step": 2155,
"valid_targets_mean": 2535.2,
"valid_targets_min": 1103
},
{
"epoch": 3.4285714285714284,
"grad_norm": 0.7739173113165484,
"learning_rate": 2.4187650057729465e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13617797195911407,
"step": 2160,
"valid_targets_mean": 2652.1,
"valid_targets_min": 693
},
{
"epoch": 3.4365079365079367,
"grad_norm": 0.6831983748541813,
"learning_rate": 2.4110218735750403e-05,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12043888866901398,
"step": 2165,
"valid_targets_mean": 3557.0,
"valid_targets_min": 1053
},
{
"epoch": 3.4444444444444446,
"grad_norm": 0.6052935127475482,
"learning_rate": 2.4032723035112667e-05,
"loss": 0.2385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10145443677902222,
"step": 2170,
"valid_targets_mean": 4060.8,
"valid_targets_min": 1215
},
{
"epoch": 3.4523809523809526,
"grad_norm": 0.7675317267799375,
"learning_rate": 2.3955164169637124e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08529975265264511,
"step": 2175,
"valid_targets_mean": 1873.2,
"valid_targets_min": 641
},
{
"epoch": 3.4603174603174605,
"grad_norm": 0.6683938001153137,
"learning_rate": 2.387754335413398e-05,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10772879421710968,
"step": 2180,
"valid_targets_mean": 3114.6,
"valid_targets_min": 1156
},
{
"epoch": 3.4682539682539684,
"grad_norm": 0.6735296084441879,
"learning_rate": 2.3799861804383807e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13499006628990173,
"step": 2185,
"valid_targets_mean": 3644.8,
"valid_targets_min": 1400
},
{
"epoch": 3.4761904761904763,
"grad_norm": 0.6831817897125874,
"learning_rate": 2.3722120737118414e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07938480377197266,
"step": 2190,
"valid_targets_mean": 1924.0,
"valid_targets_min": 1054
},
{
"epoch": 3.484126984126984,
"grad_norm": 0.6737327071370827,
"learning_rate": 2.3644321370001868e-05,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1572818160057068,
"step": 2195,
"valid_targets_mean": 2819.1,
"valid_targets_min": 1142
},
{
"epoch": 3.492063492063492,
"grad_norm": 0.6691135799512201,
"learning_rate": 2.3566464921611393e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11640235781669617,
"step": 2200,
"valid_targets_mean": 2922.6,
"valid_targets_min": 770
},
{
"epoch": 3.5,
"grad_norm": 0.6587392719241073,
"learning_rate": 2.348855261141827e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10942356288433075,
"step": 2205,
"valid_targets_mean": 3722.4,
"valid_targets_min": 858
},
{
"epoch": 3.507936507936508,
"grad_norm": 0.750713040033646,
"learning_rate": 2.341058565976874e-05,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13870318233966827,
"step": 2210,
"valid_targets_mean": 2861.6,
"valid_targets_min": 1779
},
{
"epoch": 3.515873015873016,
"grad_norm": 0.7491380731832215,
"learning_rate": 2.3332565287864918e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14582455158233643,
"step": 2215,
"valid_targets_mean": 2783.4,
"valid_targets_min": 1314
},
{
"epoch": 3.5238095238095237,
"grad_norm": 0.6351357539271595,
"learning_rate": 2.325449271774563e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11707961559295654,
"step": 2220,
"valid_targets_mean": 3604.9,
"valid_targets_min": 1073
},
{
"epoch": 3.5317460317460316,
"grad_norm": 0.8231068256271177,
"learning_rate": 2.3176369172267286e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19035357236862183,
"step": 2225,
"valid_targets_mean": 3547.5,
"valid_targets_min": 1823
},
{
"epoch": 3.5396825396825395,
"grad_norm": 0.6637559646990401,
"learning_rate": 2.3098195875084732e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19387897849082947,
"step": 2230,
"valid_targets_mean": 4797.4,
"valid_targets_min": 1702
},
{
"epoch": 3.5476190476190474,
"grad_norm": 0.5840086031255308,
"learning_rate": 2.301997405063208e-05,
"loss": 0.2491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13106292486190796,
"step": 2235,
"valid_targets_mean": 4836.0,
"valid_targets_min": 2196
},
{
"epoch": 3.5555555555555554,
"grad_norm": 0.6883285297059432,
"learning_rate": 2.2941704924103535e-05,
"loss": 0.2409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0974530503153801,
"step": 2240,
"valid_targets_mean": 2712.2,
"valid_targets_min": 574
},
{
"epoch": 3.5634920634920633,
"grad_norm": 0.6118340955483631,
"learning_rate": 2.2863389721434165e-05,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13404448330402374,
"step": 2245,
"valid_targets_mean": 3707.8,
"valid_targets_min": 725
},
{
"epoch": 3.571428571428571,
"grad_norm": 0.6823518338026194,
"learning_rate": 2.2785029669280775e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09207911789417267,
"step": 2250,
"valid_targets_mean": 2036.5,
"valid_targets_min": 806
},
{
"epoch": 3.5793650793650795,
"grad_norm": 0.722255561298478,
"learning_rate": 2.2706625995002626e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11790738254785538,
"step": 2255,
"valid_targets_mean": 2746.2,
"valid_targets_min": 1230
},
{
"epoch": 3.5873015873015874,
"grad_norm": 0.6732026842214269,
"learning_rate": 2.262817992664224e-05,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14672116935253143,
"step": 2260,
"valid_targets_mean": 4038.0,
"valid_targets_min": 1675
},
{
"epoch": 3.5952380952380953,
"grad_norm": 0.781949743871262,
"learning_rate": 2.2549692692906158e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13185100257396698,
"step": 2265,
"valid_targets_mean": 2627.5,
"valid_targets_min": 567
},
{
"epoch": 3.6031746031746033,
"grad_norm": 0.7262791657638447,
"learning_rate": 2.24711655231457e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20940609276294708,
"step": 2270,
"valid_targets_mean": 5433.1,
"valid_targets_min": 1399
},
{
"epoch": 3.611111111111111,
"grad_norm": 0.784848270932435,
"learning_rate": 2.2392599647337724e-05,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12663155794143677,
"step": 2275,
"valid_targets_mean": 2872.4,
"valid_targets_min": 1406
},
{
"epoch": 3.619047619047619,
"grad_norm": 0.6453755291298704,
"learning_rate": 2.23139962960653e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16382941603660583,
"step": 2280,
"valid_targets_mean": 5086.6,
"valid_targets_min": 1625
},
{
"epoch": 3.626984126984127,
"grad_norm": 0.6243214368704214,
"learning_rate": 2.2235356700498528e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09489156305789948,
"step": 2285,
"valid_targets_mean": 2987.9,
"valid_targets_min": 941
},
{
"epoch": 3.634920634920635,
"grad_norm": 0.728831644905216,
"learning_rate": 2.2156682092375175e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12532003223896027,
"step": 2290,
"valid_targets_mean": 3108.4,
"valid_targets_min": 1380
},
{
"epoch": 3.642857142857143,
"grad_norm": 0.6766396276223146,
"learning_rate": 2.2077973703981423e-05,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10541743785142899,
"step": 2295,
"valid_targets_mean": 3278.2,
"valid_targets_min": 1427
},
{
"epoch": 3.6507936507936507,
"grad_norm": 0.728273106075939,
"learning_rate": 2.1999232768132552e-05,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13243606686592102,
"step": 2300,
"valid_targets_mean": 3081.8,
"valid_targets_min": 1017
},
{
"epoch": 3.6587301587301586,
"grad_norm": 0.6367194277051416,
"learning_rate": 2.1920460518153637e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14943772554397583,
"step": 2305,
"valid_targets_mean": 3977.2,
"valid_targets_min": 1438
},
{
"epoch": 3.6666666666666665,
"grad_norm": 0.6636887290598896,
"learning_rate": 2.1841658187860232e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14413931965827942,
"step": 2310,
"valid_targets_mean": 3984.5,
"valid_targets_min": 950
},
{
"epoch": 3.674603174603175,
"grad_norm": 0.6924824608448896,
"learning_rate": 2.176282701153904e-05,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10788863897323608,
"step": 2315,
"valid_targets_mean": 3827.2,
"valid_targets_min": 1204
},
{
"epoch": 3.682539682539683,
"grad_norm": 0.7500867165407975,
"learning_rate": 2.1683968223928572e-05,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11223761737346649,
"step": 2320,
"valid_targets_mean": 2388.6,
"valid_targets_min": 958
},
{
"epoch": 3.6904761904761907,
"grad_norm": 0.6150664924768718,
"learning_rate": 2.1605083060199835e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13505640625953674,
"step": 2325,
"valid_targets_mean": 3697.6,
"valid_targets_min": 716
},
{
"epoch": 3.6984126984126986,
"grad_norm": 0.7555466609315117,
"learning_rate": 2.152617275593694e-05,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1521606296300888,
"step": 2330,
"valid_targets_mean": 3023.5,
"valid_targets_min": 1520
},
{
"epoch": 3.7063492063492065,
"grad_norm": 0.7029257644513573,
"learning_rate": 2.144723854711781e-05,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16023379564285278,
"step": 2335,
"valid_targets_mean": 3591.4,
"valid_targets_min": 802
},
{
"epoch": 3.7142857142857144,
"grad_norm": 0.6918176391496552,
"learning_rate": 2.1368281670094766e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13360567390918732,
"step": 2340,
"valid_targets_mean": 3050.0,
"valid_targets_min": 1247
},
{
"epoch": 3.7222222222222223,
"grad_norm": 0.6428044957155385,
"learning_rate": 2.1289303361575175e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11518841981887817,
"step": 2345,
"valid_targets_mean": 3680.9,
"valid_targets_min": 905
},
{
"epoch": 3.7301587301587302,
"grad_norm": 0.6973754385222307,
"learning_rate": 2.121030485860211e-05,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1621910184621811,
"step": 2350,
"valid_targets_mean": 3594.0,
"valid_targets_min": 859
},
{
"epoch": 3.738095238095238,
"grad_norm": 0.7349289761819597,
"learning_rate": 2.113128739853493e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13967764377593994,
"step": 2355,
"valid_targets_mean": 3569.4,
"valid_targets_min": 1369
},
{
"epoch": 3.746031746031746,
"grad_norm": 0.7522020159710882,
"learning_rate": 2.1052252219029944e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12228189408779144,
"step": 2360,
"valid_targets_mean": 2334.9,
"valid_targets_min": 1448
},
{
"epoch": 3.753968253968254,
"grad_norm": 0.5729484428634234,
"learning_rate": 2.0973200558020967e-05,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09384536743164062,
"step": 2365,
"valid_targets_mean": 3340.4,
"valid_targets_min": 1206
},
{
"epoch": 3.761904761904762,
"grad_norm": 0.6492714046787679,
"learning_rate": 2.0894133653700005e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12654618918895721,
"step": 2370,
"valid_targets_mean": 3602.9,
"valid_targets_min": 1014
},
{
"epoch": 3.7698412698412698,
"grad_norm": 0.697904697849088,
"learning_rate": 2.0815052744497795e-05,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14032703638076782,
"step": 2375,
"valid_targets_mean": 3229.0,
"valid_targets_min": 645
},
{
"epoch": 3.7777777777777777,
"grad_norm": 0.7308391868980172,
"learning_rate": 2.0735959069064434e-05,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12916788458824158,
"step": 2380,
"valid_targets_mean": 2837.2,
"valid_targets_min": 1121
},
{
"epoch": 3.7857142857142856,
"grad_norm": 0.691499175418863,
"learning_rate": 2.065685386624999e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1294250339269638,
"step": 2385,
"valid_targets_mean": 3112.2,
"valid_targets_min": 1521
},
{
"epoch": 3.7936507936507935,
"grad_norm": 0.5969033546170376,
"learning_rate": 2.0577738375085076e-05,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09190475195646286,
"step": 2390,
"valid_targets_mean": 2841.9,
"valid_targets_min": 1244
},
{
"epoch": 3.8015873015873014,
"grad_norm": 0.7220359693489179,
"learning_rate": 2.0498613834761462e-05,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16056948900222778,
"step": 2395,
"valid_targets_mean": 3376.4,
"valid_targets_min": 1264
},
{
"epoch": 3.8095238095238093,
"grad_norm": 1.2099115424108589,
"learning_rate": 2.041948148461264e-05,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13240090012550354,
"step": 2400,
"valid_targets_mean": 3901.5,
"valid_targets_min": 1065
},
{
"epoch": 3.817460317460317,
"grad_norm": 0.7893114301162967,
"learning_rate": 2.0340342564094436e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1543714702129364,
"step": 2405,
"valid_targets_mean": 2780.1,
"valid_targets_min": 1198
},
{
"epoch": 3.825396825396825,
"grad_norm": 0.6632506580999861,
"learning_rate": 2.0261198312765597e-05,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12213265150785446,
"step": 2410,
"valid_targets_mean": 3707.4,
"valid_targets_min": 1452
},
{
"epoch": 3.8333333333333335,
"grad_norm": 0.5666934298053149,
"learning_rate": 2.0182049970268355e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11713714152574539,
"step": 2415,
"valid_targets_mean": 4613.4,
"valid_targets_min": 1868
},
{
"epoch": 3.8412698412698414,
"grad_norm": 0.7113706519827881,
"learning_rate": 2.010289877630902e-05,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12731067836284637,
"step": 2420,
"valid_targets_mean": 4011.0,
"valid_targets_min": 1569
},
{
"epoch": 3.8492063492063493,
"grad_norm": 0.5910058190767906,
"learning_rate": 2.002374597063858e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0885014608502388,
"step": 2425,
"valid_targets_mean": 3732.4,
"valid_targets_min": 1372
},
{
"epoch": 3.857142857142857,
"grad_norm": 0.613181664922125,
"learning_rate": 1.9944592793033255e-05,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1397075355052948,
"step": 2430,
"valid_targets_mean": 3596.5,
"valid_targets_min": 1614
},
{
"epoch": 3.865079365079365,
"grad_norm": 0.7433760742723559,
"learning_rate": 1.9865440483275086e-05,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11835931986570358,
"step": 2435,
"valid_targets_mean": 3025.0,
"valid_targets_min": 1014
},
{
"epoch": 3.873015873015873,
"grad_norm": 0.6605685240194553,
"learning_rate": 1.978629028113254e-05,
"loss": 0.2338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10053889453411102,
"step": 2440,
"valid_targets_mean": 2641.2,
"valid_targets_min": 615
},
{
"epoch": 3.880952380952381,
"grad_norm": 0.7119660876197761,
"learning_rate": 1.9707143426341058e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13378119468688965,
"step": 2445,
"valid_targets_mean": 3406.1,
"valid_targets_min": 1708
},
{
"epoch": 3.888888888888889,
"grad_norm": 0.671693312370587,
"learning_rate": 1.962800115858364e-05,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17709845304489136,
"step": 2450,
"valid_targets_mean": 4737.1,
"valid_targets_min": 1773
},
{
"epoch": 3.8968253968253967,
"grad_norm": 0.5187002193324203,
"learning_rate": 1.9548864717471472e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.114749014377594,
"step": 2455,
"valid_targets_mean": 5417.0,
"valid_targets_min": 2435
},
{
"epoch": 3.9047619047619047,
"grad_norm": 0.5690598952425717,
"learning_rate": 1.9469735342524454e-05,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1283632516860962,
"step": 2460,
"valid_targets_mean": 4894.6,
"valid_targets_min": 1517
},
{
"epoch": 3.9126984126984126,
"grad_norm": 0.8811218156014363,
"learning_rate": 1.939061427315179e-05,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14203287661075592,
"step": 2465,
"valid_targets_mean": 1957.8,
"valid_targets_min": 1215
},
{
"epoch": 3.9206349206349205,
"grad_norm": 0.7300566426187972,
"learning_rate": 1.931150274863265e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15685239434242249,
"step": 2470,
"valid_targets_mean": 3397.5,
"valid_targets_min": 1333
},
{
"epoch": 3.928571428571429,
"grad_norm": 0.6643843278715006,
"learning_rate": 1.9232402008096643e-05,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1505836546421051,
"step": 2475,
"valid_targets_mean": 3670.0,
"valid_targets_min": 1015
},
{
"epoch": 3.9365079365079367,
"grad_norm": 0.7251725567833401,
"learning_rate": 1.9153313290504495e-05,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14810281991958618,
"step": 2480,
"valid_targets_mean": 3935.0,
"valid_targets_min": 1705
},
{
"epoch": 3.9444444444444446,
"grad_norm": 0.6456264170608652,
"learning_rate": 1.9074237834628623e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12540534138679504,
"step": 2485,
"valid_targets_mean": 3541.1,
"valid_targets_min": 991
},
{
"epoch": 3.9523809523809526,
"grad_norm": 0.8356018356170182,
"learning_rate": 1.8995176879033698e-05,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1368331015110016,
"step": 2490,
"valid_targets_mean": 2445.4,
"valid_targets_min": 762
},
{
"epoch": 3.9603174603174605,
"grad_norm": 0.6288308457322553,
"learning_rate": 1.89161316620573e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14380553364753723,
"step": 2495,
"valid_targets_mean": 4345.1,
"valid_targets_min": 794
},
{
"epoch": 3.9682539682539684,
"grad_norm": 0.6579847446205861,
"learning_rate": 1.8837103421790486e-05,
"loss": 0.2431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07781261205673218,
"step": 2500,
"valid_targets_mean": 2298.8,
"valid_targets_min": 586
},
{
"epoch": 3.9761904761904763,
"grad_norm": 0.7093298174783987,
"learning_rate": 1.8758093396058386e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1043231263756752,
"step": 2505,
"valid_targets_mean": 2240.4,
"valid_targets_min": 1245
},
{
"epoch": 3.984126984126984,
"grad_norm": 0.7566876521088187,
"learning_rate": 1.8679102822400874e-05,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10809953510761261,
"step": 2510,
"valid_targets_mean": 2235.2,
"valid_targets_min": 373
},
{
"epoch": 3.992063492063492,
"grad_norm": 0.6429354432180481,
"learning_rate": 1.8600132938053098e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1338648647069931,
"step": 2515,
"valid_targets_mean": 4055.4,
"valid_targets_min": 858
},
{
"epoch": 4.0,
"grad_norm": 0.7125286840342117,
"learning_rate": 1.8521184979926177e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10315399616956711,
"step": 2520,
"valid_targets_mean": 2988.1,
"valid_targets_min": 1423
},
{
"epoch": 4.007936507936508,
"grad_norm": 0.5876567034131157,
"learning_rate": 1.8442260184587804e-05,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1037619337439537,
"step": 2525,
"valid_targets_mean": 3516.1,
"valid_targets_min": 770
},
{
"epoch": 4.015873015873016,
"grad_norm": 0.6765268923330178,
"learning_rate": 1.8363359788242842e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09999796748161316,
"step": 2530,
"valid_targets_mean": 3009.6,
"valid_targets_min": 1258
},
{
"epoch": 4.023809523809524,
"grad_norm": 0.843564874643514,
"learning_rate": 1.8284485026714013e-05,
"loss": 0.2576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1326655000448227,
"step": 2535,
"valid_targets_mean": 2664.0,
"valid_targets_min": 1373
},
{
"epoch": 4.031746031746032,
"grad_norm": 0.7819775900849527,
"learning_rate": 1.8205637135422525e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12343311309814453,
"step": 2540,
"valid_targets_mean": 2378.2,
"valid_targets_min": 1514
},
{
"epoch": 4.0396825396825395,
"grad_norm": 0.6399638759318811,
"learning_rate": 1.8126817349368697e-05,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12565383315086365,
"step": 2545,
"valid_targets_mean": 4908.5,
"valid_targets_min": 1814
},
{
"epoch": 4.0476190476190474,
"grad_norm": 0.7019507639956757,
"learning_rate": 1.8048026903112632e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13092780113220215,
"step": 2550,
"valid_targets_mean": 3983.9,
"valid_targets_min": 1711
},
{
"epoch": 4.055555555555555,
"grad_norm": 0.6288446075374055,
"learning_rate": 1.7969267030754903e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11063070595264435,
"step": 2555,
"valid_targets_mean": 3873.1,
"valid_targets_min": 1824
},
{
"epoch": 4.063492063492063,
"grad_norm": 0.6811814187899629,
"learning_rate": 1.7890538965917184e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11278326064348221,
"step": 2560,
"valid_targets_mean": 3182.5,
"valid_targets_min": 866
},
{
"epoch": 4.071428571428571,
"grad_norm": 0.7348752847522607,
"learning_rate": 1.7811843941722952e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14403583109378815,
"step": 2565,
"valid_targets_mean": 3754.9,
"valid_targets_min": 1404
},
{
"epoch": 4.079365079365079,
"grad_norm": 0.6911463348956305,
"learning_rate": 1.7733183190778174e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17022690176963806,
"step": 2570,
"valid_targets_mean": 4647.0,
"valid_targets_min": 1430
},
{
"epoch": 4.087301587301587,
"grad_norm": 0.7780248768456252,
"learning_rate": 1.7654557945151968e-05,
"loss": 0.2092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0747632160782814,
"step": 2575,
"valid_targets_mean": 2295.0,
"valid_targets_min": 621
},
{
"epoch": 4.095238095238095,
"grad_norm": 0.6940182721758144,
"learning_rate": 1.7575969436357352e-05,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1094612330198288,
"step": 2580,
"valid_targets_mean": 3678.9,
"valid_targets_min": 881
},
{
"epoch": 4.103174603174603,
"grad_norm": 0.5643874374030184,
"learning_rate": 1.7497418895331934e-05,
"loss": 0.214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10210039466619492,
"step": 2585,
"valid_targets_mean": 4622.6,
"valid_targets_min": 847
},
{
"epoch": 4.111111111111111,
"grad_norm": 0.7297769226717193,
"learning_rate": 1.7418907552418597e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1272350400686264,
"step": 2590,
"valid_targets_mean": 3948.5,
"valid_targets_min": 875
},
{
"epoch": 4.119047619047619,
"grad_norm": 0.8006581395181448,
"learning_rate": 1.7340436637346315e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12104944884777069,
"step": 2595,
"valid_targets_mean": 2991.2,
"valid_targets_min": 1156
},
{
"epoch": 4.1269841269841265,
"grad_norm": 0.6613137801764501,
"learning_rate": 1.726200737921079e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06504228711128235,
"step": 2600,
"valid_targets_mean": 2492.5,
"valid_targets_min": 1140
},
{
"epoch": 4.134920634920635,
"grad_norm": 0.7387136949916735,
"learning_rate": 1.718362100645527e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12065084278583527,
"step": 2605,
"valid_targets_mean": 2898.9,
"valid_targets_min": 655
},
{
"epoch": 4.142857142857143,
"grad_norm": 0.7090937396787783,
"learning_rate": 1.710527874685129e-05,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11025974899530411,
"step": 2610,
"valid_targets_mean": 2430.9,
"valid_targets_min": 1056
},
{
"epoch": 4.150793650793651,
"grad_norm": 0.722190758689241,
"learning_rate": 1.702698182747942e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10215307772159576,
"step": 2615,
"valid_targets_mean": 2964.1,
"valid_targets_min": 778
},
{
"epoch": 4.158730158730159,
"grad_norm": 0.7144776057022394,
"learning_rate": 1.6948731474710075e-05,
"loss": 0.2393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12342202663421631,
"step": 2620,
"valid_targets_mean": 3819.5,
"valid_targets_min": 1317
},
{
"epoch": 4.166666666666667,
"grad_norm": 0.7492914431944917,
"learning_rate": 1.68705289141843e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13639488816261292,
"step": 2625,
"valid_targets_mean": 3750.9,
"valid_targets_min": 1330
},
{
"epoch": 4.174603174603175,
"grad_norm": 0.7401208722013239,
"learning_rate": 1.679237537079454e-05,
"loss": 0.233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440812647342682,
"step": 2630,
"valid_targets_mean": 3458.8,
"valid_targets_min": 1229
},
{
"epoch": 4.182539682539683,
"grad_norm": 0.6025773710893592,
"learning_rate": 1.6714272068665526e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08263147622346878,
"step": 2635,
"valid_targets_mean": 3376.2,
"valid_targets_min": 998
},
{
"epoch": 4.190476190476191,
"grad_norm": 0.596963688362553,
"learning_rate": 1.663622023113501e-05,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09171557426452637,
"step": 2640,
"valid_targets_mean": 4571.8,
"valid_targets_min": 2009
},
{
"epoch": 4.198412698412699,
"grad_norm": 0.7542922003219502,
"learning_rate": 1.655822108073467e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12120301276445389,
"step": 2645,
"valid_targets_mean": 3426.8,
"valid_targets_min": 1327
},
{
"epoch": 4.2063492063492065,
"grad_norm": 0.794127406475235,
"learning_rate": 1.648027583917095e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13536590337753296,
"step": 2650,
"valid_targets_mean": 3598.9,
"valid_targets_min": 1506
},
{
"epoch": 4.214285714285714,
"grad_norm": 0.7449195658686859,
"learning_rate": 1.640238572730591e-05,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10461185872554779,
"step": 2655,
"valid_targets_mean": 3327.4,
"valid_targets_min": 1331
},
{
"epoch": 4.222222222222222,
"grad_norm": 0.6732836280628659,
"learning_rate": 1.632455196513809e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12440332025289536,
"step": 2660,
"valid_targets_mean": 3556.0,
"valid_targets_min": 1127
},
{
"epoch": 4.23015873015873,
"grad_norm": 0.7638215074334139,
"learning_rate": 1.624677577178345e-05,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15293553471565247,
"step": 2665,
"valid_targets_mean": 3222.5,
"valid_targets_min": 1203
},
{
"epoch": 4.238095238095238,
"grad_norm": 0.6453140298046666,
"learning_rate": 1.616905836545624e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11287044733762741,
"step": 2670,
"valid_targets_mean": 4032.5,
"valid_targets_min": 1499
},
{
"epoch": 4.246031746031746,
"grad_norm": 0.9229381005829962,
"learning_rate": 1.6091400963449894e-05,
"loss": 0.2405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18993867933750153,
"step": 2675,
"valid_targets_mean": 3324.4,
"valid_targets_min": 332
},
{
"epoch": 4.253968253968254,
"grad_norm": 0.7863010352864319,
"learning_rate": 1.6013804782118043e-05,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1106230691075325,
"step": 2680,
"valid_targets_mean": 2505.0,
"valid_targets_min": 318
},
{
"epoch": 4.261904761904762,
"grad_norm": 0.7694376524205275,
"learning_rate": 1.5936271036855372e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08633385598659515,
"step": 2685,
"valid_targets_mean": 2414.8,
"valid_targets_min": 622
},
{
"epoch": 4.26984126984127,
"grad_norm": 0.6357694871639326,
"learning_rate": 1.585880094207864e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12916597723960876,
"step": 2690,
"valid_targets_mean": 4749.9,
"valid_targets_min": 702
},
{
"epoch": 4.277777777777778,
"grad_norm": 0.838277956659092,
"learning_rate": 1.5781395711207664e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11889150738716125,
"step": 2695,
"valid_targets_mean": 2379.8,
"valid_targets_min": 647
},
{
"epoch": 4.285714285714286,
"grad_norm": 0.6591004793230493,
"learning_rate": 1.5704056556646255e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10079076886177063,
"step": 2700,
"valid_targets_mean": 3413.8,
"valid_targets_min": 825
},
{
"epoch": 4.2936507936507935,
"grad_norm": 0.6543704431835511,
"learning_rate": 1.562678468976329e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10609576106071472,
"step": 2705,
"valid_targets_mean": 3200.8,
"valid_targets_min": 671
},
{
"epoch": 4.301587301587301,
"grad_norm": 0.7687796568069265,
"learning_rate": 1.5549581320873715e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10676814615726471,
"step": 2710,
"valid_targets_mean": 3095.1,
"valid_targets_min": 767
},
{
"epoch": 4.309523809523809,
"grad_norm": 0.6932002931278404,
"learning_rate": 1.5472447659219573e-05,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13282454013824463,
"step": 2715,
"valid_targets_mean": 3701.2,
"valid_targets_min": 1301
},
{
"epoch": 4.317460317460317,
"grad_norm": 0.5902369291201127,
"learning_rate": 1.5395384912951096e-05,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12770837545394897,
"step": 2720,
"valid_targets_mean": 5372.8,
"valid_targets_min": 1753
},
{
"epoch": 4.325396825396825,
"grad_norm": 0.6748449023035938,
"learning_rate": 1.531839428910774e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.120603047311306,
"step": 2725,
"valid_targets_mean": 3591.1,
"valid_targets_min": 2100
},
{
"epoch": 4.333333333333333,
"grad_norm": 0.5987121324615388,
"learning_rate": 1.5241476993599318e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11681363731622696,
"step": 2730,
"valid_targets_mean": 5095.5,
"valid_targets_min": 1581
},
{
"epoch": 4.341269841269841,
"grad_norm": 0.7159427225817645,
"learning_rate": 1.5164634231187106e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14144907891750336,
"step": 2735,
"valid_targets_mean": 3225.6,
"valid_targets_min": 1473
},
{
"epoch": 4.349206349206349,
"grad_norm": 0.6611954382275911,
"learning_rate": 1.5087867205464933e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09750405699014664,
"step": 2740,
"valid_targets_mean": 3417.1,
"valid_targets_min": 965
},
{
"epoch": 4.357142857142857,
"grad_norm": 0.7263798618780849,
"learning_rate": 1.5011177118840376e-05,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12625962495803833,
"step": 2745,
"valid_targets_mean": 3994.0,
"valid_targets_min": 1406
},
{
"epoch": 4.365079365079365,
"grad_norm": 0.7933122878926689,
"learning_rate": 1.4934565172515917e-05,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0890585258603096,
"step": 2750,
"valid_targets_mean": 2174.6,
"valid_targets_min": 1007
},
{
"epoch": 4.3730158730158735,
"grad_norm": 0.7213075598879185,
"learning_rate": 1.4858032566470107e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17482303082942963,
"step": 2755,
"valid_targets_mean": 5093.8,
"valid_targets_min": 1293
},
{
"epoch": 4.380952380952381,
"grad_norm": 0.8248529406403541,
"learning_rate": 1.4781580499438794e-05,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08823531866073608,
"step": 2760,
"valid_targets_mean": 1934.1,
"valid_targets_min": 916
},
{
"epoch": 4.388888888888889,
"grad_norm": 0.7466423261561578,
"learning_rate": 1.4705210168896327e-05,
"loss": 0.2177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11548350751399994,
"step": 2765,
"valid_targets_mean": 3395.5,
"valid_targets_min": 1282
},
{
"epoch": 4.396825396825397,
"grad_norm": 0.6912935398648323,
"learning_rate": 1.462892277103681e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11666476726531982,
"step": 2770,
"valid_targets_mean": 3372.8,
"valid_targets_min": 1084
},
{
"epoch": 4.404761904761905,
"grad_norm": 0.6849370643438872,
"learning_rate": 1.455271950075539e-05,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09486103057861328,
"step": 2775,
"valid_targets_mean": 2735.1,
"valid_targets_min": 551
},
{
"epoch": 4.412698412698413,
"grad_norm": 0.5989489711073828,
"learning_rate": 1.4476601551629493e-05,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11204937100410461,
"step": 2780,
"valid_targets_mean": 4433.1,
"valid_targets_min": 1363
},
{
"epoch": 4.420634920634921,
"grad_norm": 0.8531974727728336,
"learning_rate": 1.4400570115900147e-05,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1309199035167694,
"step": 2785,
"valid_targets_mean": 3022.9,
"valid_targets_min": 1582
},
{
"epoch": 4.428571428571429,
"grad_norm": 0.7725264862980028,
"learning_rate": 1.4324626384453345e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12786544859409332,
"step": 2790,
"valid_targets_mean": 3201.5,
"valid_targets_min": 1886
},
{
"epoch": 4.436507936507937,
"grad_norm": 1.2348782492609787,
"learning_rate": 1.4248771546801339e-05,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10978405177593231,
"step": 2795,
"valid_targets_mean": 2609.4,
"valid_targets_min": 1227
},
{
"epoch": 4.444444444444445,
"grad_norm": 0.5857767158165396,
"learning_rate": 1.4173006791064023e-05,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11274480074644089,
"step": 2800,
"valid_targets_mean": 4386.8,
"valid_targets_min": 1685
},
{
"epoch": 4.4523809523809526,
"grad_norm": 0.7243806950657568,
"learning_rate": 1.4097333303950368e-05,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13323573768138885,
"step": 2805,
"valid_targets_mean": 3164.4,
"valid_targets_min": 1546
},
{
"epoch": 4.4603174603174605,
"grad_norm": 0.8365899391330908,
"learning_rate": 1.4021752270739759e-05,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17075440287590027,
"step": 2810,
"valid_targets_mean": 3530.6,
"valid_targets_min": 1523
},
{
"epoch": 4.468253968253968,
"grad_norm": 0.6426801032723285,
"learning_rate": 1.3946264875263485e-05,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10363493859767914,
"step": 2815,
"valid_targets_mean": 3605.0,
"valid_targets_min": 1712
},
{
"epoch": 4.476190476190476,
"grad_norm": 0.6890993167954129,
"learning_rate": 1.3870872299886184e-05,
"loss": 0.2361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07421109080314636,
"step": 2820,
"valid_targets_mean": 2241.6,
"valid_targets_min": 1195
},
{
"epoch": 4.484126984126984,
"grad_norm": 0.6729360045725103,
"learning_rate": 1.3795575725487303e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09559076279401779,
"step": 2825,
"valid_targets_mean": 3219.1,
"valid_targets_min": 1489
},
{
"epoch": 4.492063492063492,
"grad_norm": 0.9472374491757762,
"learning_rate": 1.3720376331442652e-05,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12624111771583557,
"step": 2830,
"valid_targets_mean": 1985.1,
"valid_targets_min": 1181
},
{
"epoch": 4.5,
"grad_norm": 0.6423699741233883,
"learning_rate": 1.364527529560586e-05,
"loss": 0.2317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09665095806121826,
"step": 2835,
"valid_targets_mean": 3381.6,
"valid_targets_min": 1302
},
{
"epoch": 4.507936507936508,
"grad_norm": 0.8434624170792736,
"learning_rate": 1.3570273794289978e-05,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11487355828285217,
"step": 2840,
"valid_targets_mean": 2106.1,
"valid_targets_min": 1085
},
{
"epoch": 4.515873015873016,
"grad_norm": 0.8176335490386788,
"learning_rate": 1.3495373002249061e-05,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11494874209165573,
"step": 2845,
"valid_targets_mean": 2774.2,
"valid_targets_min": 941
},
{
"epoch": 4.523809523809524,
"grad_norm": 0.7509641841477122,
"learning_rate": 1.3420574092659713e-05,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0945759192109108,
"step": 2850,
"valid_targets_mean": 2959.2,
"valid_targets_min": 1038
},
{
"epoch": 4.531746031746032,
"grad_norm": 0.7303411502442227,
"learning_rate": 1.3345878237102766e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12984412908554077,
"step": 2855,
"valid_targets_mean": 3543.2,
"valid_targets_min": 1360
},
{
"epoch": 4.5396825396825395,
"grad_norm": 0.7135801927779284,
"learning_rate": 1.3271286605544906e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1369558870792389,
"step": 2860,
"valid_targets_mean": 4178.8,
"valid_targets_min": 1205
},
{
"epoch": 4.5476190476190474,
"grad_norm": 0.8002438173525717,
"learning_rate": 1.3196800366320357e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13606247305870056,
"step": 2865,
"valid_targets_mean": 3268.6,
"valid_targets_min": 961
},
{
"epoch": 4.555555555555555,
"grad_norm": 0.7255775013934033,
"learning_rate": 1.3122420686112554e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09334878623485565,
"step": 2870,
"valid_targets_mean": 2750.4,
"valid_targets_min": 906
},
{
"epoch": 4.563492063492063,
"grad_norm": 0.7155396542120448,
"learning_rate": 1.3048148729935917e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12097464501857758,
"step": 2875,
"valid_targets_mean": 3632.4,
"valid_targets_min": 1730
},
{
"epoch": 4.571428571428571,
"grad_norm": 1.8092713084981278,
"learning_rate": 1.297398566111756e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11287643015384674,
"step": 2880,
"valid_targets_mean": 3300.0,
"valid_targets_min": 1120
},
{
"epoch": 4.579365079365079,
"grad_norm": 0.7654711485267467,
"learning_rate": 1.2899932641279082e-05,
"loss": 0.2272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11186093091964722,
"step": 2885,
"valid_targets_mean": 2760.4,
"valid_targets_min": 858
},
{
"epoch": 4.587301587301587,
"grad_norm": 0.774643668364101,
"learning_rate": 1.2825990830318395e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09278203547000885,
"step": 2890,
"valid_targets_mean": 2548.6,
"valid_targets_min": 936
},
{
"epoch": 4.595238095238095,
"grad_norm": 0.8001318452509485,
"learning_rate": 1.2752161386391526e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10767956078052521,
"step": 2895,
"valid_targets_mean": 2060.4,
"valid_targets_min": 858
},
{
"epoch": 4.603174603174603,
"grad_norm": 0.5712255444569291,
"learning_rate": 1.2678445465894491e-05,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10319489985704422,
"step": 2900,
"valid_targets_mean": 4445.1,
"valid_targets_min": 2055
},
{
"epoch": 4.611111111111111,
"grad_norm": 0.6135689736493125,
"learning_rate": 1.2604844223445181e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07687068730592728,
"step": 2905,
"valid_targets_mean": 2514.1,
"valid_targets_min": 886
},
{
"epoch": 4.619047619047619,
"grad_norm": 0.6579258264976859,
"learning_rate": 1.2531358811865268e-05,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11658872663974762,
"step": 2910,
"valid_targets_mean": 3789.9,
"valid_targets_min": 1324
},
{
"epoch": 4.6269841269841265,
"grad_norm": 0.6444665058651138,
"learning_rate": 1.2457990382162173e-05,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12281468510627747,
"step": 2915,
"valid_targets_mean": 4370.9,
"valid_targets_min": 1616
},
{
"epoch": 4.634920634920634,
"grad_norm": 0.6876035515078412,
"learning_rate": 1.238474008351101e-05,
"loss": 0.2213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09872429817914963,
"step": 2920,
"valid_targets_mean": 3054.0,
"valid_targets_min": 1126
},
{
"epoch": 4.642857142857143,
"grad_norm": 0.6931951314781377,
"learning_rate": 1.2311609063236594e-05,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10577560216188431,
"step": 2925,
"valid_targets_mean": 3132.2,
"valid_targets_min": 838
},
{
"epoch": 4.650793650793651,
"grad_norm": 0.6819762221919383,
"learning_rate": 1.2238598466795493e-05,
"loss": 0.2143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11494247615337372,
"step": 2930,
"valid_targets_mean": 3767.6,
"valid_targets_min": 1581
},
{
"epoch": 4.658730158730159,
"grad_norm": 0.5497909587102477,
"learning_rate": 1.2165709437758042e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1371319591999054,
"step": 2935,
"valid_targets_mean": 4767.9,
"valid_targets_min": 2053
},
{
"epoch": 4.666666666666667,
"grad_norm": 0.7497286458898537,
"learning_rate": 1.209294311779047e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10149647295475006,
"step": 2940,
"valid_targets_mean": 2748.5,
"valid_targets_min": 956
},
{
"epoch": 4.674603174603175,
"grad_norm": 0.794199842888716,
"learning_rate": 1.2020300646637018e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12010520696640015,
"step": 2945,
"valid_targets_mean": 2594.0,
"valid_targets_min": 1049
},
{
"epoch": 4.682539682539683,
"grad_norm": 0.6156502044065189,
"learning_rate": 1.1947783162102043e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0953923910856247,
"step": 2950,
"valid_targets_mean": 3468.9,
"valid_targets_min": 1599
},
{
"epoch": 4.690476190476191,
"grad_norm": 0.7560140620960419,
"learning_rate": 1.1875391800032248e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14818307757377625,
"step": 2955,
"valid_targets_mean": 3391.6,
"valid_targets_min": 1426
},
{
"epoch": 4.698412698412699,
"grad_norm": 0.6675396719960957,
"learning_rate": 1.1803127694298873e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10536058992147446,
"step": 2960,
"valid_targets_mean": 3879.0,
"valid_targets_min": 1464
},
{
"epoch": 4.7063492063492065,
"grad_norm": 0.7216255033546128,
"learning_rate": 1.173099197677992e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09683910012245178,
"step": 2965,
"valid_targets_mean": 3976.0,
"valid_targets_min": 876
},
{
"epoch": 4.714285714285714,
"grad_norm": 0.6299655661341759,
"learning_rate": 1.1658985777342458e-05,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10072541236877441,
"step": 2970,
"valid_targets_mean": 4138.9,
"valid_targets_min": 2165
},
{
"epoch": 4.722222222222222,
"grad_norm": 0.7267114286430387,
"learning_rate": 1.1587110223824874e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11458795517683029,
"step": 2975,
"valid_targets_mean": 3501.6,
"valid_targets_min": 1048
},
{
"epoch": 4.73015873015873,
"grad_norm": 0.5711880649526813,
"learning_rate": 1.151536644201925e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10362765938043594,
"step": 2980,
"valid_targets_mean": 5068.5,
"valid_targets_min": 374
},
{
"epoch": 4.738095238095238,
"grad_norm": 0.6837744972295653,
"learning_rate": 1.1443755555653751e-05,
"loss": 0.2115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11046740412712097,
"step": 2985,
"valid_targets_mean": 3774.5,
"valid_targets_min": 1516
},
{
"epoch": 4.746031746031746,
"grad_norm": 0.8268088262430978,
"learning_rate": 1.1372278686374935e-05,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11939245462417603,
"step": 2990,
"valid_targets_mean": 2241.9,
"valid_targets_min": 844
},
{
"epoch": 4.753968253968254,
"grad_norm": 0.7080274610839087,
"learning_rate": 1.1300936953730273e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07471520453691483,
"step": 2995,
"valid_targets_mean": 2855.1,
"valid_targets_min": 1028
},
{
"epoch": 4.761904761904762,
"grad_norm": 0.6346454470756567,
"learning_rate": 1.1229731475150594e-05,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09645067900419235,
"step": 3000,
"valid_targets_mean": 3225.0,
"valid_targets_min": 1558
},
{
"epoch": 4.76984126984127,
"grad_norm": 0.8159716611544979,
"learning_rate": 1.1158663365932529e-05,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16088628768920898,
"step": 3005,
"valid_targets_mean": 3942.8,
"valid_targets_min": 811
},
{
"epoch": 4.777777777777778,
"grad_norm": 0.7485963907590999,
"learning_rate": 1.1087733739221109e-05,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07297512143850327,
"step": 3010,
"valid_targets_mean": 2137.1,
"valid_targets_min": 1215
},
{
"epoch": 4.785714285714286,
"grad_norm": 0.6959060383565719,
"learning_rate": 1.1016943705992311e-05,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14023664593696594,
"step": 3015,
"valid_targets_mean": 4470.1,
"valid_targets_min": 1215
},
{
"epoch": 4.7936507936507935,
"grad_norm": 0.8209624595660114,
"learning_rate": 1.0946294375035639e-05,
"loss": 0.2205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10550207644701004,
"step": 3020,
"valid_targets_mean": 2292.6,
"valid_targets_min": 285
},
{
"epoch": 4.801587301587301,
"grad_norm": 0.8467111860371475,
"learning_rate": 1.087578685293674e-05,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1101028323173523,
"step": 3025,
"valid_targets_mean": 2002.0,
"valid_targets_min": 963
},
{
"epoch": 4.809523809523809,
"grad_norm": 0.7031175355751162,
"learning_rate": 1.080542224406015e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08865861594676971,
"step": 3030,
"valid_targets_mean": 2722.9,
"valid_targets_min": 1096
},
{
"epoch": 4.817460317460317,
"grad_norm": 0.6340433410827726,
"learning_rate": 1.0735201650531915e-05,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08490338921546936,
"step": 3035,
"valid_targets_mean": 3582.5,
"valid_targets_min": 1662
},
{
"epoch": 4.825396825396825,
"grad_norm": 0.8779889239691778,
"learning_rate": 1.066512617222235e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1368151307106018,
"step": 3040,
"valid_targets_mean": 2917.8,
"valid_targets_min": 645
},
{
"epoch": 4.833333333333333,
"grad_norm": 0.8148128948217418,
"learning_rate": 1.059519690672884e-05,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1347075253725052,
"step": 3045,
"valid_targets_mean": 3162.8,
"valid_targets_min": 1554
},
{
"epoch": 4.841269841269841,
"grad_norm": 0.7163970373680205,
"learning_rate": 1.0525414949358614e-05,
"loss": 0.2257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12431874126195908,
"step": 3050,
"valid_targets_mean": 4172.5,
"valid_targets_min": 1986
},
{
"epoch": 4.849206349206349,
"grad_norm": 0.7360036176983142,
"learning_rate": 1.0455781393111613e-05,
"loss": 0.2361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15029457211494446,
"step": 3055,
"valid_targets_mean": 4648.4,
"valid_targets_min": 1219
},
{
"epoch": 4.857142857142857,
"grad_norm": 0.7198933951477575,
"learning_rate": 1.0386297328663353e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11901850998401642,
"step": 3060,
"valid_targets_mean": 3197.0,
"valid_targets_min": 2097
},
{
"epoch": 4.865079365079366,
"grad_norm": 0.7591758487987466,
"learning_rate": 1.0316963844347843e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16917167603969574,
"step": 3065,
"valid_targets_mean": 3458.1,
"valid_targets_min": 1407
},
{
"epoch": 4.8730158730158735,
"grad_norm": 0.6661543635742453,
"learning_rate": 1.0247782026140576e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1022878885269165,
"step": 3070,
"valid_targets_mean": 2875.9,
"valid_targets_min": 1623
},
{
"epoch": 4.880952380952381,
"grad_norm": 0.8652472888174663,
"learning_rate": 1.017875295764144e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1259920448064804,
"step": 3075,
"valid_targets_mean": 2689.5,
"valid_targets_min": 724
},
{
"epoch": 4.888888888888889,
"grad_norm": 0.7850884128960549,
"learning_rate": 1.0109877720057818e-05,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09217704832553864,
"step": 3080,
"valid_targets_mean": 2314.9,
"valid_targets_min": 1135
},
{
"epoch": 4.896825396825397,
"grad_norm": 0.7008626159310546,
"learning_rate": 1.0041157392187651e-05,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09693759679794312,
"step": 3085,
"valid_targets_mean": 2638.2,
"valid_targets_min": 1401
},
{
"epoch": 4.904761904761905,
"grad_norm": 0.8580160012430362,
"learning_rate": 9.972593050402471e-06,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11387155950069427,
"step": 3090,
"valid_targets_mean": 1859.2,
"valid_targets_min": 845
},
{
"epoch": 4.912698412698413,
"grad_norm": 0.6468446443099518,
"learning_rate": 9.904185768630612e-06,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15160252153873444,
"step": 3095,
"valid_targets_mean": 5390.9,
"valid_targets_min": 1587
},
{
"epoch": 4.920634920634921,
"grad_norm": 0.5684268979378351,
"learning_rate": 9.835936618340377e-06,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13138213753700256,
"step": 3100,
"valid_targets_mean": 4122.5,
"valid_targets_min": 567
},
{
"epoch": 4.928571428571429,
"grad_norm": 0.7131733546217154,
"learning_rate": 9.76784666852323e-06,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06886936724185944,
"step": 3105,
"valid_targets_mean": 1896.1,
"valid_targets_min": 1242
},
{
"epoch": 4.936507936507937,
"grad_norm": 0.8263911818151064,
"learning_rate": 9.699916985677062e-06,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13891655206680298,
"step": 3110,
"valid_targets_mean": 3128.5,
"valid_targets_min": 1302
},
{
"epoch": 4.944444444444445,
"grad_norm": 0.678512236825066,
"learning_rate": 9.6321486337895e-06,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10146833956241608,
"step": 3115,
"valid_targets_mean": 3825.9,
"valid_targets_min": 1227
},
{
"epoch": 4.9523809523809526,
"grad_norm": 0.6938061243394774,
"learning_rate": 9.564542674321228e-06,
"loss": 0.2205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11534064263105392,
"step": 3120,
"valid_targets_mean": 3539.6,
"valid_targets_min": 1226
},
{
"epoch": 4.9603174603174605,
"grad_norm": 0.6496250853188159,
"learning_rate": 9.49710016618937e-06,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13002172112464905,
"step": 3125,
"valid_targets_mean": 3752.9,
"valid_targets_min": 819
},
{
"epoch": 4.968253968253968,
"grad_norm": 0.731846216839573,
"learning_rate": 9.429822165750893e-06,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1303645372390747,
"step": 3130,
"valid_targets_mean": 3501.1,
"valid_targets_min": 1453
},
{
"epoch": 4.976190476190476,
"grad_norm": 0.7302474135173942,
"learning_rate": 9.36270972678607e-06,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12065795063972473,
"step": 3135,
"valid_targets_mean": 3030.6,
"valid_targets_min": 1525
},
{
"epoch": 4.984126984126984,
"grad_norm": 0.8382447486874602,
"learning_rate": 9.295763900481977e-06,
"loss": 0.23,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08970605581998825,
"step": 3140,
"valid_targets_mean": 2422.5,
"valid_targets_min": 898
},
{
"epoch": 4.992063492063492,
"grad_norm": 0.6946408347465951,
"learning_rate": 9.22898573541602e-06,
"loss": 0.2342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10561580210924149,
"step": 3145,
"valid_targets_mean": 3991.8,
"valid_targets_min": 963
},
{
"epoch": 5.0,
"grad_norm": 0.7898033128472092,
"learning_rate": 9.162376277539513e-06,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11227846145629883,
"step": 3150,
"valid_targets_mean": 2750.9,
"valid_targets_min": 677
},
{
"epoch": 5.007936507936508,
"grad_norm": 0.7146420475983313,
"learning_rate": 9.095936570161301e-06,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12624788284301758,
"step": 3155,
"valid_targets_mean": 3846.4,
"valid_targets_min": 1350
},
{
"epoch": 5.015873015873016,
"grad_norm": 0.6517411197054727,
"learning_rate": 9.029667653931411e-06,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06766072660684586,
"step": 3160,
"valid_targets_mean": 3087.6,
"valid_targets_min": 942
},
{
"epoch": 5.023809523809524,
"grad_norm": 0.8345596778348867,
"learning_rate": 8.96357056682475e-06,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10621356964111328,
"step": 3165,
"valid_targets_mean": 2631.9,
"valid_targets_min": 907
},
{
"epoch": 5.031746031746032,
"grad_norm": 0.8085550022852781,
"learning_rate": 8.897646344124882e-06,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12722842395305634,
"step": 3170,
"valid_targets_mean": 3126.6,
"valid_targets_min": 1496
},
{
"epoch": 5.0396825396825395,
"grad_norm": 0.6859939671973228,
"learning_rate": 8.83189601840773e-06,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08324988931417465,
"step": 3175,
"valid_targets_mean": 2954.6,
"valid_targets_min": 615
},
{
"epoch": 5.0476190476190474,
"grad_norm": 0.6329422503933559,
"learning_rate": 8.766320619525511e-06,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11945187300443649,
"step": 3180,
"valid_targets_mean": 4450.5,
"valid_targets_min": 1558
},
{
"epoch": 5.055555555555555,
"grad_norm": 0.8029282832348713,
"learning_rate": 8.700921174590525e-06,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10649940371513367,
"step": 3185,
"valid_targets_mean": 2527.2,
"valid_targets_min": 1120
},
{
"epoch": 5.063492063492063,
"grad_norm": 0.6560077390622969,
"learning_rate": 8.63569870795907e-06,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12603171169757843,
"step": 3190,
"valid_targets_mean": 5060.4,
"valid_targets_min": 1244
},
{
"epoch": 5.071428571428571,
"grad_norm": 0.7218401202124031,
"learning_rate": 8.570654241215466e-06,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11767058074474335,
"step": 3195,
"valid_targets_mean": 3966.0,
"valid_targets_min": 2226
},
{
"epoch": 5.079365079365079,
"grad_norm": 0.8081789481249295,
"learning_rate": 8.505788793155978e-06,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08667795360088348,
"step": 3200,
"valid_targets_mean": 2434.5,
"valid_targets_min": 1440
},
{
"epoch": 5.087301587301587,
"grad_norm": 0.7458764582812119,
"learning_rate": 8.441103379772893e-06,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09307099878787994,
"step": 3205,
"valid_targets_mean": 3196.9,
"valid_targets_min": 1336
},
{
"epoch": 5.095238095238095,
"grad_norm": 0.6048773964520159,
"learning_rate": 8.376599014238605e-06,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08689746260643005,
"step": 3210,
"valid_targets_mean": 3691.8,
"valid_targets_min": 810
},
{
"epoch": 5.103174603174603,
"grad_norm": 0.7088750227894017,
"learning_rate": 8.312276706889738e-06,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11118713021278381,
"step": 3215,
"valid_targets_mean": 3710.4,
"valid_targets_min": 1442
},
{
"epoch": 5.111111111111111,
"grad_norm": 0.7875888873370555,
"learning_rate": 8.24813746521133e-06,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10653230547904968,
"step": 3220,
"valid_targets_mean": 2371.4,
"valid_targets_min": 1474
},
{
"epoch": 5.119047619047619,
"grad_norm": 0.6271107098202612,
"learning_rate": 8.184182293821046e-06,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09181641787290573,
"step": 3225,
"valid_targets_mean": 3844.1,
"valid_targets_min": 1192
},
{
"epoch": 5.1269841269841265,
"grad_norm": 0.7729536882848088,
"learning_rate": 8.120412194453442e-06,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13168609142303467,
"step": 3230,
"valid_targets_mean": 3441.9,
"valid_targets_min": 971
},
{
"epoch": 5.134920634920635,
"grad_norm": 0.7684229615937804,
"learning_rate": 8.056828165944282e-06,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09150117635726929,
"step": 3235,
"valid_targets_mean": 2375.8,
"valid_targets_min": 973
},
{
"epoch": 5.142857142857143,
"grad_norm": 0.7878065076580593,
"learning_rate": 7.993431204214883e-06,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1006222665309906,
"step": 3240,
"valid_targets_mean": 2976.8,
"valid_targets_min": 877
},
{
"epoch": 5.150793650793651,
"grad_norm": 0.7479238006778793,
"learning_rate": 7.93022230225652e-06,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12401343137025833,
"step": 3245,
"valid_targets_mean": 3254.5,
"valid_targets_min": 1008
},
{
"epoch": 5.158730158730159,
"grad_norm": 0.702402201184209,
"learning_rate": 7.867202450114892e-06,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09244085103273392,
"step": 3250,
"valid_targets_mean": 3044.9,
"valid_targets_min": 1271
},
{
"epoch": 5.166666666666667,
"grad_norm": 0.6904073371631958,
"learning_rate": 7.804372634874582e-06,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11687523871660233,
"step": 3255,
"valid_targets_mean": 4131.0,
"valid_targets_min": 1638
},
{
"epoch": 5.174603174603175,
"grad_norm": 0.794713029359026,
"learning_rate": 7.74173384064359e-06,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10450978577136993,
"step": 3260,
"valid_targets_mean": 3100.6,
"valid_targets_min": 1159
},
{
"epoch": 5.182539682539683,
"grad_norm": 0.7899895590351436,
"learning_rate": 7.679287048537987e-06,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12722371518611908,
"step": 3265,
"valid_targets_mean": 3208.2,
"valid_targets_min": 1358
},
{
"epoch": 5.190476190476191,
"grad_norm": 0.6296178163629895,
"learning_rate": 7.617033236666469e-06,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07929957658052444,
"step": 3270,
"valid_targets_mean": 3253.1,
"valid_targets_min": 1086
},
{
"epoch": 5.198412698412699,
"grad_norm": 0.772550287330192,
"learning_rate": 7.55497338011506e-06,
"loss": 0.2169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12237787246704102,
"step": 3275,
"valid_targets_mean": 3851.5,
"valid_targets_min": 1990
},
{
"epoch": 5.2063492063492065,
"grad_norm": 0.6767191861039769,
"learning_rate": 7.493108450931879e-06,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10229524970054626,
"step": 3280,
"valid_targets_mean": 4133.1,
"valid_targets_min": 821
},
{
"epoch": 5.214285714285714,
"grad_norm": 0.720480770224619,
"learning_rate": 7.4314394181118636e-06,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11554890125989914,
"step": 3285,
"valid_targets_mean": 4656.8,
"valid_targets_min": 1672
},
{
"epoch": 5.222222222222222,
"grad_norm": 0.726519804219711,
"learning_rate": 7.369967247581611e-06,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1208588257431984,
"step": 3290,
"valid_targets_mean": 3772.8,
"valid_targets_min": 1731
},
{
"epoch": 5.23015873015873,
"grad_norm": 0.7321877521486466,
"learning_rate": 7.3086929021842575e-06,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1158241480588913,
"step": 3295,
"valid_targets_mean": 4226.0,
"valid_targets_min": 1607
},
{
"epoch": 5.238095238095238,
"grad_norm": 0.7393559355923631,
"learning_rate": 7.247617341664384e-06,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13511210680007935,
"step": 3300,
"valid_targets_mean": 4740.5,
"valid_targets_min": 1710
},
{
"epoch": 5.246031746031746,
"grad_norm": 0.793371294614497,
"learning_rate": 7.186741522652994e-06,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0859147161245346,
"step": 3305,
"valid_targets_mean": 2580.8,
"valid_targets_min": 874
},
{
"epoch": 5.253968253968254,
"grad_norm": 0.8066319717320056,
"learning_rate": 7.12606639865252e-06,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.172830730676651,
"step": 3310,
"valid_targets_mean": 3399.0,
"valid_targets_min": 1479
},
{
"epoch": 5.261904761904762,
"grad_norm": 0.8161505028774265,
"learning_rate": 7.065592920021893e-06,
"loss": 0.2153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12437000870704651,
"step": 3315,
"valid_targets_mean": 2944.4,
"valid_targets_min": 285
},
{
"epoch": 5.26984126984127,
"grad_norm": 0.6723134626596974,
"learning_rate": 7.005322033961679e-06,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09198858588933945,
"step": 3320,
"valid_targets_mean": 3883.2,
"valid_targets_min": 1115
},
{
"epoch": 5.277777777777778,
"grad_norm": 0.6815222171306629,
"learning_rate": 6.945254684499185e-06,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08335371315479279,
"step": 3325,
"valid_targets_mean": 3160.1,
"valid_targets_min": 1536
},
{
"epoch": 5.285714285714286,
"grad_norm": 0.9098274401850043,
"learning_rate": 6.8853918124737274e-06,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1184665709733963,
"step": 3330,
"valid_targets_mean": 2596.0,
"valid_targets_min": 1315
},
{
"epoch": 5.2936507936507935,
"grad_norm": 0.6857614007500089,
"learning_rate": 6.825734355521898e-06,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1017097607254982,
"step": 3335,
"valid_targets_mean": 4198.5,
"valid_targets_min": 1562
},
{
"epoch": 5.301587301587301,
"grad_norm": 0.8272058345129579,
"learning_rate": 6.766283248062817e-06,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08390039950609207,
"step": 3340,
"valid_targets_mean": 2267.4,
"valid_targets_min": 1306
},
{
"epoch": 5.309523809523809,
"grad_norm": 0.8083062386180365,
"learning_rate": 6.707039421283559e-06,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0976867526769638,
"step": 3345,
"valid_targets_mean": 2621.0,
"valid_targets_min": 673
},
{
"epoch": 5.317460317460317,
"grad_norm": 0.7907657672139157,
"learning_rate": 6.648003803124559e-06,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06761344522237778,
"step": 3350,
"valid_targets_mean": 2349.9,
"valid_targets_min": 1323
},
{
"epoch": 5.325396825396825,
"grad_norm": 0.8295765502920541,
"learning_rate": 6.589177318265047e-06,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08894240111112595,
"step": 3355,
"valid_targets_mean": 3019.9,
"valid_targets_min": 1086
},
{
"epoch": 5.333333333333333,
"grad_norm": 0.7155977892403146,
"learning_rate": 6.53056088810857e-06,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08744360506534576,
"step": 3360,
"valid_targets_mean": 3405.6,
"valid_targets_min": 1690
},
{
"epoch": 5.341269841269841,
"grad_norm": 0.7623686882341104,
"learning_rate": 6.472155430768608e-06,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.096970334649086,
"step": 3365,
"valid_targets_mean": 3433.9,
"valid_targets_min": 1287
},
{
"epoch": 5.349206349206349,
"grad_norm": 0.6991086887361436,
"learning_rate": 6.413961861054132e-06,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09134359657764435,
"step": 3370,
"valid_targets_mean": 3337.8,
"valid_targets_min": 778
},
{
"epoch": 5.357142857142857,
"grad_norm": 0.7184355046680967,
"learning_rate": 6.3559810904553095e-06,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09643669426441193,
"step": 3375,
"valid_targets_mean": 3267.6,
"valid_targets_min": 1005
},
{
"epoch": 5.365079365079365,
"grad_norm": 0.7691159521423506,
"learning_rate": 6.298214027129219e-06,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08167582750320435,
"step": 3380,
"valid_targets_mean": 3071.9,
"valid_targets_min": 2067
},
{
"epoch": 5.3730158730158735,
"grad_norm": 0.7232492216728219,
"learning_rate": 6.240661575885629e-06,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09442508220672607,
"step": 3385,
"valid_targets_mean": 3521.1,
"valid_targets_min": 1072
},
{
"epoch": 5.380952380952381,
"grad_norm": 0.7830495336781548,
"learning_rate": 6.183324638172819e-06,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10402445495128632,
"step": 3390,
"valid_targets_mean": 2552.1,
"valid_targets_min": 744
},
{
"epoch": 5.388888888888889,
"grad_norm": 0.729818898985151,
"learning_rate": 6.126204112063463e-06,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1520620882511139,
"step": 3395,
"valid_targets_mean": 4477.5,
"valid_targets_min": 1029
},
{
"epoch": 5.396825396825397,
"grad_norm": 0.6920667559511638,
"learning_rate": 6.069300892240564e-06,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09078704565763474,
"step": 3400,
"valid_targets_mean": 3087.2,
"valid_targets_min": 1270
},
{
"epoch": 5.404761904761905,
"grad_norm": 0.7781077186783485,
"learning_rate": 6.0126158699834625e-06,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10325247049331665,
"step": 3405,
"valid_targets_mean": 3032.1,
"valid_targets_min": 1200
},
{
"epoch": 5.412698412698413,
"grad_norm": 0.7663501738172225,
"learning_rate": 5.956149933153816e-06,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07357954978942871,
"step": 3410,
"valid_targets_mean": 2068.0,
"valid_targets_min": 721
},
{
"epoch": 5.420634920634921,
"grad_norm": 0.7027131190487993,
"learning_rate": 5.899903966181751e-06,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10673792660236359,
"step": 3415,
"valid_targets_mean": 3083.1,
"valid_targets_min": 1552
},
{
"epoch": 5.428571428571429,
"grad_norm": 0.6911729334824366,
"learning_rate": 5.843878850052007e-06,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09318830817937851,
"step": 3420,
"valid_targets_mean": 3576.4,
"valid_targets_min": 1720
},
{
"epoch": 5.436507936507937,
"grad_norm": 0.7317882758484224,
"learning_rate": 5.788075462290084e-06,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0958942249417305,
"step": 3425,
"valid_targets_mean": 2726.6,
"valid_targets_min": 1096
},
{
"epoch": 5.444444444444445,
"grad_norm": 0.7898992040430142,
"learning_rate": 5.732494676948554e-06,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1019308939576149,
"step": 3430,
"valid_targets_mean": 3273.1,
"valid_targets_min": 1297
},
{
"epoch": 5.4523809523809526,
"grad_norm": 0.6476619928289603,
"learning_rate": 5.677137364593363e-06,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1071840450167656,
"step": 3435,
"valid_targets_mean": 4286.2,
"valid_targets_min": 1373
},
{
"epoch": 5.4603174603174605,
"grad_norm": 0.8557484260093969,
"learning_rate": 5.622004392290163e-06,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12339898943901062,
"step": 3440,
"valid_targets_mean": 2923.4,
"valid_targets_min": 1672
},
{
"epoch": 5.468253968253968,
"grad_norm": 0.7015615872264492,
"learning_rate": 5.567096623590758e-06,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09825904667377472,
"step": 3445,
"valid_targets_mean": 3929.8,
"valid_targets_min": 738
},
{
"epoch": 5.476190476190476,
"grad_norm": 0.8655562264421257,
"learning_rate": 5.512414918519573e-06,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1307569444179535,
"step": 3450,
"valid_targets_mean": 3211.2,
"valid_targets_min": 1356
},
{
"epoch": 5.484126984126984,
"grad_norm": 0.8890725294031256,
"learning_rate": 5.457960133560179e-06,
"loss": 0.2172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0857107937335968,
"step": 3455,
"valid_targets_mean": 1887.0,
"valid_targets_min": 823
},
{
"epoch": 5.492063492063492,
"grad_norm": 0.7014404433696352,
"learning_rate": 5.403733121641883e-06,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0767240822315216,
"step": 3460,
"valid_targets_mean": 3447.1,
"valid_targets_min": 833
},
{
"epoch": 5.5,
"grad_norm": 0.7077085117048115,
"learning_rate": 5.349734732126366e-06,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1149144172668457,
"step": 3465,
"valid_targets_mean": 3409.2,
"valid_targets_min": 810
},
{
"epoch": 5.507936507936508,
"grad_norm": 0.6964990148226815,
"learning_rate": 5.295965810794376e-06,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12690629065036774,
"step": 3470,
"valid_targets_mean": 4805.8,
"valid_targets_min": 1606
},
{
"epoch": 5.515873015873016,
"grad_norm": 0.71008503903071,
"learning_rate": 5.2424271998324895e-06,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1080438420176506,
"step": 3475,
"valid_targets_mean": 3492.4,
"valid_targets_min": 1643
},
{
"epoch": 5.523809523809524,
"grad_norm": 0.7353298420126876,
"learning_rate": 5.189119737819912e-06,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11497688293457031,
"step": 3480,
"valid_targets_mean": 3634.8,
"valid_targets_min": 969
},
{
"epoch": 5.531746031746032,
"grad_norm": 0.8109076591558645,
"learning_rate": 5.136044259715342e-06,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15082211792469025,
"step": 3485,
"valid_targets_mean": 3544.9,
"valid_targets_min": 1127
},
{
"epoch": 5.5396825396825395,
"grad_norm": 0.7922885526246444,
"learning_rate": 5.083201596843905e-06,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10521303117275238,
"step": 3490,
"valid_targets_mean": 4138.5,
"valid_targets_min": 1128
},
{
"epoch": 5.5476190476190474,
"grad_norm": 0.8243700889289516,
"learning_rate": 5.030592576884117e-06,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07981052994728088,
"step": 3495,
"valid_targets_mean": 2294.5,
"valid_targets_min": 1025
},
{
"epoch": 5.555555555555555,
"grad_norm": 0.6042313383840995,
"learning_rate": 4.978218023854928e-06,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08307897299528122,
"step": 3500,
"valid_targets_mean": 3926.1,
"valid_targets_min": 873
},
{
"epoch": 5.563492063492063,
"grad_norm": 0.7790070861867432,
"learning_rate": 4.926078758102834e-06,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11292654275894165,
"step": 3505,
"valid_targets_mean": 3235.6,
"valid_targets_min": 1610
},
{
"epoch": 5.571428571428571,
"grad_norm": 0.7080847761324837,
"learning_rate": 4.87417559628897e-06,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1172761619091034,
"step": 3510,
"valid_targets_mean": 3966.9,
"valid_targets_min": 1625
},
{
"epoch": 5.579365079365079,
"grad_norm": 0.7463489141334009,
"learning_rate": 4.822509351376399e-06,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12706415355205536,
"step": 3515,
"valid_targets_mean": 3811.5,
"valid_targets_min": 2163
},
{
"epoch": 5.587301587301587,
"grad_norm": 0.7519098028952099,
"learning_rate": 4.7710808326173115e-06,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1024027168750763,
"step": 3520,
"valid_targets_mean": 3474.1,
"valid_targets_min": 1022
},
{
"epoch": 5.595238095238095,
"grad_norm": 0.7086990550463645,
"learning_rate": 4.719890845540385e-06,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10318700969219208,
"step": 3525,
"valid_targets_mean": 3613.8,
"valid_targets_min": 700
},
{
"epoch": 5.603174603174603,
"grad_norm": 0.7506770758799025,
"learning_rate": 4.668940191938156e-06,
"loss": 0.2159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0782381072640419,
"step": 3530,
"valid_targets_mean": 2510.2,
"valid_targets_min": 762
},
{
"epoch": 5.611111111111111,
"grad_norm": 0.696777680063598,
"learning_rate": 4.618229669854464e-06,
"loss": 0.2083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08006583154201508,
"step": 3535,
"valid_targets_mean": 3453.9,
"valid_targets_min": 1159
},
{
"epoch": 5.619047619047619,
"grad_norm": 0.922756787599331,
"learning_rate": 4.567760073571947e-06,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12967818975448608,
"step": 3540,
"valid_targets_mean": 4102.4,
"valid_targets_min": 1504
},
{
"epoch": 5.6269841269841265,
"grad_norm": 0.7078421783660265,
"learning_rate": 4.51753219359961e-06,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09606287628412247,
"step": 3545,
"valid_targets_mean": 3108.1,
"valid_targets_min": 959
},
{
"epoch": 5.634920634920634,
"grad_norm": 0.7506430958719362,
"learning_rate": 4.467546816660433e-06,
"loss": 0.2061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09307855367660522,
"step": 3550,
"valid_targets_mean": 2918.5,
"valid_targets_min": 1428
},
{
"epoch": 5.642857142857143,
"grad_norm": 0.9094911858240387,
"learning_rate": 4.417804725679058e-06,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13038109242916107,
"step": 3555,
"valid_targets_mean": 2835.5,
"valid_targets_min": 1029
},
{
"epoch": 5.650793650793651,
"grad_norm": 0.9032674979239957,
"learning_rate": 4.368306699769518e-06,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13430385291576385,
"step": 3560,
"valid_targets_mean": 3887.0,
"valid_targets_min": 338
},
{
"epoch": 5.658730158730159,
"grad_norm": 0.7586381935839076,
"learning_rate": 4.319053514223033e-06,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08391046524047852,
"step": 3565,
"valid_targets_mean": 3104.5,
"valid_targets_min": 1432
},
{
"epoch": 5.666666666666667,
"grad_norm": 0.7301760680360758,
"learning_rate": 4.270045940495879e-06,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0900624692440033,
"step": 3570,
"valid_targets_mean": 2651.0,
"valid_targets_min": 1582
},
{
"epoch": 5.674603174603175,
"grad_norm": 0.7547968526194967,
"learning_rate": 4.221284746197292e-06,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08366125822067261,
"step": 3575,
"valid_targets_mean": 2382.6,
"valid_targets_min": 988
},
{
"epoch": 5.682539682539683,
"grad_norm": 0.8234421252575538,
"learning_rate": 4.172770695077437e-06,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11100704967975616,
"step": 3580,
"valid_targets_mean": 2705.6,
"valid_targets_min": 1352
},
{
"epoch": 5.690476190476191,
"grad_norm": 0.8174606359388051,
"learning_rate": 4.124504547015487e-06,
"loss": 0.2213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1208464503288269,
"step": 3585,
"valid_targets_mean": 3083.4,
"valid_targets_min": 1639
},
{
"epoch": 5.698412698412699,
"grad_norm": 0.7562999444174163,
"learning_rate": 4.0764870580076675e-06,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0921013206243515,
"step": 3590,
"valid_targets_mean": 2875.4,
"valid_targets_min": 806
},
{
"epoch": 5.7063492063492065,
"grad_norm": 0.7965104320892732,
"learning_rate": 4.0287189801554304e-06,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09799252450466156,
"step": 3595,
"valid_targets_mean": 3153.5,
"valid_targets_min": 1286
},
{
"epoch": 5.714285714285714,
"grad_norm": 0.857269142950299,
"learning_rate": 3.98120106165371e-06,
"loss": 0.2133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08865942060947418,
"step": 3600,
"valid_targets_mean": 2800.6,
"valid_targets_min": 656
},
{
"epoch": 5.722222222222222,
"grad_norm": 0.7527257186466023,
"learning_rate": 3.933934046779164e-06,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09972484409809113,
"step": 3605,
"valid_targets_mean": 2838.0,
"valid_targets_min": 1631
},
{
"epoch": 5.73015873015873,
"grad_norm": 0.5994753331151756,
"learning_rate": 3.886918675878513e-06,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08137780427932739,
"step": 3610,
"valid_targets_mean": 4263.1,
"valid_targets_min": 2086
},
{
"epoch": 5.738095238095238,
"grad_norm": 0.8232153717265387,
"learning_rate": 3.840155685356983e-06,
"loss": 0.2177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09935421496629715,
"step": 3615,
"valid_targets_mean": 2672.6,
"valid_targets_min": 1511
},
{
"epoch": 5.746031746031746,
"grad_norm": 0.750128536941153,
"learning_rate": 3.793645807666735e-06,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1128338873386383,
"step": 3620,
"valid_targets_mean": 3398.9,
"valid_targets_min": 1313
},
{
"epoch": 5.753968253968254,
"grad_norm": 0.7880891847487402,
"learning_rate": 3.747389771295411e-06,
"loss": 0.2213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10944647341966629,
"step": 3625,
"valid_targets_mean": 2556.5,
"valid_targets_min": 1189
},
{
"epoch": 5.761904761904762,
"grad_norm": 0.6786715199961021,
"learning_rate": 3.701388300754709e-06,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11284029483795166,
"step": 3630,
"valid_targets_mean": 4237.8,
"valid_targets_min": 1348
},
{
"epoch": 5.76984126984127,
"grad_norm": 0.786402047995528,
"learning_rate": 3.6556421165690516e-06,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1069340705871582,
"step": 3635,
"valid_targets_mean": 3257.5,
"valid_targets_min": 1574
},
{
"epoch": 5.777777777777778,
"grad_norm": 0.9927590000924167,
"learning_rate": 3.610151935264288e-06,
"loss": 0.211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08624372631311417,
"step": 3640,
"valid_targets_mean": 2332.5,
"valid_targets_min": 318
},
{
"epoch": 5.785714285714286,
"grad_norm": 0.7575310728766175,
"learning_rate": 3.5649184693564797e-06,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08996361494064331,
"step": 3645,
"valid_targets_mean": 2656.9,
"valid_targets_min": 634
},
{
"epoch": 5.7936507936507935,
"grad_norm": 0.6353430242205899,
"learning_rate": 3.5199424273407277e-06,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09710676968097687,
"step": 3650,
"valid_targets_mean": 4277.1,
"valid_targets_min": 2470
},
{
"epoch": 5.801587301587301,
"grad_norm": 0.8104745502933571,
"learning_rate": 3.4752245136801065e-06,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09580199420452118,
"step": 3655,
"valid_targets_mean": 2233.1,
"valid_targets_min": 1041
},
{
"epoch": 5.809523809523809,
"grad_norm": 0.8218115415777589,
"learning_rate": 3.430765428794569e-06,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09398232400417328,
"step": 3660,
"valid_targets_mean": 2095.1,
"valid_targets_min": 974
},
{
"epoch": 5.817460317460317,
"grad_norm": 0.8000713802610769,
"learning_rate": 3.3865658690500424e-06,
"loss": 0.214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10749034583568573,
"step": 3665,
"valid_targets_mean": 3013.5,
"valid_targets_min": 728
},
{
"epoch": 5.825396825396825,
"grad_norm": 0.816997724762598,
"learning_rate": 3.34262652674749e-06,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1072094738483429,
"step": 3670,
"valid_targets_mean": 3302.1,
"valid_targets_min": 1243
},
{
"epoch": 5.833333333333333,
"grad_norm": 0.7748883081700283,
"learning_rate": 3.2989480901120684e-06,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05944449454545975,
"step": 3675,
"valid_targets_mean": 1702.4,
"valid_targets_min": 1121
},
{
"epoch": 5.841269841269841,
"grad_norm": 0.7205680487267188,
"learning_rate": 3.2555312432823283e-06,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0655689686536789,
"step": 3680,
"valid_targets_mean": 2465.4,
"valid_targets_min": 1310
},
{
"epoch": 5.849206349206349,
"grad_norm": 0.7713827436038354,
"learning_rate": 3.2123766662995572e-06,
"loss": 0.2146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11447322368621826,
"step": 3685,
"valid_targets_mean": 3081.1,
"valid_targets_min": 804
},
{
"epoch": 5.857142857142857,
"grad_norm": 0.6412703691192485,
"learning_rate": 3.1694850350970686e-06,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13718387484550476,
"step": 3690,
"valid_targets_mean": 5159.6,
"valid_targets_min": 1106
},
{
"epoch": 5.865079365079366,
"grad_norm": 0.7311165566889636,
"learning_rate": 3.1268570214896265e-06,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10165748745203018,
"step": 3695,
"valid_targets_mean": 3384.6,
"valid_targets_min": 767
},
{
"epoch": 5.8730158730158735,
"grad_norm": 0.838423608791939,
"learning_rate": 3.0844932931629602e-06,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08572743833065033,
"step": 3700,
"valid_targets_mean": 2373.0,
"valid_targets_min": 1190
},
{
"epoch": 5.880952380952381,
"grad_norm": 0.6958758298936207,
"learning_rate": 3.0423945136632626e-06,
"loss": 0.2172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07737462967634201,
"step": 3705,
"valid_targets_mean": 2863.1,
"valid_targets_min": 735
},
{
"epoch": 5.888888888888889,
"grad_norm": 0.6597673477275796,
"learning_rate": 3.000561342386814e-06,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10114225745201111,
"step": 3710,
"valid_targets_mean": 3721.8,
"valid_targets_min": 1506
},
{
"epoch": 5.896825396825397,
"grad_norm": 0.8306491531882909,
"learning_rate": 2.9589944345696596e-06,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11550882458686829,
"step": 3715,
"valid_targets_mean": 2761.6,
"valid_targets_min": 1327
},
{
"epoch": 5.904761904761905,
"grad_norm": 0.8683852586162994,
"learning_rate": 2.9176944412773322e-06,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09660732746124268,
"step": 3720,
"valid_targets_mean": 2080.1,
"valid_targets_min": 572
},
{
"epoch": 5.912698412698413,
"grad_norm": 0.7251086912309824,
"learning_rate": 2.876662009394673e-06,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12001783400774002,
"step": 3725,
"valid_targets_mean": 3939.5,
"valid_targets_min": 1282
},
{
"epoch": 5.920634920634921,
"grad_norm": 0.8129360177739626,
"learning_rate": 2.8358977816156796e-06,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10110355913639069,
"step": 3730,
"valid_targets_mean": 3384.8,
"valid_targets_min": 2192
},
{
"epoch": 5.928571428571429,
"grad_norm": 0.7180542554037956,
"learning_rate": 2.7954023964334485e-06,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09065502882003784,
"step": 3735,
"valid_targets_mean": 2732.5,
"valid_targets_min": 1448
},
{
"epoch": 5.936507936507937,
"grad_norm": 0.8552826097328355,
"learning_rate": 2.7551764881301955e-06,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08631910383701324,
"step": 3740,
"valid_targets_mean": 2285.6,
"valid_targets_min": 1428
},
{
"epoch": 5.944444444444445,
"grad_norm": 0.6262989640665731,
"learning_rate": 2.715220686767268e-06,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10843861103057861,
"step": 3745,
"valid_targets_mean": 5061.1,
"valid_targets_min": 1356
},
{
"epoch": 5.9523809523809526,
"grad_norm": 0.7897971423207434,
"learning_rate": 2.6755356181753247e-06,
"loss": 0.2083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10058259963989258,
"step": 3750,
"valid_targets_mean": 3069.1,
"valid_targets_min": 1088
},
{
"epoch": 5.9603174603174605,
"grad_norm": 0.7636236084851435,
"learning_rate": 2.6361219039445328e-06,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08092188835144043,
"step": 3755,
"valid_targets_mean": 2315.1,
"valid_targets_min": 611
},
{
"epoch": 5.968253968253968,
"grad_norm": 0.6963273983529872,
"learning_rate": 2.5969801614147838e-06,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1218203455209732,
"step": 3760,
"valid_targets_mean": 4196.5,
"valid_targets_min": 1130
},
{
"epoch": 5.976190476190476,
"grad_norm": 0.6948330177609254,
"learning_rate": 2.558111003666075e-06,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09535790979862213,
"step": 3765,
"valid_targets_mean": 2892.5,
"valid_targets_min": 1354
},
{
"epoch": 5.984126984126984,
"grad_norm": 0.7485809892595101,
"learning_rate": 2.519515039508893e-06,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12762418389320374,
"step": 3770,
"valid_targets_mean": 4171.5,
"valid_targets_min": 1710
},
{
"epoch": 5.992063492063492,
"grad_norm": 0.7209339180022664,
"learning_rate": 2.481192873474667e-06,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14580002427101135,
"step": 3775,
"valid_targets_mean": 4015.1,
"valid_targets_min": 1347
},
{
"epoch": 6.0,
"grad_norm": 0.7486824941956289,
"learning_rate": 2.4431451058062928e-06,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12455324083566666,
"step": 3780,
"valid_targets_mean": 3672.8,
"valid_targets_min": 994
},
{
"epoch": 6.007936507936508,
"grad_norm": 0.6782508888637717,
"learning_rate": 2.4053723324487677e-06,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0711774080991745,
"step": 3785,
"valid_targets_mean": 2518.9,
"valid_targets_min": 1545
},
{
"epoch": 6.015873015873016,
"grad_norm": 0.6911427139250138,
"learning_rate": 2.3678751450398196e-06,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11248598247766495,
"step": 3790,
"valid_targets_mean": 3788.2,
"valid_targets_min": 601
},
{
"epoch": 6.023809523809524,
"grad_norm": 0.7538661391977503,
"learning_rate": 2.330654130900656e-06,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08532236516475677,
"step": 3795,
"valid_targets_mean": 2292.0,
"valid_targets_min": 1204
},
{
"epoch": 6.031746031746032,
"grad_norm": 0.8225525420805956,
"learning_rate": 2.2937098730267572e-06,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1298900842666626,
"step": 3800,
"valid_targets_mean": 3416.4,
"valid_targets_min": 1501
},
{
"epoch": 6.0396825396825395,
"grad_norm": 0.7635534745827315,
"learning_rate": 2.2570429500787604e-06,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0920785516500473,
"step": 3805,
"valid_targets_mean": 2786.8,
"valid_targets_min": 1354
},
{
"epoch": 6.0476190476190474,
"grad_norm": 0.659940926257208,
"learning_rate": 2.2206539363733738e-06,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05400678142905235,
"step": 3810,
"valid_targets_mean": 2275.5,
"valid_targets_min": 364
},
{
"epoch": 6.055555555555555,
"grad_norm": 0.6973295697920284,
"learning_rate": 2.1845434018744038e-06,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12242526561021805,
"step": 3815,
"valid_targets_mean": 4405.4,
"valid_targets_min": 1473
},
{
"epoch": 6.063492063492063,
"grad_norm": 0.8213586989325722,
"learning_rate": 2.148711912183803e-06,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1367570012807846,
"step": 3820,
"valid_targets_mean": 3735.0,
"valid_targets_min": 1120
},
{
"epoch": 6.071428571428571,
"grad_norm": 0.679938514817628,
"learning_rate": 2.1131600285328458e-06,
"loss": 0.2193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09106817096471786,
"step": 3825,
"valid_targets_mean": 4257.8,
"valid_targets_min": 1554
},
{
"epoch": 6.079365079365079,
"grad_norm": 0.6807386614704928,
"learning_rate": 2.0778883077732903e-06,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12356531620025635,
"step": 3830,
"valid_targets_mean": 5071.1,
"valid_targets_min": 1373
},
{
"epoch": 6.087301587301587,
"grad_norm": 0.7553925830584054,
"learning_rate": 2.0428973023686983e-06,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10499994456768036,
"step": 3835,
"valid_targets_mean": 3480.4,
"valid_targets_min": 1535
},
{
"epoch": 6.095238095238095,
"grad_norm": 0.888088778216751,
"learning_rate": 2.0081875603857726e-06,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10103853046894073,
"step": 3840,
"valid_targets_mean": 2299.6,
"valid_targets_min": 1160
},
{
"epoch": 6.103174603174603,
"grad_norm": 0.6779555773520787,
"learning_rate": 1.973759625485743e-06,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10814555734395981,
"step": 3845,
"valid_targets_mean": 3903.9,
"valid_targets_min": 811
},
{
"epoch": 6.111111111111111,
"grad_norm": 0.6945692361650982,
"learning_rate": 1.9396140369159e-06,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0844080001115799,
"step": 3850,
"valid_targets_mean": 3611.2,
"valid_targets_min": 845
},
{
"epoch": 6.119047619047619,
"grad_norm": 0.819841381174835,
"learning_rate": 1.9057513295011087e-06,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17100293934345245,
"step": 3855,
"valid_targets_mean": 3577.8,
"valid_targets_min": 655
},
{
"epoch": 6.1269841269841265,
"grad_norm": 0.6920995453717935,
"learning_rate": 1.8721720336354487e-06,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07847906649112701,
"step": 3860,
"valid_targets_mean": 2644.1,
"valid_targets_min": 1056
},
{
"epoch": 6.134920634920635,
"grad_norm": 0.7097918126712862,
"learning_rate": 1.8388766752739017e-06,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09960925579071045,
"step": 3865,
"valid_targets_mean": 3381.4,
"valid_targets_min": 1443
},
{
"epoch": 6.142857142857143,
"grad_norm": 0.6413975048934565,
"learning_rate": 1.805865775924116e-06,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09482008218765259,
"step": 3870,
"valid_targets_mean": 5026.4,
"valid_targets_min": 1530
},
{
"epoch": 6.150793650793651,
"grad_norm": 0.7978109804263973,
"learning_rate": 1.7731398526382416e-06,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14775651693344116,
"step": 3875,
"valid_targets_mean": 3349.0,
"valid_targets_min": 1775
},
{
"epoch": 6.158730158730159,
"grad_norm": 0.6618833893869975,
"learning_rate": 1.7406994180048231e-06,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08926299959421158,
"step": 3880,
"valid_targets_mean": 3658.2,
"valid_targets_min": 778
},
{
"epoch": 6.166666666666667,
"grad_norm": 0.6268145598843055,
"learning_rate": 1.7085449801407783e-06,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10563044995069504,
"step": 3885,
"valid_targets_mean": 4803.8,
"valid_targets_min": 2923
},
{
"epoch": 6.174603174603175,
"grad_norm": 0.7930198414251461,
"learning_rate": 1.67667704268343e-06,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09213380515575409,
"step": 3890,
"valid_targets_mean": 3095.4,
"valid_targets_min": 1281
},
{
"epoch": 6.182539682539683,
"grad_norm": 0.7855535649914588,
"learning_rate": 1.6450961047826353e-06,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10935674607753754,
"step": 3895,
"valid_targets_mean": 3000.8,
"valid_targets_min": 729
},
{
"epoch": 6.190476190476191,
"grad_norm": 0.7167832062061632,
"learning_rate": 1.6138026610929446e-06,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0821952372789383,
"step": 3900,
"valid_targets_mean": 3084.2,
"valid_targets_min": 1591
},
{
"epoch": 6.198412698412699,
"grad_norm": 0.7355915549419297,
"learning_rate": 1.5827972017658732e-06,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07168291509151459,
"step": 3905,
"valid_targets_mean": 2457.8,
"valid_targets_min": 1347
},
{
"epoch": 6.2063492063492065,
"grad_norm": 0.7339590222002838,
"learning_rate": 1.5520802124422108e-06,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06518985331058502,
"step": 3910,
"valid_targets_mean": 2686.0,
"valid_targets_min": 1446
},
{
"epoch": 6.214285714285714,
"grad_norm": 0.7700254235965525,
"learning_rate": 1.5216521742444236e-06,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10491657257080078,
"step": 3915,
"valid_targets_mean": 3282.0,
"valid_targets_min": 619
},
{
"epoch": 6.222222222222222,
"grad_norm": 0.7706206197929331,
"learning_rate": 1.491513563769118e-06,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1297735571861267,
"step": 3920,
"valid_targets_mean": 3537.9,
"valid_targets_min": 1342
},
{
"epoch": 6.23015873015873,
"grad_norm": 0.7125278750032971,
"learning_rate": 1.4616648530795673e-06,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12319030612707138,
"step": 3925,
"valid_targets_mean": 4568.1,
"valid_targets_min": 1083
},
{
"epoch": 6.238095238095238,
"grad_norm": 0.7509002816161764,
"learning_rate": 1.432106509698319e-06,
"loss": 0.2126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10249030590057373,
"step": 3930,
"valid_targets_mean": 3594.0,
"valid_targets_min": 972
},
{
"epoch": 6.246031746031746,
"grad_norm": 0.8970120821160956,
"learning_rate": 1.4028389965998867e-06,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10491965711116791,
"step": 3935,
"valid_targets_mean": 2135.4,
"valid_targets_min": 1377
},
{
"epoch": 6.253968253968254,
"grad_norm": 0.8134853281807751,
"learning_rate": 1.3738627722034848e-06,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08832602202892303,
"step": 3940,
"valid_targets_mean": 2626.1,
"valid_targets_min": 1053
},
{
"epoch": 6.261904761904762,
"grad_norm": 0.7862015024702198,
"learning_rate": 1.345178290365845e-06,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07818420976400375,
"step": 3945,
"valid_targets_mean": 2288.4,
"valid_targets_min": 1510
},
{
"epoch": 6.26984126984127,
"grad_norm": 0.8454958849822186,
"learning_rate": 1.3167860003741218e-06,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11491268873214722,
"step": 3950,
"valid_targets_mean": 3148.0,
"valid_targets_min": 1319
},
{
"epoch": 6.277777777777778,
"grad_norm": 0.9550952759949879,
"learning_rate": 1.2886863469388389e-06,
"loss": 0.2159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08679212629795074,
"step": 3955,
"valid_targets_mean": 1462.1,
"valid_targets_min": 930
},
{
"epoch": 6.285714285714286,
"grad_norm": 0.6798761734084032,
"learning_rate": 1.2608797701869425e-06,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1112833023071289,
"step": 3960,
"valid_targets_mean": 4642.1,
"valid_targets_min": 734
},
{
"epoch": 6.2936507936507935,
"grad_norm": 0.7161938785556553,
"learning_rate": 1.2333667056548881e-06,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0901009738445282,
"step": 3965,
"valid_targets_mean": 3483.0,
"valid_targets_min": 1438
},
{
"epoch": 6.301587301587301,
"grad_norm": 0.7919495256788115,
"learning_rate": 1.2061475842818337e-06,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10928655415773392,
"step": 3970,
"valid_targets_mean": 3111.4,
"valid_targets_min": 1159
},
{
"epoch": 6.309523809523809,
"grad_norm": 0.6622868143264027,
"learning_rate": 1.1792228324028776e-06,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0938882902264595,
"step": 3975,
"valid_targets_mean": 4688.2,
"valid_targets_min": 1526
},
{
"epoch": 6.317460317460317,
"grad_norm": 0.714843100243358,
"learning_rate": 1.152592871742395e-06,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08914178609848022,
"step": 3980,
"valid_targets_mean": 3923.6,
"valid_targets_min": 1905
},
{
"epoch": 6.325396825396825,
"grad_norm": 0.7459606794822701,
"learning_rate": 1.1262581194074152e-06,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13458332419395447,
"step": 3985,
"valid_targets_mean": 3634.6,
"valid_targets_min": 1182
},
{
"epoch": 6.333333333333333,
"grad_norm": 0.7535897780328545,
"learning_rate": 1.100218987881112e-06,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08394159376621246,
"step": 3990,
"valid_targets_mean": 2917.5,
"valid_targets_min": 1433
},
{
"epoch": 6.341269841269841,
"grad_norm": 0.6530045323214579,
"learning_rate": 1.0744758850163085e-06,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12506398558616638,
"step": 3995,
"valid_targets_mean": 4917.4,
"valid_targets_min": 1066
},
{
"epoch": 6.349206349206349,
"grad_norm": 0.7979509577422987,
"learning_rate": 1.0490292140291247e-06,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11587633192539215,
"step": 4000,
"valid_targets_mean": 2967.2,
"valid_targets_min": 1396
},
{
"epoch": 6.357142857142857,
"grad_norm": 0.8755874967319832,
"learning_rate": 1.0238793734926467e-06,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13597938418388367,
"step": 4005,
"valid_targets_mean": 2481.9,
"valid_targets_min": 1132
},
{
"epoch": 6.365079365079365,
"grad_norm": 0.6783876323503061,
"learning_rate": 9.990267573306745e-07,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10617756843566895,
"step": 4010,
"valid_targets_mean": 4420.9,
"valid_targets_min": 1257
},
{
"epoch": 6.3730158730158735,
"grad_norm": 0.722469792560784,
"learning_rate": 9.744717548115613e-07,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09820477664470673,
"step": 4015,
"valid_targets_mean": 3403.4,
"valid_targets_min": 1298
},
{
"epoch": 6.380952380952381,
"grad_norm": 0.733459872022677,
"learning_rate": 9.502147505421244e-07,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08142758905887604,
"step": 4020,
"valid_targets_mean": 2535.2,
"valid_targets_min": 1200
},
{
"epoch": 6.388888888888889,
"grad_norm": 0.8345987403978284,
"learning_rate": 9.262561244616108e-07,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10948467999696732,
"step": 4025,
"valid_targets_mean": 3486.9,
"valid_targets_min": 1180
},
{
"epoch": 6.396825396825397,
"grad_norm": 0.7819290637056325,
"learning_rate": 9.025962518357323e-07,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09386520832777023,
"step": 4030,
"valid_targets_mean": 4022.1,
"valid_targets_min": 2193
},
{
"epoch": 6.404761904761905,
"grad_norm": 0.7675973062209386,
"learning_rate": 8.792355032508282e-07,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10054197907447815,
"step": 4035,
"valid_targets_mean": 3192.8,
"valid_targets_min": 1637
},
{
"epoch": 6.412698412698413,
"grad_norm": 0.7308179209216745,
"learning_rate": 8.561742446080168e-07,
"loss": 0.2261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13068924844264984,
"step": 4040,
"valid_targets_mean": 4124.1,
"valid_targets_min": 819
},
{
"epoch": 6.420634920634921,
"grad_norm": 0.7949394003439152,
"learning_rate": 8.334128371174955e-07,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09118463099002838,
"step": 4045,
"valid_targets_mean": 2320.0,
"valid_targets_min": 1229
},
{
"epoch": 6.428571428571429,
"grad_norm": 0.8482819989896451,
"learning_rate": 8.109516372928605e-07,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09792070090770721,
"step": 4050,
"valid_targets_mean": 2030.2,
"valid_targets_min": 906
},
{
"epoch": 6.436507936507937,
"grad_norm": 0.6555352946842179,
"learning_rate": 7.887909969455366e-07,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10069252550601959,
"step": 4055,
"valid_targets_mean": 4303.4,
"valid_targets_min": 2117
},
{
"epoch": 6.444444444444445,
"grad_norm": 0.7356412967204531,
"learning_rate": 7.669312631792758e-07,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09753116965293884,
"step": 4060,
"valid_targets_mean": 3563.4,
"valid_targets_min": 1759
},
{
"epoch": 6.4523809523809526,
"grad_norm": 0.831688287232052,
"learning_rate": 7.453727783846876e-07,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13499116897583008,
"step": 4065,
"valid_targets_mean": 3057.4,
"valid_targets_min": 1139
},
{
"epoch": 6.4603174603174605,
"grad_norm": 0.7591710445025716,
"learning_rate": 7.241158802339065e-07,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1253347396850586,
"step": 4070,
"valid_targets_mean": 3662.1,
"valid_targets_min": 785
},
{
"epoch": 6.468253968253968,
"grad_norm": 0.6810251121546419,
"learning_rate": 7.031609016753016e-07,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07710853219032288,
"step": 4075,
"valid_targets_mean": 2938.1,
"valid_targets_min": 1201
},
{
"epoch": 6.476190476190476,
"grad_norm": 0.7354002690469413,
"learning_rate": 6.825081709282377e-07,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10170842707157135,
"step": 4080,
"valid_targets_mean": 3541.6,
"valid_targets_min": 759
},
{
"epoch": 6.484126984126984,
"grad_norm": 0.6860941434399659,
"learning_rate": 6.62158011477958e-07,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08662896603345871,
"step": 4085,
"valid_targets_mean": 3065.5,
"valid_targets_min": 1368
},
{
"epoch": 6.492063492063492,
"grad_norm": 0.8315820409255328,
"learning_rate": 6.421107420705097e-07,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10763676464557648,
"step": 4090,
"valid_targets_mean": 2476.9,
"valid_targets_min": 1314
},
{
"epoch": 6.5,
"grad_norm": 0.6779255746870322,
"learning_rate": 6.223666767077508e-07,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10068156570196152,
"step": 4095,
"valid_targets_mean": 4325.5,
"valid_targets_min": 733
},
{
"epoch": 6.507936507936508,
"grad_norm": 0.703785843801452,
"learning_rate": 6.029261246424267e-07,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08343538641929626,
"step": 4100,
"valid_targets_mean": 3569.0,
"valid_targets_min": 1165
},
{
"epoch": 6.515873015873016,
"grad_norm": 0.8180230926027161,
"learning_rate": 5.837893903733394e-07,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1009148359298706,
"step": 4105,
"valid_targets_mean": 2869.2,
"valid_targets_min": 907
},
{
"epoch": 6.523809523809524,
"grad_norm": 0.8734844267563727,
"learning_rate": 5.649567736405681e-07,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09930504113435745,
"step": 4110,
"valid_targets_mean": 2767.9,
"valid_targets_min": 1455
},
{
"epoch": 6.531746031746032,
"grad_norm": 0.7514289018139494,
"learning_rate": 5.464285694207672e-07,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11243937909603119,
"step": 4115,
"valid_targets_mean": 4020.0,
"valid_targets_min": 1291
},
{
"epoch": 6.5396825396825395,
"grad_norm": 0.6536374909100122,
"learning_rate": 5.282050679225714e-07,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10605214536190033,
"step": 4120,
"valid_targets_mean": 3659.0,
"valid_targets_min": 1727
},
{
"epoch": 6.5476190476190474,
"grad_norm": 0.792550081612281,
"learning_rate": 5.102865545820245e-07,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15852200984954834,
"step": 4125,
"valid_targets_mean": 3726.1,
"valid_targets_min": 1391
},
{
"epoch": 6.555555555555555,
"grad_norm": 0.6031293409437452,
"learning_rate": 4.926733100581182e-07,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0508820079267025,
"step": 4130,
"valid_targets_mean": 3083.6,
"valid_targets_min": 1152
},
{
"epoch": 6.563492063492063,
"grad_norm": 0.9382734552288612,
"learning_rate": 4.7536561022840213e-07,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12225069105625153,
"step": 4135,
"valid_targets_mean": 2312.8,
"valid_targets_min": 1435
},
{
"epoch": 6.571428571428571,
"grad_norm": 0.8645030624347266,
"learning_rate": 4.5836372618464964e-07,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10689771175384521,
"step": 4140,
"valid_targets_mean": 2341.1,
"valid_targets_min": 725
},
{
"epoch": 6.579365079365079,
"grad_norm": 0.6811962105069355,
"learning_rate": 4.416679242286215e-07,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09631943702697754,
"step": 4145,
"valid_targets_mean": 4323.8,
"valid_targets_min": 1536
},
{
"epoch": 6.587301587301587,
"grad_norm": 0.9350005697667735,
"learning_rate": 4.2527846586789547e-07,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10233885049819946,
"step": 4150,
"valid_targets_mean": 1772.5,
"valid_targets_min": 645
},
{
"epoch": 6.595238095238095,
"grad_norm": 0.7013237365598121,
"learning_rate": 4.0919560781176317e-07,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09215062111616135,
"step": 4155,
"valid_targets_mean": 3150.1,
"valid_targets_min": 1088
},
{
"epoch": 6.603174603174603,
"grad_norm": 0.6666170005950856,
"learning_rate": 3.934196019672176e-07,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06517612934112549,
"step": 4160,
"valid_targets_mean": 2124.1,
"valid_targets_min": 715
},
{
"epoch": 6.611111111111111,
"grad_norm": 0.7153573335048872,
"learning_rate": 3.779506954349965e-07,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09253278374671936,
"step": 4165,
"valid_targets_mean": 3570.9,
"valid_targets_min": 1996
},
{
"epoch": 6.619047619047619,
"grad_norm": 0.6315001261313217,
"learning_rate": 3.6278913050572076e-07,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09306520223617554,
"step": 4170,
"valid_targets_mean": 4232.5,
"valid_targets_min": 1537
},
{
"epoch": 6.6269841269841265,
"grad_norm": 0.815649453820826,
"learning_rate": 3.4793514465610414e-07,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11297182738780975,
"step": 4175,
"valid_targets_mean": 3307.9,
"valid_targets_min": 1436
},
{
"epoch": 6.634920634920634,
"grad_norm": 0.8506804351795452,
"learning_rate": 3.3338897054521205e-07,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07656246423721313,
"step": 4180,
"valid_targets_mean": 1789.6,
"valid_targets_min": 825
},
{
"epoch": 6.642857142857143,
"grad_norm": 0.6360744471035349,
"learning_rate": 3.191508360108464e-07,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11496680974960327,
"step": 4185,
"valid_targets_mean": 4958.0,
"valid_targets_min": 1201
},
{
"epoch": 6.650793650793651,
"grad_norm": 0.7875567736431006,
"learning_rate": 3.0522096406595536e-07,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07022293657064438,
"step": 4190,
"valid_targets_mean": 2186.5,
"valid_targets_min": 695
},
{
"epoch": 6.658730158730159,
"grad_norm": 0.7266157867648473,
"learning_rate": 2.9159957289514926e-07,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08252222090959549,
"step": 4195,
"valid_targets_mean": 3179.4,
"valid_targets_min": 1158
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.7434994690323846,
"learning_rate": 2.782868758512791e-07,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11222994327545166,
"step": 4200,
"valid_targets_mean": 3610.9,
"valid_targets_min": 1092
},
{
"epoch": 6.674603174603175,
"grad_norm": 0.9804608900117372,
"learning_rate": 2.6528308145210125e-07,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11486151814460754,
"step": 4205,
"valid_targets_mean": 2239.6,
"valid_targets_min": 1147
},
{
"epoch": 6.682539682539683,
"grad_norm": 0.8248478366294771,
"learning_rate": 2.525883933770046e-07,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09823493659496307,
"step": 4210,
"valid_targets_mean": 3023.0,
"valid_targets_min": 995
},
{
"epoch": 6.690476190476191,
"grad_norm": 0.6927076587244559,
"learning_rate": 2.402030104638198e-07,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08244895935058594,
"step": 4215,
"valid_targets_mean": 3867.2,
"valid_targets_min": 1395
},
{
"epoch": 6.698412698412699,
"grad_norm": 0.8426480786347594,
"learning_rate": 2.2812712670571502e-07,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08320321142673492,
"step": 4220,
"valid_targets_mean": 2116.5,
"valid_targets_min": 1014
},
{
"epoch": 6.7063492063492065,
"grad_norm": 0.6551086035705184,
"learning_rate": 2.1636093124814738e-07,
"loss": 0.1973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09654587507247925,
"step": 4225,
"valid_targets_mean": 4037.6,
"valid_targets_min": 1436
},
{
"epoch": 6.714285714285714,
"grad_norm": 0.6617880708598886,
"learning_rate": 2.0490460838589855e-07,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10055264830589294,
"step": 4230,
"valid_targets_mean": 4157.2,
"valid_targets_min": 722
},
{
"epoch": 6.722222222222222,
"grad_norm": 0.7010021079670415,
"learning_rate": 1.9375833756019923e-07,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06797967851161957,
"step": 4235,
"valid_targets_mean": 2408.1,
"valid_targets_min": 819
},
{
"epoch": 6.73015873015873,
"grad_norm": 0.7857502387885508,
"learning_rate": 1.8292229335590716e-07,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11493973433971405,
"step": 4240,
"valid_targets_mean": 3881.6,
"valid_targets_min": 1440
},
{
"epoch": 6.738095238095238,
"grad_norm": 0.6685857676840744,
"learning_rate": 1.7239664549878688e-07,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11982367932796478,
"step": 4245,
"valid_targets_mean": 4794.2,
"valid_targets_min": 663
},
{
"epoch": 6.746031746031746,
"grad_norm": 0.8352380931276744,
"learning_rate": 1.6218155885283192e-07,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09608037769794464,
"step": 4250,
"valid_targets_mean": 2731.6,
"valid_targets_min": 1142
},
{
"epoch": 6.753968253968254,
"grad_norm": 0.7422039573980747,
"learning_rate": 1.5227719341769364e-07,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10857705026865005,
"step": 4255,
"valid_targets_mean": 4047.4,
"valid_targets_min": 1023
},
{
"epoch": 6.761904761904762,
"grad_norm": 0.8106967225306234,
"learning_rate": 1.4268370432618306e-07,
"loss": 0.2092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11048707365989685,
"step": 4260,
"valid_targets_mean": 3013.6,
"valid_targets_min": 1213
},
{
"epoch": 6.76984126984127,
"grad_norm": 0.6751488059587877,
"learning_rate": 1.3340124184182178e-07,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08324621617794037,
"step": 4265,
"valid_targets_mean": 2745.6,
"valid_targets_min": 838
},
{
"epoch": 6.777777777777778,
"grad_norm": 0.8655488128813514,
"learning_rate": 1.2442995135650393e-07,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08682005107402802,
"step": 4270,
"valid_targets_mean": 1827.8,
"valid_targets_min": 677
},
{
"epoch": 6.785714285714286,
"grad_norm": 0.7408048732361547,
"learning_rate": 1.1576997338821339e-07,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08840866386890411,
"step": 4275,
"valid_targets_mean": 3092.5,
"valid_targets_min": 1099
},
{
"epoch": 6.7936507936507935,
"grad_norm": 0.7105155741932084,
"learning_rate": 1.0742144357882567e-07,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07121296972036362,
"step": 4280,
"valid_targets_mean": 3423.8,
"valid_targets_min": 1620
},
{
"epoch": 6.801587301587301,
"grad_norm": 0.7068956813433978,
"learning_rate": 9.938449269197181e-08,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0767413005232811,
"step": 4285,
"valid_targets_mean": 3846.8,
"valid_targets_min": 1080
},
{
"epoch": 6.809523809523809,
"grad_norm": 0.6965119531557177,
"learning_rate": 9.165924661100889e-08,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09733986854553223,
"step": 4290,
"valid_targets_mean": 4943.8,
"valid_targets_min": 1648
},
{
"epoch": 6.817460317460317,
"grad_norm": 0.624576583182396,
"learning_rate": 8.424582633703493e-08,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09332321584224701,
"step": 4295,
"valid_targets_mean": 4326.4,
"valid_targets_min": 1787
},
{
"epoch": 6.825396825396825,
"grad_norm": 0.7482091326815062,
"learning_rate": 7.714434798699933e-08,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08122950047254562,
"step": 4300,
"valid_targets_mean": 2637.1,
"valid_targets_min": 1151
},
{
"epoch": 6.833333333333333,
"grad_norm": 0.7797234183323177,
"learning_rate": 7.035492279187538e-08,
"loss": 0.2058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1142660602927208,
"step": 4305,
"valid_targets_mean": 3337.1,
"valid_targets_min": 1051
},
{
"epoch": 6.841269841269841,
"grad_norm": 0.7603070154020699,
"learning_rate": 6.387765709493288e-08,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11581508815288544,
"step": 4310,
"valid_targets_mean": 3581.8,
"valid_targets_min": 1559
},
{
"epoch": 6.849206349206349,
"grad_norm": 0.8265224795703434,
"learning_rate": 5.7712652350061515e-08,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1010211855173111,
"step": 4315,
"valid_targets_mean": 2683.1,
"valid_targets_min": 1159
},
{
"epoch": 6.857142857142857,
"grad_norm": 0.8763516568425196,
"learning_rate": 5.186000512018341e-08,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12908044457435608,
"step": 4320,
"valid_targets_mean": 3439.4,
"valid_targets_min": 1869
},
{
"epoch": 6.865079365079366,
"grad_norm": 0.7573392781428435,
"learning_rate": 4.631980707574535e-08,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11205847561359406,
"step": 4325,
"valid_targets_mean": 3704.8,
"valid_targets_min": 721
},
{
"epoch": 6.8730158730158735,
"grad_norm": 0.7230981939132772,
"learning_rate": 4.10921449932733e-08,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13283637166023254,
"step": 4330,
"valid_targets_mean": 4179.9,
"valid_targets_min": 1573
},
{
"epoch": 6.880952380952381,
"grad_norm": 0.7439954422056636,
"learning_rate": 3.61771007540268e-08,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1041351854801178,
"step": 4335,
"valid_targets_mean": 3090.6,
"valid_targets_min": 1286
},
{
"epoch": 6.888888888888889,
"grad_norm": 0.800212928436307,
"learning_rate": 3.157475134270227e-08,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1381809115409851,
"step": 4340,
"valid_targets_mean": 4396.8,
"valid_targets_min": 648
},
{
"epoch": 6.896825396825397,
"grad_norm": 0.7600538047962414,
"learning_rate": 2.728516884624277e-08,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09590177237987518,
"step": 4345,
"valid_targets_mean": 3049.9,
"valid_targets_min": 1365
},
{
"epoch": 6.904761904761905,
"grad_norm": 0.7875192862873142,
"learning_rate": 2.3308420452690106e-08,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09034988284111023,
"step": 4350,
"valid_targets_mean": 2993.2,
"valid_targets_min": 285
},
{
"epoch": 6.912698412698413,
"grad_norm": 0.7653025338992717,
"learning_rate": 1.9644568450147837e-08,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1180688887834549,
"step": 4355,
"valid_targets_mean": 3412.2,
"valid_targets_min": 1285
},
{
"epoch": 6.920634920634921,
"grad_norm": 0.776729001579722,
"learning_rate": 1.6293670225799864e-08,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1176794022321701,
"step": 4360,
"valid_targets_mean": 3754.5,
"valid_targets_min": 1897
},
{
"epoch": 6.928571428571429,
"grad_norm": 0.9428126914025173,
"learning_rate": 1.3255778265013342e-08,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10972875356674194,
"step": 4365,
"valid_targets_mean": 2532.8,
"valid_targets_min": 1014
},
{
"epoch": 6.936507936507937,
"grad_norm": 0.8284198122126346,
"learning_rate": 1.0530940150512703e-08,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08045537769794464,
"step": 4370,
"valid_targets_mean": 2189.8,
"valid_targets_min": 1005
},
{
"epoch": 6.944444444444445,
"grad_norm": 0.8350132511254953,
"learning_rate": 8.119198561638009e-09,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.090115025639534,
"step": 4375,
"valid_targets_mean": 2316.4,
"valid_targets_min": 696
},
{
"epoch": 6.9523809523809526,
"grad_norm": 0.821524042196439,
"learning_rate": 6.020591273674381e-09,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09740573167800903,
"step": 4380,
"valid_targets_mean": 2340.9,
"valid_targets_min": 1488
},
{
"epoch": 6.9603174603174605,
"grad_norm": 0.7332655762989541,
"learning_rate": 4.2351511572635835e-09,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08111314475536346,
"step": 4385,
"valid_targets_mean": 2680.2,
"valid_targets_min": 737
},
{
"epoch": 6.968253968253968,
"grad_norm": 0.7743587093318401,
"learning_rate": 2.7629061778866597e-09,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07953701913356781,
"step": 4390,
"valid_targets_mean": 2203.2,
"valid_targets_min": 1016
},
{
"epoch": 6.976190476190476,
"grad_norm": 0.7689455216523182,
"learning_rate": 1.603879395422059e-09,
"loss": 0.1993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1031486839056015,
"step": 4395,
"valid_targets_mean": 3022.2,
"valid_targets_min": 941
},
{
"epoch": 6.984126984126984,
"grad_norm": 0.7245017440420248,
"learning_rate": 7.580889637925914e-10,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08405288308858871,
"step": 4400,
"valid_targets_mean": 3571.1,
"valid_targets_min": 1048
},
{
"epoch": 6.992063492063492,
"grad_norm": 0.7740093811974629,
"learning_rate": 2.2554813067676705e-10,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1309514343738556,
"step": 4405,
"valid_targets_mean": 3787.1,
"valid_targets_min": 943
},
{
"epoch": 7.0,
"grad_norm": 0.7862017131182104,
"learning_rate": 6.265237300073778e-12,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12112488597631454,
"step": 4410,
"valid_targets_mean": 3677.4,
"valid_targets_min": 1243
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12112488597631454,
"step": 4410,
"total_flos": 1.1127298177168835e+18,
"train_loss": 0.27853014678641513,
"train_runtime": 38947.6166,
"train_samples_per_second": 1.811,
"train_steps_per_second": 0.113,
"valid_targets_mean": 3677.4,
"valid_targets_min": 1243
}
],
"logging_steps": 5,
"max_steps": 4410,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1000,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.1127298177168835e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}