g1_timeout_e1_gpt_long_tacc / trainer_state.json
EtashGuha's picture
Add files using upload-large-folder tool
4e3752f verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4347,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008051529790660225,
"grad_norm": 12.6211720137527,
"learning_rate": 3.6781609195402303e-07,
"loss": 0.8023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8141472339630127,
"step": 5,
"valid_targets_mean": 6454.3,
"valid_targets_min": 2941
},
{
"epoch": 0.01610305958132045,
"grad_norm": 13.535375108314145,
"learning_rate": 8.275862068965518e-07,
"loss": 0.779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7463928461074829,
"step": 10,
"valid_targets_mean": 6041.3,
"valid_targets_min": 3050
},
{
"epoch": 0.024154589371980676,
"grad_norm": 11.267948292741378,
"learning_rate": 1.2873563218390806e-06,
"loss": 0.7929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7566848993301392,
"step": 15,
"valid_targets_mean": 6337.3,
"valid_targets_min": 3318
},
{
"epoch": 0.0322061191626409,
"grad_norm": 9.384853818135273,
"learning_rate": 1.7471264367816093e-06,
"loss": 0.7322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7497715353965759,
"step": 20,
"valid_targets_mean": 6536.2,
"valid_targets_min": 3943
},
{
"epoch": 0.040257648953301126,
"grad_norm": 6.508928535304328,
"learning_rate": 2.206896551724138e-06,
"loss": 0.6848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6616116762161255,
"step": 25,
"valid_targets_mean": 6144.0,
"valid_targets_min": 1873
},
{
"epoch": 0.04830917874396135,
"grad_norm": 4.939706725980711,
"learning_rate": 2.666666666666667e-06,
"loss": 0.6527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6172756552696228,
"step": 30,
"valid_targets_mean": 5658.6,
"valid_targets_min": 3195
},
{
"epoch": 0.05636070853462158,
"grad_norm": 2.5910555463911815,
"learning_rate": 3.1264367816091956e-06,
"loss": 0.626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6274504065513611,
"step": 35,
"valid_targets_mean": 5992.8,
"valid_targets_min": 3207
},
{
"epoch": 0.0644122383252818,
"grad_norm": 1.7689592025893621,
"learning_rate": 3.5862068965517243e-06,
"loss": 0.576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6012336015701294,
"step": 40,
"valid_targets_mean": 5498.4,
"valid_targets_min": 2385
},
{
"epoch": 0.07246376811594203,
"grad_norm": 1.3230501227984852,
"learning_rate": 4.0459770114942535e-06,
"loss": 0.5463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5329886078834534,
"step": 45,
"valid_targets_mean": 6101.3,
"valid_targets_min": 2571
},
{
"epoch": 0.08051529790660225,
"grad_norm": 1.1549301298631403,
"learning_rate": 4.505747126436782e-06,
"loss": 0.5354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5498359203338623,
"step": 50,
"valid_targets_mean": 5591.6,
"valid_targets_min": 436
},
{
"epoch": 0.08856682769726248,
"grad_norm": 0.9148612268441723,
"learning_rate": 4.965517241379311e-06,
"loss": 0.5173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5667314529418945,
"step": 55,
"valid_targets_mean": 7175.1,
"valid_targets_min": 3309
},
{
"epoch": 0.0966183574879227,
"grad_norm": 0.9051707439274824,
"learning_rate": 5.42528735632184e-06,
"loss": 0.4999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49746763706207275,
"step": 60,
"valid_targets_mean": 5700.9,
"valid_targets_min": 1417
},
{
"epoch": 0.10466988727858294,
"grad_norm": 0.7105966724914392,
"learning_rate": 5.8850574712643685e-06,
"loss": 0.4905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49637746810913086,
"step": 65,
"valid_targets_mean": 6462.1,
"valid_targets_min": 3176
},
{
"epoch": 0.11272141706924316,
"grad_norm": 0.6112534858050221,
"learning_rate": 6.344827586206898e-06,
"loss": 0.483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44268643856048584,
"step": 70,
"valid_targets_mean": 6671.4,
"valid_targets_min": 2978
},
{
"epoch": 0.12077294685990338,
"grad_norm": 0.6428768043018936,
"learning_rate": 6.804597701149426e-06,
"loss": 0.4662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4915180206298828,
"step": 75,
"valid_targets_mean": 5441.8,
"valid_targets_min": 2285
},
{
"epoch": 0.1288244766505636,
"grad_norm": 0.9646038113879557,
"learning_rate": 7.264367816091955e-06,
"loss": 0.4314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43008822202682495,
"step": 80,
"valid_targets_mean": 5118.4,
"valid_targets_min": 2205
},
{
"epoch": 0.13687600644122383,
"grad_norm": 1.4574457159646115,
"learning_rate": 7.724137931034483e-06,
"loss": 0.615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6628851890563965,
"step": 85,
"valid_targets_mean": 2431.5,
"valid_targets_min": 1052
},
{
"epoch": 0.14492753623188406,
"grad_norm": 1.041883232166695,
"learning_rate": 8.183908045977013e-06,
"loss": 0.701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6815399527549744,
"step": 90,
"valid_targets_mean": 3045.8,
"valid_targets_min": 1348
},
{
"epoch": 0.1529790660225443,
"grad_norm": 0.8494250273002256,
"learning_rate": 8.643678160919541e-06,
"loss": 0.6405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6369081735610962,
"step": 95,
"valid_targets_mean": 3644.5,
"valid_targets_min": 1127
},
{
"epoch": 0.1610305958132045,
"grad_norm": 0.8637751062370636,
"learning_rate": 9.10344827586207e-06,
"loss": 0.6437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6281415224075317,
"step": 100,
"valid_targets_mean": 2985.6,
"valid_targets_min": 1353
},
{
"epoch": 0.16908212560386474,
"grad_norm": 0.7659577551413557,
"learning_rate": 9.563218390804598e-06,
"loss": 0.5845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5499722957611084,
"step": 105,
"valid_targets_mean": 4235.5,
"valid_targets_min": 1153
},
{
"epoch": 0.17713365539452497,
"grad_norm": 0.8658771361706771,
"learning_rate": 1.0022988505747126e-05,
"loss": 0.6017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6165111660957336,
"step": 110,
"valid_targets_mean": 3142.8,
"valid_targets_min": 1555
},
{
"epoch": 0.18518518518518517,
"grad_norm": 0.7434733707474204,
"learning_rate": 1.0482758620689658e-05,
"loss": 0.5981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5669258832931519,
"step": 115,
"valid_targets_mean": 3279.6,
"valid_targets_min": 1283
},
{
"epoch": 0.1932367149758454,
"grad_norm": 0.8722216577271487,
"learning_rate": 1.0942528735632186e-05,
"loss": 0.6172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6591456532478333,
"step": 120,
"valid_targets_mean": 2693.6,
"valid_targets_min": 1497
},
{
"epoch": 0.20128824476650564,
"grad_norm": 0.8310182578313449,
"learning_rate": 1.1402298850574713e-05,
"loss": 0.5898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5488319396972656,
"step": 125,
"valid_targets_mean": 2785.3,
"valid_targets_min": 1343
},
{
"epoch": 0.20933977455716588,
"grad_norm": 0.9235409692277453,
"learning_rate": 1.1862068965517241e-05,
"loss": 0.6038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6315065622329712,
"step": 130,
"valid_targets_mean": 2680.9,
"valid_targets_min": 1319
},
{
"epoch": 0.21739130434782608,
"grad_norm": 0.7693874973200193,
"learning_rate": 1.2321839080459773e-05,
"loss": 0.5719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5175089836120605,
"step": 135,
"valid_targets_mean": 3356.8,
"valid_targets_min": 1216
},
{
"epoch": 0.22544283413848631,
"grad_norm": 0.926054709365038,
"learning_rate": 1.2781609195402301e-05,
"loss": 0.5767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.59300696849823,
"step": 140,
"valid_targets_mean": 2648.8,
"valid_targets_min": 1013
},
{
"epoch": 0.23349436392914655,
"grad_norm": 0.7436423550718153,
"learning_rate": 1.324137931034483e-05,
"loss": 0.5838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5333613157272339,
"step": 145,
"valid_targets_mean": 3610.2,
"valid_targets_min": 1346
},
{
"epoch": 0.24154589371980675,
"grad_norm": 0.8771301167213914,
"learning_rate": 1.3701149425287356e-05,
"loss": 0.5807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5605872869491577,
"step": 150,
"valid_targets_mean": 2815.4,
"valid_targets_min": 1085
},
{
"epoch": 0.249597423510467,
"grad_norm": 0.7265522281955346,
"learning_rate": 1.4160919540229888e-05,
"loss": 0.5597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5334085822105408,
"step": 155,
"valid_targets_mean": 3536.7,
"valid_targets_min": 1598
},
{
"epoch": 0.2576489533011272,
"grad_norm": 0.8637169240692523,
"learning_rate": 1.4620689655172416e-05,
"loss": 0.5512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5399806499481201,
"step": 160,
"valid_targets_mean": 2561.4,
"valid_targets_min": 1339
},
{
"epoch": 0.26570048309178745,
"grad_norm": 0.7684987940501175,
"learning_rate": 1.5080459770114944e-05,
"loss": 0.5561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5099571943283081,
"step": 165,
"valid_targets_mean": 2889.4,
"valid_targets_min": 1076
},
{
"epoch": 0.27375201288244766,
"grad_norm": 1.2443263629609338,
"learning_rate": 1.5540229885057473e-05,
"loss": 0.5758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5990105271339417,
"step": 170,
"valid_targets_mean": 2557.4,
"valid_targets_min": 1094
},
{
"epoch": 0.28180354267310787,
"grad_norm": 0.7025661086648686,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.5516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5607724785804749,
"step": 175,
"valid_targets_mean": 3530.8,
"valid_targets_min": 1290
},
{
"epoch": 0.2898550724637681,
"grad_norm": 0.9299035150917279,
"learning_rate": 1.645977011494253e-05,
"loss": 0.5504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5684704184532166,
"step": 180,
"valid_targets_mean": 2579.7,
"valid_targets_min": 1229
},
{
"epoch": 0.29790660225442833,
"grad_norm": 0.9029683337889093,
"learning_rate": 1.691954022988506e-05,
"loss": 0.5549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5909307599067688,
"step": 185,
"valid_targets_mean": 3024.5,
"valid_targets_min": 1126
},
{
"epoch": 0.3059581320450886,
"grad_norm": 0.7196257441971349,
"learning_rate": 1.7379310344827586e-05,
"loss": 0.533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5063704252243042,
"step": 190,
"valid_targets_mean": 3523.4,
"valid_targets_min": 1277
},
{
"epoch": 0.3140096618357488,
"grad_norm": 0.7255462834778044,
"learning_rate": 1.7839080459770116e-05,
"loss": 0.5285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5233041644096375,
"step": 195,
"valid_targets_mean": 3317.8,
"valid_targets_min": 1389
},
{
"epoch": 0.322061191626409,
"grad_norm": 0.8908272457952328,
"learning_rate": 1.8298850574712646e-05,
"loss": 0.566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5723013877868652,
"step": 200,
"valid_targets_mean": 2728.8,
"valid_targets_min": 1062
},
{
"epoch": 0.33011272141706927,
"grad_norm": 0.7237478954756121,
"learning_rate": 1.8758620689655173e-05,
"loss": 0.5403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.488622784614563,
"step": 205,
"valid_targets_mean": 3474.4,
"valid_targets_min": 1520
},
{
"epoch": 0.33816425120772947,
"grad_norm": 0.9731721468625133,
"learning_rate": 1.9218390804597703e-05,
"loss": 0.5479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5853530168533325,
"step": 210,
"valid_targets_mean": 2857.8,
"valid_targets_min": 1154
},
{
"epoch": 0.3462157809983897,
"grad_norm": 0.8620329842750755,
"learning_rate": 1.9678160919540233e-05,
"loss": 0.5582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5213043689727783,
"step": 215,
"valid_targets_mean": 2419.3,
"valid_targets_min": 1115
},
{
"epoch": 0.35426731078904994,
"grad_norm": 0.9094077963820549,
"learning_rate": 2.013793103448276e-05,
"loss": 0.5365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5487880706787109,
"step": 220,
"valid_targets_mean": 2817.8,
"valid_targets_min": 1383
},
{
"epoch": 0.36231884057971014,
"grad_norm": 0.7944146685277702,
"learning_rate": 2.059770114942529e-05,
"loss": 0.5477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5611993074417114,
"step": 225,
"valid_targets_mean": 2906.6,
"valid_targets_min": 1414
},
{
"epoch": 0.37037037037037035,
"grad_norm": 0.8404791965077937,
"learning_rate": 2.1057471264367816e-05,
"loss": 0.5326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5319218635559082,
"step": 230,
"valid_targets_mean": 2699.4,
"valid_targets_min": 1140
},
{
"epoch": 0.3784219001610306,
"grad_norm": 0.7398954624086636,
"learning_rate": 2.1517241379310346e-05,
"loss": 0.5158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5021366477012634,
"step": 235,
"valid_targets_mean": 3474.1,
"valid_targets_min": 1060
},
{
"epoch": 0.3864734299516908,
"grad_norm": 0.6565950720543745,
"learning_rate": 2.1977011494252873e-05,
"loss": 0.516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4567714333534241,
"step": 240,
"valid_targets_mean": 4942.6,
"valid_targets_min": 1358
},
{
"epoch": 0.394524959742351,
"grad_norm": 0.7843837006160241,
"learning_rate": 2.2436781609195406e-05,
"loss": 0.5148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.525688886642456,
"step": 245,
"valid_targets_mean": 3203.9,
"valid_targets_min": 1109
},
{
"epoch": 0.4025764895330113,
"grad_norm": 0.786413171985749,
"learning_rate": 2.2896551724137933e-05,
"loss": 0.4953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5001181364059448,
"step": 250,
"valid_targets_mean": 2741.4,
"valid_targets_min": 990
},
{
"epoch": 0.4106280193236715,
"grad_norm": 0.9340749614199906,
"learning_rate": 2.3356321839080463e-05,
"loss": 0.5043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5208650827407837,
"step": 255,
"valid_targets_mean": 2505.7,
"valid_targets_min": 1217
},
{
"epoch": 0.41867954911433175,
"grad_norm": 0.7974854363515583,
"learning_rate": 2.381609195402299e-05,
"loss": 0.4952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4734256863594055,
"step": 260,
"valid_targets_mean": 2908.2,
"valid_targets_min": 977
},
{
"epoch": 0.42673107890499196,
"grad_norm": 0.7083832787574131,
"learning_rate": 2.427586206896552e-05,
"loss": 0.4563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4569528102874756,
"step": 265,
"valid_targets_mean": 3492.0,
"valid_targets_min": 1549
},
{
"epoch": 0.43478260869565216,
"grad_norm": 0.8471307752430234,
"learning_rate": 2.4735632183908046e-05,
"loss": 0.4805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4980763792991638,
"step": 270,
"valid_targets_mean": 2432.0,
"valid_targets_min": 838
},
{
"epoch": 0.4428341384863124,
"grad_norm": 0.7581722015778103,
"learning_rate": 2.5195402298850576e-05,
"loss": 0.4698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4556068778038025,
"step": 275,
"valid_targets_mean": 3069.9,
"valid_targets_min": 269
},
{
"epoch": 0.45088566827697263,
"grad_norm": 0.7647100815494069,
"learning_rate": 2.5655172413793103e-05,
"loss": 0.5029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5297585725784302,
"step": 280,
"valid_targets_mean": 3644.1,
"valid_targets_min": 1308
},
{
"epoch": 0.45893719806763283,
"grad_norm": 0.6888367368546122,
"learning_rate": 2.6114942528735636e-05,
"loss": 0.4635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4325258135795593,
"step": 285,
"valid_targets_mean": 3538.7,
"valid_targets_min": 865
},
{
"epoch": 0.4669887278582931,
"grad_norm": 0.7918334936431798,
"learning_rate": 2.6574712643678166e-05,
"loss": 0.4829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48796749114990234,
"step": 290,
"valid_targets_mean": 2789.2,
"valid_targets_min": 1084
},
{
"epoch": 0.4750402576489533,
"grad_norm": 0.8297680238669458,
"learning_rate": 2.7034482758620693e-05,
"loss": 0.5134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47267746925354004,
"step": 295,
"valid_targets_mean": 2663.7,
"valid_targets_min": 1007
},
{
"epoch": 0.4830917874396135,
"grad_norm": 0.6633379830429746,
"learning_rate": 2.749425287356322e-05,
"loss": 0.4589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49964243173599243,
"step": 300,
"valid_targets_mean": 3865.0,
"valid_targets_min": 556
},
{
"epoch": 0.49114331723027377,
"grad_norm": 0.6267750181705374,
"learning_rate": 2.795402298850575e-05,
"loss": 0.4686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44949406385421753,
"step": 305,
"valid_targets_mean": 4117.5,
"valid_targets_min": 1094
},
{
"epoch": 0.499194847020934,
"grad_norm": 0.705425101438482,
"learning_rate": 2.8413793103448276e-05,
"loss": 0.4443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4142606258392334,
"step": 310,
"valid_targets_mean": 3565.3,
"valid_targets_min": 333
},
{
"epoch": 0.5072463768115942,
"grad_norm": 0.6719556250206123,
"learning_rate": 2.8873563218390806e-05,
"loss": 0.4748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46530526876449585,
"step": 315,
"valid_targets_mean": 3507.9,
"valid_targets_min": 1135
},
{
"epoch": 0.5152979066022544,
"grad_norm": 0.7129427212893642,
"learning_rate": 2.9333333333333333e-05,
"loss": 0.4742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4753148555755615,
"step": 320,
"valid_targets_mean": 3822.9,
"valid_targets_min": 428
},
{
"epoch": 0.5233494363929146,
"grad_norm": 0.7453050849315828,
"learning_rate": 2.9793103448275866e-05,
"loss": 0.4602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4605864882469177,
"step": 325,
"valid_targets_mean": 2932.9,
"valid_targets_min": 1398
},
{
"epoch": 0.5314009661835749,
"grad_norm": 0.6416359264690352,
"learning_rate": 3.0252873563218396e-05,
"loss": 0.4427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3964742124080658,
"step": 330,
"valid_targets_mean": 3473.2,
"valid_targets_min": 1265
},
{
"epoch": 0.5394524959742351,
"grad_norm": 0.8091118683339827,
"learning_rate": 3.071264367816092e-05,
"loss": 0.4865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5222635269165039,
"step": 335,
"valid_targets_mean": 2707.5,
"valid_targets_min": 1453
},
{
"epoch": 0.5475040257648953,
"grad_norm": 0.6475514263706704,
"learning_rate": 3.117241379310345e-05,
"loss": 0.468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4403412640094757,
"step": 340,
"valid_targets_mean": 3770.1,
"valid_targets_min": 1554
},
{
"epoch": 0.5555555555555556,
"grad_norm": 0.6905557475577746,
"learning_rate": 3.1632183908045976e-05,
"loss": 0.4429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42495399713516235,
"step": 345,
"valid_targets_mean": 3687.9,
"valid_targets_min": 1423
},
{
"epoch": 0.5636070853462157,
"grad_norm": 0.7104740968387137,
"learning_rate": 3.2091954022988506e-05,
"loss": 0.455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43538206815719604,
"step": 350,
"valid_targets_mean": 3580.0,
"valid_targets_min": 1778
},
{
"epoch": 0.571658615136876,
"grad_norm": 0.7499873582780294,
"learning_rate": 3.2551724137931036e-05,
"loss": 0.471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42534762620925903,
"step": 355,
"valid_targets_mean": 3154.2,
"valid_targets_min": 1070
},
{
"epoch": 0.5797101449275363,
"grad_norm": 0.6642445186064259,
"learning_rate": 3.3011494252873566e-05,
"loss": 0.4456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45597341656684875,
"step": 360,
"valid_targets_mean": 3442.1,
"valid_targets_min": 1222
},
{
"epoch": 0.5877616747181964,
"grad_norm": 0.9240276056077943,
"learning_rate": 3.3471264367816096e-05,
"loss": 0.4582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46805498003959656,
"step": 365,
"valid_targets_mean": 2991.2,
"valid_targets_min": 1344
},
{
"epoch": 0.5958132045088567,
"grad_norm": 0.7060945620088765,
"learning_rate": 3.3931034482758626e-05,
"loss": 0.4711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42430639266967773,
"step": 370,
"valid_targets_mean": 3584.1,
"valid_targets_min": 1080
},
{
"epoch": 0.6038647342995169,
"grad_norm": 0.6951756292278192,
"learning_rate": 3.4390804597701156e-05,
"loss": 0.435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4317897856235504,
"step": 375,
"valid_targets_mean": 3283.6,
"valid_targets_min": 1136
},
{
"epoch": 0.6119162640901772,
"grad_norm": 0.6929947538123722,
"learning_rate": 3.485057471264368e-05,
"loss": 0.4654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44339442253112793,
"step": 380,
"valid_targets_mean": 3267.1,
"valid_targets_min": 1469
},
{
"epoch": 0.6199677938808373,
"grad_norm": 0.59684922350695,
"learning_rate": 3.531034482758621e-05,
"loss": 0.4385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38249504566192627,
"step": 385,
"valid_targets_mean": 4220.8,
"valid_targets_min": 1141
},
{
"epoch": 0.6280193236714976,
"grad_norm": 0.6361797000665275,
"learning_rate": 3.577011494252874e-05,
"loss": 0.4499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42138925194740295,
"step": 390,
"valid_targets_mean": 3403.3,
"valid_targets_min": 1315
},
{
"epoch": 0.6360708534621579,
"grad_norm": 0.7553402257839422,
"learning_rate": 3.622988505747126e-05,
"loss": 0.4251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.415188193321228,
"step": 395,
"valid_targets_mean": 3994.0,
"valid_targets_min": 1243
},
{
"epoch": 0.644122383252818,
"grad_norm": 0.7840399240091517,
"learning_rate": 3.668965517241379e-05,
"loss": 0.4666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4885357618331909,
"step": 400,
"valid_targets_mean": 2728.6,
"valid_targets_min": 1205
},
{
"epoch": 0.6521739130434783,
"grad_norm": 0.7737252334457005,
"learning_rate": 3.714942528735633e-05,
"loss": 0.4453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4366183876991272,
"step": 405,
"valid_targets_mean": 2805.7,
"valid_targets_min": 1316
},
{
"epoch": 0.6602254428341385,
"grad_norm": 0.8020067156942912,
"learning_rate": 3.760919540229885e-05,
"loss": 0.4458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4633807837963104,
"step": 410,
"valid_targets_mean": 3165.5,
"valid_targets_min": 1339
},
{
"epoch": 0.6682769726247987,
"grad_norm": 0.7674549160676873,
"learning_rate": 3.806896551724138e-05,
"loss": 0.4431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4483141601085663,
"step": 415,
"valid_targets_mean": 2954.1,
"valid_targets_min": 1158
},
{
"epoch": 0.6763285024154589,
"grad_norm": 0.6203648387560737,
"learning_rate": 3.852873563218391e-05,
"loss": 0.4338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4143407642841339,
"step": 420,
"valid_targets_mean": 4536.0,
"valid_targets_min": 1647
},
{
"epoch": 0.6843800322061192,
"grad_norm": 0.6999255524103093,
"learning_rate": 3.898850574712644e-05,
"loss": 0.4453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41560059785842896,
"step": 425,
"valid_targets_mean": 3440.9,
"valid_targets_min": 1237
},
{
"epoch": 0.6924315619967794,
"grad_norm": 0.7359356732077772,
"learning_rate": 3.9448275862068966e-05,
"loss": 0.4852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4889700412750244,
"step": 430,
"valid_targets_mean": 3381.9,
"valid_targets_min": 1538
},
{
"epoch": 0.7004830917874396,
"grad_norm": 0.6434530063256044,
"learning_rate": 3.9908045977011496e-05,
"loss": 0.438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43669044971466064,
"step": 435,
"valid_targets_mean": 4124.1,
"valid_targets_min": 1524
},
{
"epoch": 0.7085346215780999,
"grad_norm": 0.7259157801334376,
"learning_rate": 3.9999896813789735e-05,
"loss": 0.4362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46412330865859985,
"step": 440,
"valid_targets_mean": 3666.5,
"valid_targets_min": 1144
},
{
"epoch": 0.71658615136876,
"grad_norm": 0.6920837839026965,
"learning_rate": 3.999947762163533e-05,
"loss": 0.4364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4421723783016205,
"step": 445,
"valid_targets_mean": 3813.6,
"valid_targets_min": 1150
},
{
"epoch": 0.7246376811594203,
"grad_norm": 0.8229582070019114,
"learning_rate": 3.999873598115203e-05,
"loss": 0.4244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4543113112449646,
"step": 450,
"valid_targets_mean": 3184.7,
"valid_targets_min": 1064
},
{
"epoch": 0.7326892109500805,
"grad_norm": 0.6618965870642886,
"learning_rate": 3.999767190429718e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4174274504184723,
"step": 455,
"valid_targets_mean": 3734.6,
"valid_targets_min": 1689
},
{
"epoch": 0.7407407407407407,
"grad_norm": 0.7350636189187817,
"learning_rate": 3.99962854082267e-05,
"loss": 0.4358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45041102170944214,
"step": 460,
"valid_targets_mean": 3706.6,
"valid_targets_min": 1537
},
{
"epoch": 0.748792270531401,
"grad_norm": 0.6527924396728313,
"learning_rate": 3.9994576515294864e-05,
"loss": 0.4562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44863760471343994,
"step": 465,
"valid_targets_mean": 3998.4,
"valid_targets_min": 1261
},
{
"epoch": 0.7568438003220612,
"grad_norm": 0.7162099025470566,
"learning_rate": 3.999254525305386e-05,
"loss": 0.3562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30241087079048157,
"step": 470,
"valid_targets_mean": 6379.5,
"valid_targets_min": 3100
},
{
"epoch": 0.7648953301127214,
"grad_norm": 0.5518921640398805,
"learning_rate": 3.999019165425341e-05,
"loss": 0.2954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.271371066570282,
"step": 475,
"valid_targets_mean": 5043.8,
"valid_targets_min": 2708
},
{
"epoch": 0.7729468599033816,
"grad_norm": 0.5572299520035154,
"learning_rate": 3.99875157568402e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2725101113319397,
"step": 480,
"valid_targets_mean": 5717.3,
"valid_targets_min": 3191
},
{
"epoch": 0.7809983896940419,
"grad_norm": 0.6593727425698053,
"learning_rate": 3.998451760395729e-05,
"loss": 0.3122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33532363176345825,
"step": 485,
"valid_targets_mean": 6198.8,
"valid_targets_min": 2599
},
{
"epoch": 0.789049919484702,
"grad_norm": 0.4904371382366237,
"learning_rate": 3.99811972439434e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27875158190727234,
"step": 490,
"valid_targets_mean": 5880.9,
"valid_targets_min": 3427
},
{
"epoch": 0.7971014492753623,
"grad_norm": 0.5384641711313225,
"learning_rate": 3.997755473033218e-05,
"loss": 0.2606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27927276492118835,
"step": 495,
"valid_targets_mean": 5429.1,
"valid_targets_min": 3331
},
{
"epoch": 0.8051529790660226,
"grad_norm": 0.4872366354078386,
"learning_rate": 3.997359012185127e-05,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2796809673309326,
"step": 500,
"valid_targets_mean": 5318.9,
"valid_targets_min": 3176
},
{
"epoch": 0.8132045088566827,
"grad_norm": 0.5513399943173102,
"learning_rate": 3.996930348242141e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34563466906547546,
"step": 505,
"valid_targets_mean": 6334.5,
"valid_targets_min": 3200
},
{
"epoch": 0.821256038647343,
"grad_norm": 0.5178713450708176,
"learning_rate": 3.996469488115539e-05,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2517154812812805,
"step": 510,
"valid_targets_mean": 5575.2,
"valid_targets_min": 2982
},
{
"epoch": 0.8293075684380032,
"grad_norm": 0.5354106021483718,
"learning_rate": 3.995976439235694e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2508094310760498,
"step": 515,
"valid_targets_mean": 5045.2,
"valid_targets_min": 2662
},
{
"epoch": 0.8373590982286635,
"grad_norm": 0.5043478969730439,
"learning_rate": 3.995451209551953e-05,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23723244667053223,
"step": 520,
"valid_targets_mean": 5929.9,
"valid_targets_min": 3640
},
{
"epoch": 0.8454106280193237,
"grad_norm": 0.4644833157640728,
"learning_rate": 3.994893807532509e-05,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2522507905960083,
"step": 525,
"valid_targets_mean": 5560.6,
"valid_targets_min": 3146
},
{
"epoch": 0.8534621578099839,
"grad_norm": 0.5528859754209329,
"learning_rate": 3.994304242164265e-05,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2732771635055542,
"step": 530,
"valid_targets_mean": 5438.9,
"valid_targets_min": 3095
},
{
"epoch": 0.8615136876006442,
"grad_norm": 0.475067141876231,
"learning_rate": 3.9936825229526855e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2705361843109131,
"step": 535,
"valid_targets_mean": 6153.6,
"valid_targets_min": 3325
},
{
"epoch": 0.8695652173913043,
"grad_norm": 0.4480740353625752,
"learning_rate": 3.9930286599216506e-05,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25481677055358887,
"step": 540,
"valid_targets_mean": 6176.7,
"valid_targets_min": 3690
},
{
"epoch": 0.8776167471819646,
"grad_norm": 0.5197397102755734,
"learning_rate": 3.9923426636132866e-05,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23781773447990417,
"step": 545,
"valid_targets_mean": 5253.8,
"valid_targets_min": 2926
},
{
"epoch": 0.8856682769726248,
"grad_norm": 0.4625888856613296,
"learning_rate": 3.991624545087801e-05,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22309911251068115,
"step": 550,
"valid_targets_mean": 6097.0,
"valid_targets_min": 3707
},
{
"epoch": 0.893719806763285,
"grad_norm": 0.4887112175957848,
"learning_rate": 3.9908743159233016e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25249046087265015,
"step": 555,
"valid_targets_mean": 5931.1,
"valid_targets_min": 3697
},
{
"epoch": 0.9017713365539453,
"grad_norm": 0.4459880666225944,
"learning_rate": 3.990091988215612e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24061977863311768,
"step": 560,
"valid_targets_mean": 6370.6,
"valid_targets_min": 3665
},
{
"epoch": 0.9098228663446055,
"grad_norm": 0.5441022062942001,
"learning_rate": 3.989277574578074e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26900017261505127,
"step": 565,
"valid_targets_mean": 6119.8,
"valid_targets_min": 2561
},
{
"epoch": 0.9178743961352657,
"grad_norm": 0.5238796115702521,
"learning_rate": 3.9884310881413473e-05,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24351592361927032,
"step": 570,
"valid_targets_mean": 5352.8,
"valid_targets_min": 3838
},
{
"epoch": 0.9259259259259259,
"grad_norm": 0.4638163386116075,
"learning_rate": 3.987552542553194e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24837109446525574,
"step": 575,
"valid_targets_mean": 6064.1,
"valid_targets_min": 2800
},
{
"epoch": 0.9339774557165862,
"grad_norm": 0.4296037881388161,
"learning_rate": 3.9866419519782636e-05,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21541734039783478,
"step": 580,
"valid_targets_mean": 6725.1,
"valid_targets_min": 4014
},
{
"epoch": 0.9420289855072463,
"grad_norm": 0.5667563203419782,
"learning_rate": 3.985699331097858e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25082963705062866,
"step": 585,
"valid_targets_mean": 5340.4,
"valid_targets_min": 3261
},
{
"epoch": 0.9500805152979066,
"grad_norm": 0.44699582805642185,
"learning_rate": 3.984724695109702e-05,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24760377407073975,
"step": 590,
"valid_targets_mean": 6194.7,
"valid_targets_min": 3579
},
{
"epoch": 0.9581320450885669,
"grad_norm": 0.4523900544730103,
"learning_rate": 3.983718059727693e-05,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22146061062812805,
"step": 595,
"valid_targets_mean": 6527.8,
"valid_targets_min": 2379
},
{
"epoch": 0.966183574879227,
"grad_norm": 0.39826806360509687,
"learning_rate": 3.9826794411816495e-05,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23311802744865417,
"step": 600,
"valid_targets_mean": 6887.7,
"valid_targets_min": 3569
},
{
"epoch": 0.9742351046698873,
"grad_norm": 0.6229816324333505,
"learning_rate": 3.981608856217049e-05,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21930500864982605,
"step": 605,
"valid_targets_mean": 5398.8,
"valid_targets_min": 2580
},
{
"epoch": 0.9822866344605475,
"grad_norm": 0.4999823141609161,
"learning_rate": 3.980506322094761e-05,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2858148217201233,
"step": 610,
"valid_targets_mean": 6136.1,
"valid_targets_min": 2610
},
{
"epoch": 0.9903381642512077,
"grad_norm": 0.46445064808991693,
"learning_rate": 3.979371856590762e-05,
"loss": 0.2405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21342137455940247,
"step": 615,
"valid_targets_mean": 5957.4,
"valid_targets_min": 2562
},
{
"epoch": 0.998389694041868,
"grad_norm": 0.5766730357055111,
"learning_rate": 3.978205477995856e-05,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23376914858818054,
"step": 620,
"valid_targets_mean": 5860.3,
"valid_targets_min": 2833
},
{
"epoch": 1.0064412238325282,
"grad_norm": 0.5381872293931007,
"learning_rate": 3.9770072051153754e-05,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38717740774154663,
"step": 625,
"valid_targets_mean": 5898.7,
"valid_targets_min": 2769
},
{
"epoch": 1.0144927536231885,
"grad_norm": 0.5254280438649158,
"learning_rate": 3.9757770572688786e-05,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3415398895740509,
"step": 630,
"valid_targets_mean": 6068.6,
"valid_targets_min": 2285
},
{
"epoch": 1.0225442834138487,
"grad_norm": 0.48064107372040804,
"learning_rate": 3.9745150542898405e-05,
"loss": 0.3506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36373406648635864,
"step": 635,
"valid_targets_mean": 6519.8,
"valid_targets_min": 3314
},
{
"epoch": 1.0305958132045088,
"grad_norm": 0.4867942399417131,
"learning_rate": 3.97322121652533e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33237212896347046,
"step": 640,
"valid_targets_mean": 6028.6,
"valid_targets_min": 2671
},
{
"epoch": 1.038647342995169,
"grad_norm": 0.5535759217279507,
"learning_rate": 3.971895564835683e-05,
"loss": 0.3405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36408573389053345,
"step": 645,
"valid_targets_mean": 6266.9,
"valid_targets_min": 469
},
{
"epoch": 1.0466988727858293,
"grad_norm": 0.5234567604492989,
"learning_rate": 3.970538120594166e-05,
"loss": 0.3275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30862703919410706,
"step": 650,
"valid_targets_mean": 5759.1,
"valid_targets_min": 2568
},
{
"epoch": 1.0547504025764896,
"grad_norm": 0.5104944272693731,
"learning_rate": 3.9691489056866324e-05,
"loss": 0.335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31290531158447266,
"step": 655,
"valid_targets_mean": 5530.2,
"valid_targets_min": 611
},
{
"epoch": 1.0628019323671498,
"grad_norm": 0.4962198988376796,
"learning_rate": 3.9677279425111684e-05,
"loss": 0.3172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.292328417301178,
"step": 660,
"valid_targets_mean": 5696.9,
"valid_targets_min": 2392
},
{
"epoch": 1.07085346215781,
"grad_norm": 0.4883167094213102,
"learning_rate": 3.9662752539777314e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3085409700870514,
"step": 665,
"valid_targets_mean": 5683.9,
"valid_targets_min": 1285
},
{
"epoch": 1.0789049919484701,
"grad_norm": 0.45277731991583026,
"learning_rate": 3.9647908635077845e-05,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27562692761421204,
"step": 670,
"valid_targets_mean": 6331.4,
"valid_targets_min": 3356
},
{
"epoch": 1.0869565217391304,
"grad_norm": 0.5167803974967058,
"learning_rate": 3.963274795033913e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28318291902542114,
"step": 675,
"valid_targets_mean": 5326.1,
"valid_targets_min": 1676
},
{
"epoch": 1.0950080515297906,
"grad_norm": 0.5095041080696596,
"learning_rate": 3.9617270729994436e-05,
"loss": 0.3183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3311567008495331,
"step": 680,
"valid_targets_mean": 6448.9,
"valid_targets_min": 2859
},
{
"epoch": 1.103059581320451,
"grad_norm": 0.49987418312419335,
"learning_rate": 3.960147722358046e-05,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3058398962020874,
"step": 685,
"valid_targets_mean": 5910.2,
"valid_targets_min": 1417
},
{
"epoch": 1.1111111111111112,
"grad_norm": 0.4553139112077016,
"learning_rate": 3.958536768573335e-05,
"loss": 0.3275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3590342402458191,
"step": 690,
"valid_targets_mean": 7141.1,
"valid_targets_min": 3571
},
{
"epoch": 1.1191626409017714,
"grad_norm": 0.4708599542937082,
"learning_rate": 3.956894237618456e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32140040397644043,
"step": 695,
"valid_targets_mean": 6492.9,
"valid_targets_min": 3446
},
{
"epoch": 1.1272141706924317,
"grad_norm": 0.48610528051988894,
"learning_rate": 3.955220155975669e-05,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26136165857315063,
"step": 700,
"valid_targets_mean": 5447.6,
"valid_targets_min": 306
},
{
"epoch": 1.1352657004830917,
"grad_norm": 0.7998551023631064,
"learning_rate": 3.9535145506359206e-05,
"loss": 0.4179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4753114581108093,
"step": 705,
"valid_targets_mean": 3657.8,
"valid_targets_min": 1050
},
{
"epoch": 1.143317230273752,
"grad_norm": 0.8628326452111007,
"learning_rate": 3.951777449098408e-05,
"loss": 0.5288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5633917450904846,
"step": 710,
"valid_targets_mean": 2673.1,
"valid_targets_min": 1309
},
{
"epoch": 1.1513687600644122,
"grad_norm": 0.8324627405108382,
"learning_rate": 3.9500088793701387e-05,
"loss": 0.4929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4774799644947052,
"step": 715,
"valid_targets_mean": 3209.7,
"valid_targets_min": 1155
},
{
"epoch": 1.1594202898550725,
"grad_norm": 0.802960087915467,
"learning_rate": 3.948208869965473e-05,
"loss": 0.5032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5248502492904663,
"step": 720,
"valid_targets_mean": 3054.8,
"valid_targets_min": 1099
},
{
"epoch": 1.1674718196457328,
"grad_norm": 0.7752102610736108,
"learning_rate": 3.946377449905672e-05,
"loss": 0.4698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45278412103652954,
"step": 725,
"valid_targets_mean": 2978.8,
"valid_targets_min": 1175
},
{
"epoch": 1.1755233494363928,
"grad_norm": 0.7774619112330354,
"learning_rate": 3.9445146487184226e-05,
"loss": 0.4626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4363817572593689,
"step": 730,
"valid_targets_mean": 2849.6,
"valid_targets_min": 1295
},
{
"epoch": 1.183574879227053,
"grad_norm": 1.1474142413076773,
"learning_rate": 3.942620496437366e-05,
"loss": 0.4836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.519567608833313,
"step": 735,
"valid_targets_mean": 2615.8,
"valid_targets_min": 1383
},
{
"epoch": 1.1916264090177133,
"grad_norm": 0.7140245197333289,
"learning_rate": 3.940695023601612e-05,
"loss": 0.482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49396196007728577,
"step": 740,
"valid_targets_mean": 3296.4,
"valid_targets_min": 1316
},
{
"epoch": 1.1996779388083736,
"grad_norm": 0.6546808722676869,
"learning_rate": 3.938738261255247e-05,
"loss": 0.4933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46171700954437256,
"step": 745,
"valid_targets_mean": 3968.6,
"valid_targets_min": 1383
},
{
"epoch": 1.2077294685990339,
"grad_norm": 0.8090731054477709,
"learning_rate": 3.9367502409468315e-05,
"loss": 0.4818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5525240898132324,
"step": 750,
"valid_targets_mean": 3078.5,
"valid_targets_min": 1174
},
{
"epoch": 1.2157809983896941,
"grad_norm": 0.6725814967283812,
"learning_rate": 3.934730994728893e-05,
"loss": 0.4887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44579121470451355,
"step": 755,
"valid_targets_mean": 3417.5,
"valid_targets_min": 1252
},
{
"epoch": 1.2238325281803544,
"grad_norm": 0.7197375797510343,
"learning_rate": 3.932680555157413e-05,
"loss": 0.4645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5104143619537354,
"step": 760,
"valid_targets_mean": 3427.6,
"valid_targets_min": 1218
},
{
"epoch": 1.2318840579710144,
"grad_norm": 0.8543242804532502,
"learning_rate": 3.9305989552912936e-05,
"loss": 0.4923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5740408897399902,
"step": 765,
"valid_targets_mean": 2875.2,
"valid_targets_min": 1123
},
{
"epoch": 1.2399355877616747,
"grad_norm": 0.832686925614947,
"learning_rate": 3.928486228691831e-05,
"loss": 0.4789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.498767614364624,
"step": 770,
"valid_targets_mean": 2933.1,
"valid_targets_min": 1485
},
{
"epoch": 1.247987117552335,
"grad_norm": 0.8162275317686818,
"learning_rate": 3.926342409422175e-05,
"loss": 0.474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5068527460098267,
"step": 775,
"valid_targets_mean": 2699.5,
"valid_targets_min": 1170
},
{
"epoch": 1.2560386473429952,
"grad_norm": 0.6180614081605837,
"learning_rate": 3.924167532046773e-05,
"loss": 0.4594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.426825612783432,
"step": 780,
"valid_targets_mean": 3932.2,
"valid_targets_min": 1108
},
{
"epoch": 1.2640901771336555,
"grad_norm": 0.8309975887016753,
"learning_rate": 3.9219616316308215e-05,
"loss": 0.475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48292607069015503,
"step": 785,
"valid_targets_mean": 2747.4,
"valid_targets_min": 1205
},
{
"epoch": 1.2721417069243155,
"grad_norm": 0.829396143340556,
"learning_rate": 3.919724743739694e-05,
"loss": 0.4728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4963272511959076,
"step": 790,
"valid_targets_mean": 3029.8,
"valid_targets_min": 1355
},
{
"epoch": 1.2801932367149758,
"grad_norm": 0.7797044579353001,
"learning_rate": 3.91745690443837e-05,
"loss": 0.471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4795590937137604,
"step": 795,
"valid_targets_mean": 3227.2,
"valid_targets_min": 1427
},
{
"epoch": 1.288244766505636,
"grad_norm": 0.7154505490752525,
"learning_rate": 3.915158150290855e-05,
"loss": 0.4652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4680216312408447,
"step": 800,
"valid_targets_mean": 3224.4,
"valid_targets_min": 1045
},
{
"epoch": 1.2962962962962963,
"grad_norm": 0.6366798215464128,
"learning_rate": 3.912828518359588e-05,
"loss": 0.4689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4367047846317291,
"step": 805,
"valid_targets_mean": 4021.2,
"valid_targets_min": 1118
},
{
"epoch": 1.3043478260869565,
"grad_norm": 0.7245476673199482,
"learning_rate": 3.910468046204846e-05,
"loss": 0.4691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41532838344573975,
"step": 810,
"valid_targets_mean": 3145.9,
"valid_targets_min": 977
},
{
"epoch": 1.3123993558776168,
"grad_norm": 0.965081597376756,
"learning_rate": 3.908076771884139e-05,
"loss": 0.4461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47352737188339233,
"step": 815,
"valid_targets_mean": 2583.8,
"valid_targets_min": 1167
},
{
"epoch": 1.320450885668277,
"grad_norm": 0.7363364439864812,
"learning_rate": 3.905654733951595e-05,
"loss": 0.4784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4524630904197693,
"step": 820,
"valid_targets_mean": 3109.6,
"valid_targets_min": 1268
},
{
"epoch": 1.3285024154589373,
"grad_norm": 0.7636753657586481,
"learning_rate": 3.9032019714573366e-05,
"loss": 0.4786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4579421281814575,
"step": 825,
"valid_targets_mean": 2516.6,
"valid_targets_min": 1159
},
{
"epoch": 1.3365539452495974,
"grad_norm": 0.6680520600678994,
"learning_rate": 3.9007185239468554e-05,
"loss": 0.456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4591274857521057,
"step": 830,
"valid_targets_mean": 4016.8,
"valid_targets_min": 1642
},
{
"epoch": 1.3446054750402576,
"grad_norm": 0.7001951095419365,
"learning_rate": 3.8982044314603725e-05,
"loss": 0.4926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4835224151611328,
"step": 835,
"valid_targets_mean": 3258.7,
"valid_targets_min": 1158
},
{
"epoch": 1.3526570048309179,
"grad_norm": 0.6740616815716441,
"learning_rate": 3.8956597345321927e-05,
"loss": 0.4595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4707792401313782,
"step": 840,
"valid_targets_mean": 3767.5,
"valid_targets_min": 1430
},
{
"epoch": 1.3607085346215781,
"grad_norm": 0.678578864364496,
"learning_rate": 3.893084474190051e-05,
"loss": 0.4685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4893713593482971,
"step": 845,
"valid_targets_mean": 3205.4,
"valid_targets_min": 977
},
{
"epoch": 1.3687600644122382,
"grad_norm": 0.7052919421243395,
"learning_rate": 3.890478691954452e-05,
"loss": 0.465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4288814067840576,
"step": 850,
"valid_targets_mean": 3383.2,
"valid_targets_min": 1706
},
{
"epoch": 1.3768115942028984,
"grad_norm": 0.7065538252025207,
"learning_rate": 3.8878424298379996e-05,
"loss": 0.4327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43889719247817993,
"step": 855,
"valid_targets_mean": 2897.8,
"valid_targets_min": 1102
},
{
"epoch": 1.3848631239935587,
"grad_norm": 0.826059371011481,
"learning_rate": 3.885175730344718e-05,
"loss": 0.4279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.489162802696228,
"step": 860,
"valid_targets_mean": 2376.7,
"valid_targets_min": 1197
},
{
"epoch": 1.392914653784219,
"grad_norm": 0.6534195388501567,
"learning_rate": 3.882478636469372e-05,
"loss": 0.4147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40982362627983093,
"step": 865,
"valid_targets_mean": 3869.4,
"valid_targets_min": 1445
},
{
"epoch": 1.4009661835748792,
"grad_norm": 0.5643024903852305,
"learning_rate": 3.879751191696766e-05,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3592322766780853,
"step": 870,
"valid_targets_mean": 4852.6,
"valid_targets_min": 1536
},
{
"epoch": 1.4090177133655395,
"grad_norm": 0.8046362197064678,
"learning_rate": 3.8769934400010506e-05,
"loss": 0.4132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42762547731399536,
"step": 875,
"valid_targets_mean": 3675.9,
"valid_targets_min": 1260
},
{
"epoch": 1.4170692431561998,
"grad_norm": 0.6344687303861078,
"learning_rate": 3.8742054258450085e-05,
"loss": 0.4197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3801061809062958,
"step": 880,
"valid_targets_mean": 3460.8,
"valid_targets_min": 406
},
{
"epoch": 1.42512077294686,
"grad_norm": 0.6323525098555549,
"learning_rate": 3.871387194179338e-05,
"loss": 0.3821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3990853428840637,
"step": 885,
"valid_targets_mean": 4104.0,
"valid_targets_min": 1569
},
{
"epoch": 1.43317230273752,
"grad_norm": 0.7366585526555239,
"learning_rate": 3.868538790441931e-05,
"loss": 0.3944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39089301228523254,
"step": 890,
"valid_targets_mean": 3000.4,
"valid_targets_min": 1169
},
{
"epoch": 1.4412238325281803,
"grad_norm": 0.6980083863459992,
"learning_rate": 3.865660260557138e-05,
"loss": 0.3997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45632731914520264,
"step": 895,
"valid_targets_mean": 3155.8,
"valid_targets_min": 1407
},
{
"epoch": 1.4492753623188406,
"grad_norm": 0.7473196990397595,
"learning_rate": 3.8627516509350286e-05,
"loss": 0.4058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4090888500213623,
"step": 900,
"valid_targets_mean": 2876.1,
"valid_targets_min": 1097
},
{
"epoch": 1.4573268921095008,
"grad_norm": 0.7252851362258242,
"learning_rate": 3.859813008470644e-05,
"loss": 0.4055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4397547245025635,
"step": 905,
"valid_targets_mean": 3099.4,
"valid_targets_min": 1258
},
{
"epoch": 1.465378421900161,
"grad_norm": 0.8116656536711668,
"learning_rate": 3.856844380543239e-05,
"loss": 0.3953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4384375810623169,
"step": 910,
"valid_targets_mean": 2574.1,
"valid_targets_min": 1351
},
{
"epoch": 1.4734299516908211,
"grad_norm": 0.7311144238819602,
"learning_rate": 3.8538458150155186e-05,
"loss": 0.4362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4589492678642273,
"step": 915,
"valid_targets_mean": 3223.3,
"valid_targets_min": 1314
},
{
"epoch": 1.4814814814814814,
"grad_norm": 0.6970970758853244,
"learning_rate": 3.850817360232869e-05,
"loss": 0.3792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39102041721343994,
"step": 920,
"valid_targets_mean": 3132.0,
"valid_targets_min": 1272
},
{
"epoch": 1.4895330112721417,
"grad_norm": 0.6439455681571239,
"learning_rate": 3.8477590650225735e-05,
"loss": 0.4058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3645486533641815,
"step": 925,
"valid_targets_mean": 3755.3,
"valid_targets_min": 1230
},
{
"epoch": 1.497584541062802,
"grad_norm": 0.7469424687646696,
"learning_rate": 3.8446709786930305e-05,
"loss": 0.3823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36221805214881897,
"step": 930,
"valid_targets_mean": 3029.9,
"valid_targets_min": 1590
},
{
"epoch": 1.5056360708534622,
"grad_norm": 0.7074858488388046,
"learning_rate": 3.841553151032953e-05,
"loss": 0.3914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38697734475135803,
"step": 935,
"valid_targets_mean": 3930.0,
"valid_targets_min": 1734
},
{
"epoch": 1.5136876006441224,
"grad_norm": 0.6408672423143533,
"learning_rate": 3.8384056323105695e-05,
"loss": 0.4006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45191776752471924,
"step": 940,
"valid_targets_mean": 3632.3,
"valid_targets_min": 1021
},
{
"epoch": 1.5217391304347827,
"grad_norm": 0.6999987480130047,
"learning_rate": 3.835228473272814e-05,
"loss": 0.3926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40401631593704224,
"step": 945,
"valid_targets_mean": 3690.8,
"valid_targets_min": 1136
},
{
"epoch": 1.529790660225443,
"grad_norm": 0.7300521054387631,
"learning_rate": 3.832021725144506e-05,
"loss": 0.3856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40716779232025146,
"step": 950,
"valid_targets_mean": 2800.6,
"valid_targets_min": 485
},
{
"epoch": 1.537842190016103,
"grad_norm": 0.7731778429667089,
"learning_rate": 3.828785439627523e-05,
"loss": 0.3912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43859434127807617,
"step": 955,
"valid_targets_mean": 3744.1,
"valid_targets_min": 1267
},
{
"epoch": 1.5458937198067633,
"grad_norm": 0.6705224246744239,
"learning_rate": 3.825519668899972e-05,
"loss": 0.4118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3778587877750397,
"step": 960,
"valid_targets_mean": 3365.1,
"valid_targets_min": 1014
},
{
"epoch": 1.5539452495974235,
"grad_norm": 0.7645910195884874,
"learning_rate": 3.8222244656153444e-05,
"loss": 0.3801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3704504668712616,
"step": 965,
"valid_targets_mean": 3473.1,
"valid_targets_min": 1657
},
{
"epoch": 1.5619967793880838,
"grad_norm": 0.7395785345258863,
"learning_rate": 3.818899882901666e-05,
"loss": 0.3848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4030625820159912,
"step": 970,
"valid_targets_mean": 2840.8,
"valid_targets_min": 1494
},
{
"epoch": 1.5700483091787438,
"grad_norm": 0.736229535025106,
"learning_rate": 3.815545974360644e-05,
"loss": 0.4024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4085889160633087,
"step": 975,
"valid_targets_mean": 2815.1,
"valid_targets_min": 1208
},
{
"epoch": 1.578099838969404,
"grad_norm": 0.7854099739280379,
"learning_rate": 3.812162794066802e-05,
"loss": 0.3743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.379982054233551,
"step": 980,
"valid_targets_mean": 3228.2,
"valid_targets_min": 1394
},
{
"epoch": 1.5861513687600644,
"grad_norm": 0.7315662602632311,
"learning_rate": 3.8087503965666057e-05,
"loss": 0.3898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40219753980636597,
"step": 985,
"valid_targets_mean": 3174.3,
"valid_targets_min": 1240
},
{
"epoch": 1.5942028985507246,
"grad_norm": 0.6694592764443967,
"learning_rate": 3.805308836877586e-05,
"loss": 0.4112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37781035900115967,
"step": 990,
"valid_targets_mean": 3438.4,
"valid_targets_min": 1124
},
{
"epoch": 1.6022544283413849,
"grad_norm": 0.7386035260971374,
"learning_rate": 3.80183817048745e-05,
"loss": 0.3702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38043975830078125,
"step": 995,
"valid_targets_mean": 2587.6,
"valid_targets_min": 1218
},
{
"epoch": 1.6103059581320451,
"grad_norm": 0.7294675876286597,
"learning_rate": 3.7983384533531894e-05,
"loss": 0.395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3978623151779175,
"step": 1000,
"valid_targets_mean": 2969.8,
"valid_targets_min": 1309
},
{
"epoch": 1.6183574879227054,
"grad_norm": 0.6439654018799925,
"learning_rate": 3.7948097419001736e-05,
"loss": 0.3842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.402493953704834,
"step": 1005,
"valid_targets_mean": 3475.1,
"valid_targets_min": 1128
},
{
"epoch": 1.6264090177133657,
"grad_norm": 0.7469049629085611,
"learning_rate": 3.7912520930212445e-05,
"loss": 0.378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3579831123352051,
"step": 1010,
"valid_targets_mean": 2925.9,
"valid_targets_min": 1311
},
{
"epoch": 1.634460547504026,
"grad_norm": 0.6828460239332308,
"learning_rate": 3.7876655640757974e-05,
"loss": 0.3646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37845996022224426,
"step": 1015,
"valid_targets_mean": 3369.0,
"valid_targets_min": 1109
},
{
"epoch": 1.642512077294686,
"grad_norm": 0.916703135376311,
"learning_rate": 3.784050212888857e-05,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3890652358531952,
"step": 1020,
"valid_targets_mean": 3307.7,
"valid_targets_min": 1172
},
{
"epoch": 1.6505636070853462,
"grad_norm": 0.8453007862430895,
"learning_rate": 3.780406097750141e-05,
"loss": 0.3892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.393949419260025,
"step": 1025,
"valid_targets_mean": 2625.4,
"valid_targets_min": 1313
},
{
"epoch": 1.6586151368760065,
"grad_norm": 0.7030261980183728,
"learning_rate": 3.776733277413127e-05,
"loss": 0.3771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3959161043167114,
"step": 1030,
"valid_targets_mean": 3028.0,
"valid_targets_min": 1602
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.6424805669240223,
"learning_rate": 3.7730318110941004e-05,
"loss": 0.3843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3867754340171814,
"step": 1035,
"valid_targets_mean": 3680.5,
"valid_targets_min": 1441
},
{
"epoch": 1.6747181964573268,
"grad_norm": 0.6723162629033781,
"learning_rate": 3.7693017584712013e-05,
"loss": 0.3793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3691941499710083,
"step": 1040,
"valid_targets_mean": 3472.8,
"valid_targets_min": 1029
},
{
"epoch": 1.682769726247987,
"grad_norm": 0.66473478421512,
"learning_rate": 3.765543179683462e-05,
"loss": 0.3855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37193185091018677,
"step": 1045,
"valid_targets_mean": 3390.6,
"valid_targets_min": 1873
},
{
"epoch": 1.6908212560386473,
"grad_norm": 0.6827138169001735,
"learning_rate": 3.7617561353298395e-05,
"loss": 0.4096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.407214492559433,
"step": 1050,
"valid_targets_mean": 3282.8,
"valid_targets_min": 588
},
{
"epoch": 1.6988727858293076,
"grad_norm": 0.6054569389155301,
"learning_rate": 3.7579406864682327e-05,
"loss": 0.3876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39312368631362915,
"step": 1055,
"valid_targets_mean": 4544.4,
"valid_targets_min": 1616
},
{
"epoch": 1.7069243156199678,
"grad_norm": 0.6376030347219761,
"learning_rate": 3.7540968946145036e-05,
"loss": 0.3712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37451237440109253,
"step": 1060,
"valid_targets_mean": 3384.4,
"valid_targets_min": 1236
},
{
"epoch": 1.714975845410628,
"grad_norm": 0.6211030350353202,
"learning_rate": 3.750224821741486e-05,
"loss": 0.3837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38833314180374146,
"step": 1065,
"valid_targets_mean": 4230.6,
"valid_targets_min": 1229
},
{
"epoch": 1.7230273752012883,
"grad_norm": 1.3513202092043939,
"learning_rate": 3.7463245302779795e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3714137673377991,
"step": 1070,
"valid_targets_mean": 3359.7,
"valid_targets_min": 1076
},
{
"epoch": 1.7310789049919486,
"grad_norm": 0.6120247412950662,
"learning_rate": 3.742396083107751e-05,
"loss": 0.384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36947697401046753,
"step": 1075,
"valid_targets_mean": 4327.3,
"valid_targets_min": 1075
},
{
"epoch": 1.7391304347826086,
"grad_norm": 0.6000696270867342,
"learning_rate": 3.7384395435685166e-05,
"loss": 0.3725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33209776878356934,
"step": 1080,
"valid_targets_mean": 3812.0,
"valid_targets_min": 1142
},
{
"epoch": 1.747181964573269,
"grad_norm": 0.8080033004353664,
"learning_rate": 3.7344549754509196e-05,
"loss": 0.3952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4237212538719177,
"step": 1085,
"valid_targets_mean": 2473.6,
"valid_targets_min": 1208
},
{
"epoch": 1.7552334943639292,
"grad_norm": 0.5805164381467139,
"learning_rate": 3.7304424429975046e-05,
"loss": 0.3171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3186456561088562,
"step": 1090,
"valid_targets_mean": 7490.2,
"valid_targets_min": 2721
},
{
"epoch": 1.7632850241545892,
"grad_norm": 0.4969614961756743,
"learning_rate": 3.726402010901681e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25411802530288696,
"step": 1095,
"valid_targets_mean": 6344.0,
"valid_targets_min": 3073
},
{
"epoch": 1.7713365539452495,
"grad_norm": 0.5036039262445117,
"learning_rate": 3.722333744306678e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2208937406539917,
"step": 1100,
"valid_targets_mean": 5062.1,
"valid_targets_min": 2985
},
{
"epoch": 1.7793880837359097,
"grad_norm": 0.47890617580766465,
"learning_rate": 3.7182377088044984e-05,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27038395404815674,
"step": 1105,
"valid_targets_mean": 5613.6,
"valid_targets_min": 2620
},
{
"epoch": 1.78743961352657,
"grad_norm": 1.0317443624660205,
"learning_rate": 3.7141139704348576e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22091877460479736,
"step": 1110,
"valid_targets_mean": 6100.1,
"valid_targets_min": 3494
},
{
"epoch": 1.7954911433172303,
"grad_norm": 0.4528546728089874,
"learning_rate": 3.7099625956841175e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19431838393211365,
"step": 1115,
"valid_targets_mean": 5711.6,
"valid_targets_min": 3761
},
{
"epoch": 1.8035426731078905,
"grad_norm": 0.48395965253856643,
"learning_rate": 3.70578365148422e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23526781797409058,
"step": 1120,
"valid_targets_mean": 5863.1,
"valid_targets_min": 3178
},
{
"epoch": 1.8115942028985508,
"grad_norm": 0.40906986287532093,
"learning_rate": 3.701577205211604e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22184664011001587,
"step": 1125,
"valid_targets_mean": 6090.8,
"valid_targets_min": 2870
},
{
"epoch": 1.819645732689211,
"grad_norm": 0.4479703485506722,
"learning_rate": 3.697343324686119e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2089478075504303,
"step": 1130,
"valid_targets_mean": 5746.5,
"valid_targets_min": 3334
},
{
"epoch": 1.8276972624798713,
"grad_norm": 0.5767247918497662,
"learning_rate": 3.693082078169933e-05,
"loss": 0.2338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23523643612861633,
"step": 1135,
"valid_targets_mean": 5464.9,
"valid_targets_min": 3204
},
{
"epoch": 1.8357487922705316,
"grad_norm": 0.47967598737718,
"learning_rate": 3.68879353436643e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2230021208524704,
"step": 1140,
"valid_targets_mean": 5526.6,
"valid_targets_min": 2793
},
{
"epoch": 1.8438003220611916,
"grad_norm": 0.4741249695731208,
"learning_rate": 3.684477762419108e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24306999146938324,
"step": 1145,
"valid_targets_mean": 6074.9,
"valid_targets_min": 3285
},
{
"epoch": 1.8518518518518519,
"grad_norm": 0.48153493651658874,
"learning_rate": 3.6801348319104546e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2044723629951477,
"step": 1150,
"valid_targets_mean": 5260.6,
"valid_targets_min": 2292
},
{
"epoch": 1.8599033816425121,
"grad_norm": 0.584632590412221,
"learning_rate": 3.675764812860833e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.224099799990654,
"step": 1155,
"valid_targets_mean": 5752.9,
"valid_targets_min": 4204
},
{
"epoch": 1.8679549114331722,
"grad_norm": 0.5420753765458437,
"learning_rate": 3.671367775727353e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21649691462516785,
"step": 1160,
"valid_targets_mean": 4836.7,
"valid_targets_min": 2111
},
{
"epoch": 1.8760064412238324,
"grad_norm": 0.4760661908355776,
"learning_rate": 3.666943791402726e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24728357791900635,
"step": 1165,
"valid_targets_mean": 6021.0,
"valid_targets_min": 4439
},
{
"epoch": 1.8840579710144927,
"grad_norm": 0.6720080745282876,
"learning_rate": 3.662492931214137e-05,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21869316697120667,
"step": 1170,
"valid_targets_mean": 5661.9,
"valid_targets_min": 3607
},
{
"epoch": 1.892109500805153,
"grad_norm": 0.4890482756646293,
"learning_rate": 3.6580152669220784e-05,
"loss": 0.2143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22565293312072754,
"step": 1175,
"valid_targets_mean": 5420.4,
"valid_targets_min": 3078
},
{
"epoch": 1.9001610305958132,
"grad_norm": 0.5189964339664618,
"learning_rate": 3.6535108707192053e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20920491218566895,
"step": 1180,
"valid_targets_mean": 5750.4,
"valid_targets_min": 2491
},
{
"epoch": 1.9082125603864735,
"grad_norm": 0.4214170728597196,
"learning_rate": 3.648979815229167e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20261229574680328,
"step": 1185,
"valid_targets_mean": 5996.6,
"valid_targets_min": 4004
},
{
"epoch": 1.9162640901771337,
"grad_norm": 0.43481442428355693,
"learning_rate": 3.644422173505433e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20599091053009033,
"step": 1190,
"valid_targets_mean": 6200.9,
"valid_targets_min": 3148
},
{
"epoch": 1.924315619967794,
"grad_norm": 0.45638204853677106,
"learning_rate": 3.639838019030123e-05,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1937769055366516,
"step": 1195,
"valid_targets_mean": 6472.3,
"valid_targets_min": 3581
},
{
"epoch": 1.9323671497584543,
"grad_norm": 0.4186145666771615,
"learning_rate": 3.635227425712812e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2861325144767761,
"step": 1200,
"valid_targets_mean": 7532.8,
"valid_targets_min": 3206
},
{
"epoch": 1.9404186795491143,
"grad_norm": 0.5308258730995378,
"learning_rate": 3.6305904678893504e-05,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2531401515007019,
"step": 1205,
"valid_targets_mean": 5952.9,
"valid_targets_min": 3304
},
{
"epoch": 1.9484702093397746,
"grad_norm": 0.46680263986526405,
"learning_rate": 3.6259272203206535e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21227112412452698,
"step": 1210,
"valid_targets_mean": 5735.1,
"valid_targets_min": 3368
},
{
"epoch": 1.9565217391304348,
"grad_norm": 0.491355991243715,
"learning_rate": 3.621237758191505e-05,
"loss": 0.214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2222747504711151,
"step": 1215,
"valid_targets_mean": 5506.7,
"valid_targets_min": 2908
},
{
"epoch": 1.9645732689210949,
"grad_norm": 0.4862497243022364,
"learning_rate": 3.616522157109342e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2260490208864212,
"step": 1220,
"valid_targets_mean": 5777.9,
"valid_targets_min": 3451
},
{
"epoch": 1.9726247987117551,
"grad_norm": 0.4051875398639865,
"learning_rate": 3.6117804931030324e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19149649143218994,
"step": 1225,
"valid_targets_mean": 6045.9,
"valid_targets_min": 2967
},
{
"epoch": 1.9806763285024154,
"grad_norm": 0.48575560614945534,
"learning_rate": 3.607012842621657e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21349817514419556,
"step": 1230,
"valid_targets_mean": 6113.4,
"valid_targets_min": 3912
},
{
"epoch": 1.9887278582930756,
"grad_norm": 0.4334111032895171,
"learning_rate": 3.602219282533269e-05,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1997205913066864,
"step": 1235,
"valid_targets_mean": 5837.0,
"valid_targets_min": 3528
},
{
"epoch": 1.996779388083736,
"grad_norm": 0.4425270232705891,
"learning_rate": 3.597399890123659e-05,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22543010115623474,
"step": 1240,
"valid_targets_mean": 6356.6,
"valid_targets_min": 3725
},
{
"epoch": 2.004830917874396,
"grad_norm": 0.49848016805395046,
"learning_rate": 3.5925547430951094e-05,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30809903144836426,
"step": 1245,
"valid_targets_mean": 6803.5,
"valid_targets_min": 3040
},
{
"epoch": 2.0128824476650564,
"grad_norm": 0.5893052782286002,
"learning_rate": 3.587683919565136e-05,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27029603719711304,
"step": 1250,
"valid_targets_mean": 5952.2,
"valid_targets_min": 3694
},
{
"epoch": 2.0209339774557167,
"grad_norm": 0.5557870949459839,
"learning_rate": 3.582787498065237e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3327678442001343,
"step": 1255,
"valid_targets_mean": 5764.1,
"valid_targets_min": 2130
},
{
"epoch": 2.028985507246377,
"grad_norm": 0.4584733838358168,
"learning_rate": 3.577865557539621e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30011194944381714,
"step": 1260,
"valid_targets_mean": 6953.2,
"valid_targets_min": 3425
},
{
"epoch": 2.037037037037037,
"grad_norm": 1.64628767564844,
"learning_rate": 3.572918177343935e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30400946736335754,
"step": 1265,
"valid_targets_mean": 6372.9,
"valid_targets_min": 2633
},
{
"epoch": 2.0450885668276975,
"grad_norm": 0.47363097381646996,
"learning_rate": 3.567945437243987e-05,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3237455487251282,
"step": 1270,
"valid_targets_mean": 6667.6,
"valid_targets_min": 3230
},
{
"epoch": 2.0531400966183573,
"grad_norm": 0.6121579597876319,
"learning_rate": 3.5629474174144564e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3143073320388794,
"step": 1275,
"valid_targets_mean": 5952.1,
"valid_targets_min": 3816
},
{
"epoch": 2.0611916264090175,
"grad_norm": 0.5122726834409544,
"learning_rate": 3.5579241984376065e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2792460322380066,
"step": 1280,
"valid_targets_mean": 6181.7,
"valid_targets_min": 1726
},
{
"epoch": 2.069243156199678,
"grad_norm": 0.5279318998363034,
"learning_rate": 3.5528758613019804e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2636644244194031,
"step": 1285,
"valid_targets_mean": 5198.9,
"valid_targets_min": 1161
},
{
"epoch": 2.077294685990338,
"grad_norm": 0.4637806256747439,
"learning_rate": 3.547802487401097e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2678183317184448,
"step": 1290,
"valid_targets_mean": 5936.2,
"valid_targets_min": 2526
},
{
"epoch": 2.0853462157809983,
"grad_norm": 0.44332589750107415,
"learning_rate": 3.54270415853214e-05,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2518324851989746,
"step": 1295,
"valid_targets_mean": 6524.1,
"valid_targets_min": 3439
},
{
"epoch": 2.0933977455716586,
"grad_norm": 0.5070450536840013,
"learning_rate": 3.537580956894638e-05,
"loss": 0.278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27724772691726685,
"step": 1300,
"valid_targets_mean": 6404.5,
"valid_targets_min": 2689
},
{
"epoch": 2.101449275362319,
"grad_norm": 0.6584385593174998,
"learning_rate": 3.532432965089138e-05,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2892034649848938,
"step": 1305,
"valid_targets_mean": 5932.1,
"valid_targets_min": 2432
},
{
"epoch": 2.109500805152979,
"grad_norm": 0.4944188614557695,
"learning_rate": 3.527260266115876e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32951074838638306,
"step": 1310,
"valid_targets_mean": 6782.6,
"valid_targets_min": 3784
},
{
"epoch": 2.1175523349436394,
"grad_norm": 0.4980617413022126,
"learning_rate": 3.522062943373438e-05,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2504119575023651,
"step": 1315,
"valid_targets_mean": 6065.6,
"valid_targets_min": 3311
},
{
"epoch": 2.1256038647342996,
"grad_norm": 0.5112205537054673,
"learning_rate": 3.516841080657413e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2678036689758301,
"step": 1320,
"valid_targets_mean": 4948.5,
"valid_targets_min": 1373
},
{
"epoch": 2.13365539452496,
"grad_norm": 0.9291687075910791,
"learning_rate": 3.511594762159046e-05,
"loss": 0.3325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42405465245246887,
"step": 1325,
"valid_targets_mean": 2751.3,
"valid_targets_min": 1151
},
{
"epoch": 2.14170692431562,
"grad_norm": 0.8796559274131959,
"learning_rate": 3.506324072463878e-05,
"loss": 0.4501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4509429931640625,
"step": 1330,
"valid_targets_mean": 2481.8,
"valid_targets_min": 872
},
{
"epoch": 2.14975845410628,
"grad_norm": 0.7338052792870016,
"learning_rate": 3.5010290965503826e-05,
"loss": 0.4473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42610806226730347,
"step": 1335,
"valid_targets_mean": 3228.8,
"valid_targets_min": 1082
},
{
"epoch": 2.1578099838969402,
"grad_norm": 0.9099556688067492,
"learning_rate": 3.495709919788597e-05,
"loss": 0.4364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4756355881690979,
"step": 1340,
"valid_targets_mean": 3290.7,
"valid_targets_min": 905
},
{
"epoch": 2.1658615136876005,
"grad_norm": 0.7280295738870289,
"learning_rate": 3.490366627938742e-05,
"loss": 0.4281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4415823817253113,
"step": 1345,
"valid_targets_mean": 3735.3,
"valid_targets_min": 1115
},
{
"epoch": 2.1739130434782608,
"grad_norm": 0.8552032601411625,
"learning_rate": 3.484999307149846e-05,
"loss": 0.4093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4188133478164673,
"step": 1350,
"valid_targets_mean": 2806.2,
"valid_targets_min": 1140
},
{
"epoch": 2.181964573268921,
"grad_norm": 0.7699287073880586,
"learning_rate": 3.47960804395835e-05,
"loss": 0.4144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38652926683425903,
"step": 1355,
"valid_targets_mean": 2498.2,
"valid_targets_min": 970
},
{
"epoch": 2.1900161030595813,
"grad_norm": 0.6914816395930312,
"learning_rate": 3.474192925286714e-05,
"loss": 0.4313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39671099185943604,
"step": 1360,
"valid_targets_mean": 3014.8,
"valid_targets_min": 1130
},
{
"epoch": 2.1980676328502415,
"grad_norm": 0.8257531389708893,
"learning_rate": 3.468754038442017e-05,
"loss": 0.4392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4281843304634094,
"step": 1365,
"valid_targets_mean": 2247.2,
"valid_targets_min": 1125
},
{
"epoch": 2.206119162640902,
"grad_norm": 0.7268372945505573,
"learning_rate": 3.463291471114548e-05,
"loss": 0.4095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4062803387641907,
"step": 1370,
"valid_targets_mean": 3460.9,
"valid_targets_min": 1652
},
{
"epoch": 2.214170692431562,
"grad_norm": 0.8070422587353386,
"learning_rate": 3.4578053113763936e-05,
"loss": 0.4513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4336710572242737,
"step": 1375,
"valid_targets_mean": 2609.9,
"valid_targets_min": 1079
},
{
"epoch": 2.2222222222222223,
"grad_norm": 1.67186958813965,
"learning_rate": 3.452295647680014e-05,
"loss": 0.4001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40693116188049316,
"step": 1380,
"valid_targets_mean": 3187.6,
"valid_targets_min": 1303
},
{
"epoch": 2.2302737520128826,
"grad_norm": 0.7010798669064308,
"learning_rate": 3.4467625688568245e-05,
"loss": 0.4279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40231195092201233,
"step": 1385,
"valid_targets_mean": 3980.8,
"valid_targets_min": 1495
},
{
"epoch": 2.238325281803543,
"grad_norm": 0.9239851489046476,
"learning_rate": 3.4412061641157546e-05,
"loss": 0.4443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.434467613697052,
"step": 1390,
"valid_targets_mean": 2712.9,
"valid_targets_min": 1495
},
{
"epoch": 2.246376811594203,
"grad_norm": 0.7442921098581603,
"learning_rate": 3.435626523041815e-05,
"loss": 0.4188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4101715683937073,
"step": 1395,
"valid_targets_mean": 3055.6,
"valid_targets_min": 1216
},
{
"epoch": 2.2544283413848634,
"grad_norm": 0.7796509221772335,
"learning_rate": 3.430023735594653e-05,
"loss": 0.4248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43132680654525757,
"step": 1400,
"valid_targets_mean": 3022.4,
"valid_targets_min": 1130
},
{
"epoch": 2.262479871175523,
"grad_norm": 0.8845650683341554,
"learning_rate": 3.4243978921071005e-05,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4295615553855896,
"step": 1405,
"valid_targets_mean": 2932.4,
"valid_targets_min": 1319
},
{
"epoch": 2.2705314009661834,
"grad_norm": 0.7654694935136631,
"learning_rate": 3.418749083283719e-05,
"loss": 0.4139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41558438539505005,
"step": 1410,
"valid_targets_mean": 2893.2,
"valid_targets_min": 1501
},
{
"epoch": 2.2785829307568437,
"grad_norm": 0.7620855439193758,
"learning_rate": 3.413077400199334e-05,
"loss": 0.4227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3939434885978699,
"step": 1415,
"valid_targets_mean": 2413.7,
"valid_targets_min": 1044
},
{
"epoch": 2.286634460547504,
"grad_norm": 0.6909091800489532,
"learning_rate": 3.407382934297571e-05,
"loss": 0.4174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3776891231536865,
"step": 1420,
"valid_targets_mean": 3168.1,
"valid_targets_min": 1035
},
{
"epoch": 2.2946859903381642,
"grad_norm": 0.7978903184807417,
"learning_rate": 3.4016657773893785e-05,
"loss": 0.422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46548742055892944,
"step": 1425,
"valid_targets_mean": 3087.7,
"valid_targets_min": 1699
},
{
"epoch": 2.3027375201288245,
"grad_norm": 0.8248703939493464,
"learning_rate": 3.3959260216515495e-05,
"loss": 0.4219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41521650552749634,
"step": 1430,
"valid_targets_mean": 2646.4,
"valid_targets_min": 1509
},
{
"epoch": 2.3107890499194848,
"grad_norm": 0.7311952260051283,
"learning_rate": 3.3901637596252325e-05,
"loss": 0.3865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36918574571609497,
"step": 1435,
"valid_targets_mean": 2969.6,
"valid_targets_min": 1251
},
{
"epoch": 2.318840579710145,
"grad_norm": 0.7976719684765547,
"learning_rate": 3.384379084214443e-05,
"loss": 0.432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4152054190635681,
"step": 1440,
"valid_targets_mean": 3140.2,
"valid_targets_min": 1161
},
{
"epoch": 2.3268921095008053,
"grad_norm": 0.7964318060668145,
"learning_rate": 3.378572088684562e-05,
"loss": 0.4245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45041656494140625,
"step": 1445,
"valid_targets_mean": 2786.8,
"valid_targets_min": 1501
},
{
"epoch": 2.3349436392914655,
"grad_norm": 0.779177762219085,
"learning_rate": 3.372742866660836e-05,
"loss": 0.4063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42900824546813965,
"step": 1450,
"valid_targets_mean": 3073.4,
"valid_targets_min": 1434
},
{
"epoch": 2.342995169082126,
"grad_norm": 0.8252841045839578,
"learning_rate": 3.3668915121268636e-05,
"loss": 0.4356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42234331369400024,
"step": 1455,
"valid_targets_mean": 2718.1,
"valid_targets_min": 1147
},
{
"epoch": 2.3510466988727856,
"grad_norm": 0.7559789239050331,
"learning_rate": 3.361018119423085e-05,
"loss": 0.4107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3902217745780945,
"step": 1460,
"valid_targets_mean": 3051.3,
"valid_targets_min": 1170
},
{
"epoch": 2.359098228663446,
"grad_norm": 0.7118532524697113,
"learning_rate": 3.3551227832452555e-05,
"loss": 0.4167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4386996924877167,
"step": 1465,
"valid_targets_mean": 3645.1,
"valid_targets_min": 1319
},
{
"epoch": 2.367149758454106,
"grad_norm": 0.7314007089106499,
"learning_rate": 3.3492055986429235e-05,
"loss": 0.4215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3893301486968994,
"step": 1470,
"valid_targets_mean": 3020.9,
"valid_targets_min": 1036
},
{
"epoch": 2.3752012882447664,
"grad_norm": 0.7883519271357176,
"learning_rate": 3.3432666610178936e-05,
"loss": 0.3829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3778621554374695,
"step": 1475,
"valid_targets_mean": 2636.9,
"valid_targets_min": 632
},
{
"epoch": 2.3832528180354267,
"grad_norm": 0.5950705396292623,
"learning_rate": 3.3373060661226944e-05,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3533982038497925,
"step": 1480,
"valid_targets_mean": 4681.1,
"valid_targets_min": 1703
},
{
"epoch": 2.391304347826087,
"grad_norm": 0.6284697509500937,
"learning_rate": 3.331323910059027e-05,
"loss": 0.3813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36771711707115173,
"step": 1485,
"valid_targets_mean": 4288.2,
"valid_targets_min": 349
},
{
"epoch": 2.399355877616747,
"grad_norm": 0.6241002825603361,
"learning_rate": 3.3253202892762244e-05,
"loss": 0.3774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35911619663238525,
"step": 1490,
"valid_targets_mean": 4145.6,
"valid_targets_min": 1505
},
{
"epoch": 2.4074074074074074,
"grad_norm": 0.7195975803486768,
"learning_rate": 3.319295300569686e-05,
"loss": 0.3541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3680953085422516,
"step": 1495,
"valid_targets_mean": 3169.7,
"valid_targets_min": 1125
},
{
"epoch": 2.4154589371980677,
"grad_norm": 0.6678894669137365,
"learning_rate": 3.3132490410793294e-05,
"loss": 0.3807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40425896644592285,
"step": 1500,
"valid_targets_mean": 3801.9,
"valid_targets_min": 1805
},
{
"epoch": 2.423510466988728,
"grad_norm": 0.67381554336476,
"learning_rate": 3.3071816082880115e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3536141514778137,
"step": 1505,
"valid_targets_mean": 3517.1,
"valid_targets_min": 1172
},
{
"epoch": 2.4315619967793882,
"grad_norm": 0.5844843611773384,
"learning_rate": 3.3010931000199674e-05,
"loss": 0.3513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3546409606933594,
"step": 1510,
"valid_targets_mean": 4191.2,
"valid_targets_min": 2286
},
{
"epoch": 2.4396135265700485,
"grad_norm": 0.6086706004595346,
"learning_rate": 3.2949836144392256e-05,
"loss": 0.3428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32763075828552246,
"step": 1515,
"valid_targets_mean": 4189.8,
"valid_targets_min": 1568
},
{
"epoch": 2.4476650563607087,
"grad_norm": 0.8158802293533742,
"learning_rate": 3.28885325004803e-05,
"loss": 0.3678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35021084547042847,
"step": 1520,
"valid_targets_mean": 3081.1,
"valid_targets_min": 1168
},
{
"epoch": 2.455716586151369,
"grad_norm": 0.6124714609883762,
"learning_rate": 3.282702105685251e-05,
"loss": 0.3543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33643293380737305,
"step": 1525,
"valid_targets_mean": 3844.6,
"valid_targets_min": 1318
},
{
"epoch": 2.463768115942029,
"grad_norm": 0.6419535517935,
"learning_rate": 3.2765302805247885e-05,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.324346661567688,
"step": 1530,
"valid_targets_mean": 3268.8,
"valid_targets_min": 1153
},
{
"epoch": 2.471819645732689,
"grad_norm": 0.707763033567243,
"learning_rate": 3.270337874073977e-05,
"loss": 0.3842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39264971017837524,
"step": 1535,
"valid_targets_mean": 3251.4,
"valid_targets_min": 1576
},
{
"epoch": 2.4798711755233493,
"grad_norm": 0.6517860581223903,
"learning_rate": 3.264124986171981e-05,
"loss": 0.3503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30974501371383667,
"step": 1540,
"valid_targets_mean": 3231.7,
"valid_targets_min": 1471
},
{
"epoch": 2.4879227053140096,
"grad_norm": 0.6861932870077228,
"learning_rate": 3.2578917169881816e-05,
"loss": 0.3679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3639856278896332,
"step": 1545,
"valid_targets_mean": 3158.2,
"valid_targets_min": 373
},
{
"epoch": 2.49597423510467,
"grad_norm": 0.5800378877703327,
"learning_rate": 3.2516381670205665e-05,
"loss": 0.3418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33077770471572876,
"step": 1550,
"valid_targets_mean": 4750.0,
"valid_targets_min": 1270
},
{
"epoch": 2.50402576489533,
"grad_norm": 0.6790879537056581,
"learning_rate": 3.245364437094105e-05,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36615103483200073,
"step": 1555,
"valid_targets_mean": 3425.2,
"valid_targets_min": 1034
},
{
"epoch": 2.5120772946859904,
"grad_norm": 0.7532708248786624,
"learning_rate": 3.239070628359126e-05,
"loss": 0.3473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3348079025745392,
"step": 1560,
"valid_targets_mean": 2773.3,
"valid_targets_min": 1054
},
{
"epoch": 2.5201288244766507,
"grad_norm": 0.6602490038924721,
"learning_rate": 3.232756842289685e-05,
"loss": 0.3609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3299705982208252,
"step": 1565,
"valid_targets_mean": 4059.8,
"valid_targets_min": 1416
},
{
"epoch": 2.528180354267311,
"grad_norm": 0.635105782473463,
"learning_rate": 3.2264231806819286e-05,
"loss": 0.3443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3414621353149414,
"step": 1570,
"valid_targets_mean": 3796.5,
"valid_targets_min": 1490
},
{
"epoch": 2.536231884057971,
"grad_norm": 0.6634194373750147,
"learning_rate": 3.220069745652456e-05,
"loss": 0.3435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3682880997657776,
"step": 1575,
"valid_targets_mean": 3359.2,
"valid_targets_min": 1401
},
{
"epoch": 2.544283413848631,
"grad_norm": 0.6748832386881813,
"learning_rate": 3.213696639636666e-05,
"loss": 0.3803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37244677543640137,
"step": 1580,
"valid_targets_mean": 3234.9,
"valid_targets_min": 1543
},
{
"epoch": 2.5523349436392913,
"grad_norm": 0.6147417333490566,
"learning_rate": 3.207303965387114e-05,
"loss": 0.3398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2844334840774536,
"step": 1585,
"valid_targets_mean": 3613.4,
"valid_targets_min": 1535
},
{
"epoch": 2.5603864734299515,
"grad_norm": 0.6644115534295828,
"learning_rate": 3.200891825971846e-05,
"loss": 0.341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34174948930740356,
"step": 1590,
"valid_targets_mean": 3520.8,
"valid_targets_min": 1561
},
{
"epoch": 2.5684380032206118,
"grad_norm": 0.6492076929001203,
"learning_rate": 3.194460324772746e-05,
"loss": 0.3575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34135136008262634,
"step": 1595,
"valid_targets_mean": 3454.2,
"valid_targets_min": 1036
},
{
"epoch": 2.576489533011272,
"grad_norm": 0.6262401028348537,
"learning_rate": 3.188009565483861e-05,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37102776765823364,
"step": 1600,
"valid_targets_mean": 3877.2,
"valid_targets_min": 1400
},
{
"epoch": 2.5845410628019323,
"grad_norm": 0.6690368914483794,
"learning_rate": 3.1815396521097376e-05,
"loss": 0.3443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30660367012023926,
"step": 1605,
"valid_targets_mean": 3103.3,
"valid_targets_min": 1327
},
{
"epoch": 2.5925925925925926,
"grad_norm": 0.6782490130071587,
"learning_rate": 3.1750506889637366e-05,
"loss": 0.3738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3212292492389679,
"step": 1610,
"valid_targets_mean": 3301.8,
"valid_targets_min": 1530
},
{
"epoch": 2.600644122383253,
"grad_norm": 0.6136219154267422,
"learning_rate": 3.1685427806663574e-05,
"loss": 0.3319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3197278678417206,
"step": 1615,
"valid_targets_mean": 3827.2,
"valid_targets_min": 1604
},
{
"epoch": 2.608695652173913,
"grad_norm": 0.7590245604099114,
"learning_rate": 3.1620160321435475e-05,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41536277532577515,
"step": 1620,
"valid_targets_mean": 3155.0,
"valid_targets_min": 1301
},
{
"epoch": 2.6167471819645733,
"grad_norm": 0.6668069970888741,
"learning_rate": 3.155470548625014e-05,
"loss": 0.3414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34977424144744873,
"step": 1625,
"valid_targets_mean": 3495.8,
"valid_targets_min": 1108
},
{
"epoch": 2.6247987117552336,
"grad_norm": 0.6443781380528575,
"learning_rate": 3.1489064356425235e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.348181813955307,
"step": 1630,
"valid_targets_mean": 3598.6,
"valid_targets_min": 1663
},
{
"epoch": 2.632850241545894,
"grad_norm": 0.6477230031259141,
"learning_rate": 3.142323799028204e-05,
"loss": 0.3225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34765568375587463,
"step": 1635,
"valid_targets_mean": 3781.5,
"valid_targets_min": 1585
},
{
"epoch": 2.640901771336554,
"grad_norm": 0.6757898090196188,
"learning_rate": 3.135722744912836e-05,
"loss": 0.3501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38952842354774475,
"step": 1640,
"valid_targets_mean": 4125.3,
"valid_targets_min": 1262
},
{
"epoch": 2.6489533011272144,
"grad_norm": 0.6699916964095252,
"learning_rate": 3.129103379724143e-05,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37032926082611084,
"step": 1645,
"valid_targets_mean": 3489.9,
"valid_targets_min": 1525
},
{
"epoch": 2.6570048309178746,
"grad_norm": 0.639493421870476,
"learning_rate": 3.122465810185075e-05,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33100080490112305,
"step": 1650,
"valid_targets_mean": 3673.7,
"valid_targets_min": 1354
},
{
"epoch": 2.6650563607085345,
"grad_norm": 0.5871950095800859,
"learning_rate": 3.1158101433120863e-05,
"loss": 0.3465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34115904569625854,
"step": 1655,
"valid_targets_mean": 4327.2,
"valid_targets_min": 1228
},
{
"epoch": 2.6731078904991947,
"grad_norm": 0.6666026792346776,
"learning_rate": 3.1091364864134136e-05,
"loss": 0.3438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39104804396629333,
"step": 1660,
"valid_targets_mean": 3398.6,
"valid_targets_min": 1445
},
{
"epoch": 2.681159420289855,
"grad_norm": 0.6426036994837567,
"learning_rate": 3.102444947087342e-05,
"loss": 0.3465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34018710255622864,
"step": 1665,
"valid_targets_mean": 3618.1,
"valid_targets_min": 1665
},
{
"epoch": 2.6892109500805152,
"grad_norm": 0.7200889886232774,
"learning_rate": 3.0957356332204745e-05,
"loss": 0.3624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4483473300933838,
"step": 1670,
"valid_targets_mean": 3554.4,
"valid_targets_min": 1075
},
{
"epoch": 2.6972624798711755,
"grad_norm": 0.6807458182499385,
"learning_rate": 3.089008652985989e-05,
"loss": 0.3517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31604230403900146,
"step": 1675,
"valid_targets_mean": 3257.0,
"valid_targets_min": 1286
},
{
"epoch": 2.7053140096618358,
"grad_norm": 0.7052899877260982,
"learning_rate": 3.082264114841892e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3132331371307373,
"step": 1680,
"valid_targets_mean": 2975.9,
"valid_targets_min": 1470
},
{
"epoch": 2.713365539452496,
"grad_norm": 0.6354810637538505,
"learning_rate": 3.07550212752928e-05,
"loss": 0.3442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128201365470886,
"step": 1685,
"valid_targets_mean": 3791.3,
"valid_targets_min": 1211
},
{
"epoch": 2.7214170692431563,
"grad_norm": 0.5906889884547679,
"learning_rate": 3.068722800070574e-05,
"loss": 0.334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894616723060608,
"step": 1690,
"valid_targets_mean": 3958.0,
"valid_targets_min": 1407
},
{
"epoch": 2.7294685990338166,
"grad_norm": 0.643609035593482,
"learning_rate": 3.0619262417677695e-05,
"loss": 0.3489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34073030948638916,
"step": 1695,
"valid_targets_mean": 3950.0,
"valid_targets_min": 1116
},
{
"epoch": 2.7375201288244764,
"grad_norm": 0.7282369023618399,
"learning_rate": 3.055112562200673e-05,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3716239631175995,
"step": 1700,
"valid_targets_mean": 3736.1,
"valid_targets_min": 991
},
{
"epoch": 2.7455716586151366,
"grad_norm": 0.7474926314066599,
"learning_rate": 3.0482818712251318e-05,
"loss": 0.3402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35656508803367615,
"step": 1705,
"valid_targets_mean": 3098.4,
"valid_targets_min": 1529
},
{
"epoch": 2.753623188405797,
"grad_norm": 0.5882343918140231,
"learning_rate": 3.0414342789712675e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22480350732803345,
"step": 1710,
"valid_targets_mean": 6031.0,
"valid_targets_min": 1980
},
{
"epoch": 2.761674718196457,
"grad_norm": 0.7860705058373512,
"learning_rate": 3.034569895841699e-05,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21748200058937073,
"step": 1715,
"valid_targets_mean": 5359.5,
"valid_targets_min": 3428
},
{
"epoch": 2.7697262479871174,
"grad_norm": 0.46882998249925517,
"learning_rate": 3.0276888325097583e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.211460679769516,
"step": 1720,
"valid_targets_mean": 5453.4,
"valid_targets_min": 2625
},
{
"epoch": 2.7777777777777777,
"grad_norm": 0.5396421101555618,
"learning_rate": 3.020791199917713e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22912117838859558,
"step": 1725,
"valid_targets_mean": 6407.3,
"valid_targets_min": 4226
},
{
"epoch": 2.785829307568438,
"grad_norm": 0.44331928629182393,
"learning_rate": 3.0138771092749722e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19119247794151306,
"step": 1730,
"valid_targets_mean": 6119.8,
"valid_targets_min": 2891
},
{
"epoch": 2.793880837359098,
"grad_norm": 0.4549848502323358,
"learning_rate": 3.006946672056297e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18082711100578308,
"step": 1735,
"valid_targets_mean": 5309.0,
"valid_targets_min": 3122
},
{
"epoch": 2.8019323671497585,
"grad_norm": 0.5088412843130042,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18192598223686218,
"step": 1740,
"valid_targets_mean": 5206.8,
"valid_targets_min": 3536
},
{
"epoch": 2.8099838969404187,
"grad_norm": 0.4533466677445726,
"learning_rate": 2.993037205106147e-05,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22841483354568481,
"step": 1745,
"valid_targets_mean": 6110.2,
"valid_targets_min": 3433
},
{
"epoch": 2.818035426731079,
"grad_norm": 0.42286915041535666,
"learning_rate": 2.9860583996347495e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16705384850502014,
"step": 1750,
"valid_targets_mean": 5580.4,
"valid_targets_min": 2346
},
{
"epoch": 2.8260869565217392,
"grad_norm": 0.46308406661472623,
"learning_rate": 2.9790636961039524e-05,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20052894949913025,
"step": 1755,
"valid_targets_mean": 5809.4,
"valid_targets_min": 2808
},
{
"epoch": 2.8341384863123995,
"grad_norm": 0.4973033226604493,
"learning_rate": 2.9720532072882268e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19987952709197998,
"step": 1760,
"valid_targets_mean": 5466.4,
"valid_targets_min": 1878
},
{
"epoch": 2.8421900161030598,
"grad_norm": 0.49364706625593213,
"learning_rate": 2.965027046216544e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24134349822998047,
"step": 1765,
"valid_targets_mean": 6193.4,
"valid_targets_min": 2985
},
{
"epoch": 2.85024154589372,
"grad_norm": 0.44774305114424784,
"learning_rate": 2.9579853261705573e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1811220645904541,
"step": 1770,
"valid_targets_mean": 5857.2,
"valid_targets_min": 3369
},
{
"epoch": 2.8582930756843803,
"grad_norm": 0.5084367346859436,
"learning_rate": 2.950928160682775e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16717293858528137,
"step": 1775,
"valid_targets_mean": 4669.6,
"valid_targets_min": 2984
},
{
"epoch": 2.86634460547504,
"grad_norm": 0.5258355536138191,
"learning_rate": 2.943855663534731e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21475860476493835,
"step": 1780,
"valid_targets_mean": 5739.6,
"valid_targets_min": 3163
},
{
"epoch": 2.8743961352657004,
"grad_norm": 0.624047290830488,
"learning_rate": 2.9367679487551473e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17102691531181335,
"step": 1785,
"valid_targets_mean": 5951.2,
"valid_targets_min": 2774
},
{
"epoch": 2.8824476650563606,
"grad_norm": 0.48242204698030056,
"learning_rate": 2.929665130618098e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20739901065826416,
"step": 1790,
"valid_targets_mean": 5372.6,
"valid_targets_min": 2692
},
{
"epoch": 2.890499194847021,
"grad_norm": 0.4326608763924011,
"learning_rate": 2.9225473236411655e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17670348286628723,
"step": 1795,
"valid_targets_mean": 5611.9,
"valid_targets_min": 3302
},
{
"epoch": 2.898550724637681,
"grad_norm": 0.4674400578356549,
"learning_rate": 2.915414642583596e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.192458838224411,
"step": 1800,
"valid_targets_mean": 5552.4,
"valid_targets_min": 3435
},
{
"epoch": 2.9066022544283414,
"grad_norm": 0.46590415009442393,
"learning_rate": 2.9082672024444485e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20876693725585938,
"step": 1805,
"valid_targets_mean": 5709.1,
"valid_targets_min": 3713
},
{
"epoch": 2.9146537842190017,
"grad_norm": 0.55521296635976,
"learning_rate": 2.901105118460737e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20165735483169556,
"step": 1810,
"valid_targets_mean": 5800.1,
"valid_targets_min": 3378
},
{
"epoch": 2.922705314009662,
"grad_norm": 0.44671622462161964,
"learning_rate": 2.8939285061055807e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20931756496429443,
"step": 1815,
"valid_targets_mean": 5923.8,
"valid_targets_min": 3662
},
{
"epoch": 2.930756843800322,
"grad_norm": 0.45724838211116503,
"learning_rate": 2.8867374810863325e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18910741806030273,
"step": 1820,
"valid_targets_mean": 5651.0,
"valid_targets_min": 3365
},
{
"epoch": 2.938808373590982,
"grad_norm": 0.45924176560852137,
"learning_rate": 2.8795321593427227e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2153066247701645,
"step": 1825,
"valid_targets_mean": 6766.6,
"valid_targets_min": 3372
},
{
"epoch": 2.9468599033816423,
"grad_norm": 0.4602179071328878,
"learning_rate": 2.8723126570449813e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17615215480327606,
"step": 1830,
"valid_targets_mean": 5546.4,
"valid_targets_min": 3374
},
{
"epoch": 2.9549114331723025,
"grad_norm": 0.4757535168677279,
"learning_rate": 2.8650790905919724e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18606898188591003,
"step": 1835,
"valid_targets_mean": 5870.6,
"valid_targets_min": 3626
},
{
"epoch": 2.962962962962963,
"grad_norm": 0.4550197511497243,
"learning_rate": 2.8578315766093133e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20954301953315735,
"step": 1840,
"valid_targets_mean": 5978.6,
"valid_targets_min": 3695
},
{
"epoch": 2.971014492753623,
"grad_norm": 0.48815632704334255,
"learning_rate": 2.850570231947493e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20100757479667664,
"step": 1845,
"valid_targets_mean": 5347.4,
"valid_targets_min": 3463
},
{
"epoch": 2.9790660225442833,
"grad_norm": 0.45140508763909315,
"learning_rate": 2.8432951736799933e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1854209005832672,
"step": 1850,
"valid_targets_mean": 5264.8,
"valid_targets_min": 3132
},
{
"epoch": 2.9871175523349436,
"grad_norm": 0.47657839693030885,
"learning_rate": 2.8360065191013967e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1967577189207077,
"step": 1855,
"valid_targets_mean": 5723.9,
"valid_targets_min": 3017
},
{
"epoch": 2.995169082125604,
"grad_norm": 0.4892874249873267,
"learning_rate": 2.8287043857254957e-05,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1871507167816162,
"step": 1860,
"valid_targets_mean": 6460.0,
"valid_targets_min": 2935
},
{
"epoch": 3.003220611916264,
"grad_norm": 0.5527497946640381,
"learning_rate": 2.8213888912834026e-05,
"loss": 0.2272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.258331298828125,
"step": 1865,
"valid_targets_mean": 5212.3,
"valid_targets_min": 987
},
{
"epoch": 3.0112721417069244,
"grad_norm": 0.5830002451186027,
"learning_rate": 2.814060153721644e-05,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2999268174171448,
"step": 1870,
"valid_targets_mean": 6001.2,
"valid_targets_min": 433
},
{
"epoch": 3.0193236714975846,
"grad_norm": 0.4500521340884674,
"learning_rate": 2.8067182912002663e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2809280753135681,
"step": 1875,
"valid_targets_mean": 6695.0,
"valid_targets_min": 3606
},
{
"epoch": 3.027375201288245,
"grad_norm": 0.4652104269522271,
"learning_rate": 2.7993634220909254e-05,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22316525876522064,
"step": 1880,
"valid_targets_mean": 5460.7,
"valid_targets_min": 284
},
{
"epoch": 3.035426731078905,
"grad_norm": 0.46090061714203895,
"learning_rate": 2.7919956649749826e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2710314095020294,
"step": 1885,
"valid_targets_mean": 6763.2,
"valid_targets_min": 3435
},
{
"epoch": 3.0434782608695654,
"grad_norm": 0.4611138651345071,
"learning_rate": 2.784615138641588e-05,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.242034912109375,
"step": 1890,
"valid_targets_mean": 6750.6,
"valid_targets_min": 3554
},
{
"epoch": 3.0515297906602252,
"grad_norm": 0.49645873562039455,
"learning_rate": 2.7772219620857685e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28464362025260925,
"step": 1895,
"valid_targets_mean": 6853.2,
"valid_targets_min": 4715
},
{
"epoch": 3.0595813204508855,
"grad_norm": 0.4950622875309601,
"learning_rate": 2.769816254506509e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2540530562400818,
"step": 1900,
"valid_targets_mean": 5465.6,
"valid_targets_min": 2485
},
{
"epoch": 3.0676328502415457,
"grad_norm": 0.4737619492864805,
"learning_rate": 2.76239813530483e-05,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2536058723926544,
"step": 1905,
"valid_targets_mean": 7040.4,
"valid_targets_min": 3642
},
{
"epoch": 3.075684380032206,
"grad_norm": 0.43563346257793917,
"learning_rate": 2.7549677240818628e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25332552194595337,
"step": 1910,
"valid_targets_mean": 6890.4,
"valid_targets_min": 3408
},
{
"epoch": 3.0837359098228663,
"grad_norm": 0.5538637159995918,
"learning_rate": 2.7475251406369197e-05,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27943116426467896,
"step": 1915,
"valid_targets_mean": 5696.9,
"valid_targets_min": 2285
},
{
"epoch": 3.0917874396135265,
"grad_norm": 0.502755804416658,
"learning_rate": 2.740070504965565e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2628275156021118,
"step": 1920,
"valid_targets_mean": 5780.6,
"valid_targets_min": 1991
},
{
"epoch": 3.099838969404187,
"grad_norm": 0.46642134348041764,
"learning_rate": 2.7326039372576782e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26721107959747314,
"step": 1925,
"valid_targets_mean": 5684.6,
"valid_targets_min": 2267
},
{
"epoch": 3.107890499194847,
"grad_norm": 0.4761056162555204,
"learning_rate": 2.7251255578955186e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24499773979187012,
"step": 1930,
"valid_targets_mean": 6097.4,
"valid_targets_min": 536
},
{
"epoch": 3.1159420289855073,
"grad_norm": 0.4574904350207186,
"learning_rate": 2.7176354874517805e-05,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2528035044670105,
"step": 1935,
"valid_targets_mean": 5954.2,
"valid_targets_min": 3071
},
{
"epoch": 3.1239935587761676,
"grad_norm": 0.5257344524597956,
"learning_rate": 2.7101338466876542e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25541383028030396,
"step": 1940,
"valid_targets_mean": 5115.2,
"valid_targets_min": 2196
},
{
"epoch": 3.132045088566828,
"grad_norm": 0.9148021670271776,
"learning_rate": 2.702620756550874e-05,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4044179320335388,
"step": 1945,
"valid_targets_mean": 2789.6,
"valid_targets_min": 1009
},
{
"epoch": 3.140096618357488,
"grad_norm": 0.8933463865740449,
"learning_rate": 2.6950963381737728e-05,
"loss": 0.4008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43537747859954834,
"step": 1950,
"valid_targets_mean": 3042.1,
"valid_targets_min": 1721
},
{
"epoch": 3.148148148148148,
"grad_norm": 0.7586492212375334,
"learning_rate": 2.687560712871325e-05,
"loss": 0.4051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40004706382751465,
"step": 1955,
"valid_targets_mean": 3377.2,
"valid_targets_min": 860
},
{
"epoch": 3.156199677938808,
"grad_norm": 0.8200189711325815,
"learning_rate": 2.6800140021391933e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42270979285240173,
"step": 1960,
"valid_targets_mean": 3314.4,
"valid_targets_min": 1619
},
{
"epoch": 3.1642512077294684,
"grad_norm": 0.7884155012819621,
"learning_rate": 2.6724563276517697e-05,
"loss": 0.3936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36296790838241577,
"step": 1965,
"valid_targets_mean": 3112.6,
"valid_targets_min": 1068
},
{
"epoch": 3.1723027375201287,
"grad_norm": 0.6764869788258896,
"learning_rate": 2.6648878112602115e-05,
"loss": 0.3728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35345786809921265,
"step": 1970,
"valid_targets_mean": 3572.9,
"valid_targets_min": 1413
},
{
"epoch": 3.180354267310789,
"grad_norm": 0.7225388514917793,
"learning_rate": 2.6573085749904784e-05,
"loss": 0.3774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39635008573532104,
"step": 1975,
"valid_targets_mean": 3774.3,
"valid_targets_min": 1338
},
{
"epoch": 3.1884057971014492,
"grad_norm": 0.8231423436666249,
"learning_rate": 2.6497187410413676e-05,
"loss": 0.3828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3863440752029419,
"step": 1980,
"valid_targets_mean": 2317.6,
"valid_targets_min": 1079
},
{
"epoch": 3.1964573268921095,
"grad_norm": 0.7285170435595408,
"learning_rate": 2.642118431782537e-05,
"loss": 0.3874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3951292335987091,
"step": 1985,
"valid_targets_mean": 3185.3,
"valid_targets_min": 985
},
{
"epoch": 3.2045088566827697,
"grad_norm": 0.7017080619872773,
"learning_rate": 2.6345077697525394e-05,
"loss": 0.3695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.347123384475708,
"step": 1990,
"valid_targets_mean": 3075.4,
"valid_targets_min": 1376
},
{
"epoch": 3.21256038647343,
"grad_norm": 0.8231794679729749,
"learning_rate": 2.6268868776568416e-05,
"loss": 0.4001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35584574937820435,
"step": 1995,
"valid_targets_mean": 2823.5,
"valid_targets_min": 1187
},
{
"epoch": 3.2206119162640903,
"grad_norm": 0.7683051537663695,
"learning_rate": 2.619255878365849e-05,
"loss": 0.3626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33899423480033875,
"step": 2000,
"valid_targets_mean": 3121.4,
"valid_targets_min": 1260
},
{
"epoch": 3.2286634460547505,
"grad_norm": 1.0228623510526746,
"learning_rate": 2.6116148949129237e-05,
"loss": 0.3926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3965111970901489,
"step": 2005,
"valid_targets_mean": 3859.0,
"valid_targets_min": 1457
},
{
"epoch": 3.236714975845411,
"grad_norm": 0.8910998328193267,
"learning_rate": 2.603964050492401e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4256768822669983,
"step": 2010,
"valid_targets_mean": 2689.9,
"valid_targets_min": 909
},
{
"epoch": 3.244766505636071,
"grad_norm": 0.7345012383668745,
"learning_rate": 2.5963034684576024e-05,
"loss": 0.3855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3804903030395508,
"step": 2015,
"valid_targets_mean": 3814.0,
"valid_targets_min": 1182
},
{
"epoch": 3.2528180354267313,
"grad_norm": 0.7678805707006796,
"learning_rate": 2.5886332723188484e-05,
"loss": 0.3777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36300283670425415,
"step": 2020,
"valid_targets_mean": 3139.2,
"valid_targets_min": 999
},
{
"epoch": 3.260869565217391,
"grad_norm": 0.8103254411230125,
"learning_rate": 2.5809535857414637e-05,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3861234784126282,
"step": 2025,
"valid_targets_mean": 3032.6,
"valid_targets_min": 1346
},
{
"epoch": 3.2689210950080514,
"grad_norm": 0.8485120319760017,
"learning_rate": 2.573264532543788e-05,
"loss": 0.3716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.399763822555542,
"step": 2030,
"valid_targets_mean": 2960.4,
"valid_targets_min": 1292
},
{
"epoch": 3.2769726247987117,
"grad_norm": 0.7941028816750529,
"learning_rate": 2.5655662366951778e-05,
"loss": 0.3836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38156741857528687,
"step": 2035,
"valid_targets_mean": 3008.5,
"valid_targets_min": 1031
},
{
"epoch": 3.285024154589372,
"grad_norm": 0.7517179718878059,
"learning_rate": 2.557858822314007e-05,
"loss": 0.3784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3794868588447571,
"step": 2040,
"valid_targets_mean": 2940.0,
"valid_targets_min": 1404
},
{
"epoch": 3.293075684380032,
"grad_norm": 0.7474671950243801,
"learning_rate": 2.5501424136656635e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3578556180000305,
"step": 2045,
"valid_targets_mean": 2994.5,
"valid_targets_min": 1383
},
{
"epoch": 3.3011272141706924,
"grad_norm": 0.8073459873948605,
"learning_rate": 2.5424171351605518e-05,
"loss": 0.3917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35137873888015747,
"step": 2050,
"valid_targets_mean": 2981.6,
"valid_targets_min": 1013
},
{
"epoch": 3.3091787439613527,
"grad_norm": 0.7363545984797931,
"learning_rate": 2.5346831113520827e-05,
"loss": 0.3558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33045268058776855,
"step": 2055,
"valid_targets_mean": 2965.2,
"valid_targets_min": 1119
},
{
"epoch": 3.317230273752013,
"grad_norm": 0.8551622649502074,
"learning_rate": 2.526940466934664e-05,
"loss": 0.3791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4106612801551819,
"step": 2060,
"valid_targets_mean": 2819.8,
"valid_targets_min": 1638
},
{
"epoch": 3.325281803542673,
"grad_norm": 0.8197438218947848,
"learning_rate": 2.5191893267416964e-05,
"loss": 0.3761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35730135440826416,
"step": 2065,
"valid_targets_mean": 3237.6,
"valid_targets_min": 1255
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.8675787777451592,
"learning_rate": 2.5114298157435526e-05,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3833295404911041,
"step": 2070,
"valid_targets_mean": 3031.8,
"valid_targets_min": 1244
},
{
"epoch": 3.3413848631239937,
"grad_norm": 0.7989238817393547,
"learning_rate": 2.503662059045568e-05,
"loss": 0.3959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39606934785842896,
"step": 2075,
"valid_targets_mean": 2751.6,
"valid_targets_min": 1349
},
{
"epoch": 3.3494363929146536,
"grad_norm": 0.7649931205299405,
"learning_rate": 2.4958861818860217e-05,
"loss": 0.3756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3948572874069214,
"step": 2080,
"valid_targets_mean": 2998.9,
"valid_targets_min": 1344
},
{
"epoch": 3.357487922705314,
"grad_norm": 0.6957699032853977,
"learning_rate": 2.488102309634119e-05,
"loss": 0.3733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36002251505851746,
"step": 2085,
"valid_targets_mean": 3551.8,
"valid_targets_min": 1310
},
{
"epoch": 3.365539452495974,
"grad_norm": 0.8172302341279781,
"learning_rate": 2.480310567787967e-05,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3608362078666687,
"step": 2090,
"valid_targets_mean": 2457.2,
"valid_targets_min": 1285
},
{
"epoch": 3.3735909822866343,
"grad_norm": 0.6603911880036989,
"learning_rate": 2.4725110819725542e-05,
"loss": 0.3467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34838154911994934,
"step": 2095,
"valid_targets_mean": 4338.5,
"valid_targets_min": 1915
},
{
"epoch": 3.3816425120772946,
"grad_norm": 0.7013111479678409,
"learning_rate": 2.464703977937723e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3159921169281006,
"step": 2100,
"valid_targets_mean": 3443.4,
"valid_targets_min": 1224
},
{
"epoch": 3.389694041867955,
"grad_norm": 0.7271690127494458,
"learning_rate": 2.456889381556144e-05,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3470936417579651,
"step": 2105,
"valid_targets_mean": 3482.4,
"valid_targets_min": 1451
},
{
"epoch": 3.397745571658615,
"grad_norm": 0.6846909480553407,
"learning_rate": 2.449067418821285e-05,
"loss": 0.3453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3760640025138855,
"step": 2110,
"valid_targets_mean": 3535.4,
"valid_targets_min": 1258
},
{
"epoch": 3.4057971014492754,
"grad_norm": 0.6498807742334415,
"learning_rate": 2.4412382158453807e-05,
"loss": 0.3209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31845319271087646,
"step": 2115,
"valid_targets_mean": 3810.8,
"valid_targets_min": 1412
},
{
"epoch": 3.4138486312399356,
"grad_norm": 0.7280328109327153,
"learning_rate": 2.4334018988573983e-05,
"loss": 0.3395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33589398860931396,
"step": 2120,
"valid_targets_mean": 3309.2,
"valid_targets_min": 815
},
{
"epoch": 3.421900161030596,
"grad_norm": 0.5931265791786551,
"learning_rate": 2.425558594201004e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26291149854660034,
"step": 2125,
"valid_targets_mean": 4325.1,
"valid_targets_min": 1575
},
{
"epoch": 3.429951690821256,
"grad_norm": 0.7111318648584927,
"learning_rate": 2.417708428332525e-05,
"loss": 0.3171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34463876485824585,
"step": 2130,
"valid_targets_mean": 3129.6,
"valid_targets_min": 1545
},
{
"epoch": 3.4380032206119164,
"grad_norm": 0.6250487281091418,
"learning_rate": 2.4098515278189097e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3047589063644409,
"step": 2135,
"valid_targets_mean": 4161.9,
"valid_targets_min": 1557
},
{
"epoch": 3.4460547504025767,
"grad_norm": 0.626198180719724,
"learning_rate": 2.4019880193356902e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3424261808395386,
"step": 2140,
"valid_targets_mean": 3786.2,
"valid_targets_min": 1129
},
{
"epoch": 3.454106280193237,
"grad_norm": 0.6155081722038326,
"learning_rate": 2.3941180296649348e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31505197286605835,
"step": 2145,
"valid_targets_mean": 4313.6,
"valid_targets_min": 1130
},
{
"epoch": 3.4621578099838968,
"grad_norm": 0.6956667846707119,
"learning_rate": 2.3862416856932087e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32704436779022217,
"step": 2150,
"valid_targets_mean": 3571.6,
"valid_targets_min": 1459
},
{
"epoch": 3.470209339774557,
"grad_norm": 0.7061438709341965,
"learning_rate": 2.378359114409527e-05,
"loss": 0.334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3402191996574402,
"step": 2155,
"valid_targets_mean": 3576.9,
"valid_targets_min": 1717
},
{
"epoch": 3.4782608695652173,
"grad_norm": 0.6733367985439651,
"learning_rate": 2.370470442903306e-05,
"loss": 0.3334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29829442501068115,
"step": 2160,
"valid_targets_mean": 3445.9,
"valid_targets_min": 1340
},
{
"epoch": 3.4863123993558776,
"grad_norm": 0.7199769182800366,
"learning_rate": 2.362575798362315e-05,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3266036808490753,
"step": 2165,
"valid_targets_mean": 3381.9,
"valid_targets_min": 968
},
{
"epoch": 3.494363929146538,
"grad_norm": 0.762977409147056,
"learning_rate": 2.3546753080706242e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32624316215515137,
"step": 2170,
"valid_targets_mean": 3398.4,
"valid_targets_min": 732
},
{
"epoch": 3.502415458937198,
"grad_norm": 0.7356969210292927,
"learning_rate": 2.346769099406557e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3401956260204315,
"step": 2175,
"valid_targets_mean": 3281.4,
"valid_targets_min": 1153
},
{
"epoch": 3.5104669887278583,
"grad_norm": 0.6884173861250173,
"learning_rate": 2.33885729984063e-05,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33478766679763794,
"step": 2180,
"valid_targets_mean": 3259.2,
"valid_targets_min": 1348
},
{
"epoch": 3.5185185185185186,
"grad_norm": 0.6833192926719988,
"learning_rate": 2.3309400369335033e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29600557684898376,
"step": 2185,
"valid_targets_mean": 3833.4,
"valid_targets_min": 1495
},
{
"epoch": 3.526570048309179,
"grad_norm": 0.6951855497662062,
"learning_rate": 2.3230174383339196e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3087206780910492,
"step": 2190,
"valid_targets_mean": 3652.0,
"valid_targets_min": 1088
},
{
"epoch": 3.534621578099839,
"grad_norm": 0.6613560062519789,
"learning_rate": 2.3150896317766505e-05,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2983492612838745,
"step": 2195,
"valid_targets_mean": 3762.8,
"valid_targets_min": 1512
},
{
"epoch": 3.542673107890499,
"grad_norm": 0.68550903113913,
"learning_rate": 2.3071567450804325e-05,
"loss": 0.3477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35058295726776123,
"step": 2200,
"valid_targets_mean": 3278.4,
"valid_targets_min": 1405
},
{
"epoch": 3.550724637681159,
"grad_norm": 0.8603392885960655,
"learning_rate": 2.299218906145909e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34910333156585693,
"step": 2205,
"valid_targets_mean": 2441.1,
"valid_targets_min": 1235
},
{
"epoch": 3.5587761674718195,
"grad_norm": 0.6801260592469724,
"learning_rate": 2.2912762429535684e-05,
"loss": 0.2986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2981488108634949,
"step": 2210,
"valid_targets_mean": 3300.4,
"valid_targets_min": 1317
},
{
"epoch": 3.5668276972624797,
"grad_norm": 0.7979499575329786,
"learning_rate": 2.2833288835616784e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3507813513278961,
"step": 2215,
"valid_targets_mean": 3180.9,
"valid_targets_min": 1377
},
{
"epoch": 3.57487922705314,
"grad_norm": 0.7589237518218688,
"learning_rate": 2.2753769561042235e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2893664240837097,
"step": 2220,
"valid_targets_mean": 2736.6,
"valid_targets_min": 1348
},
{
"epoch": 3.5829307568438002,
"grad_norm": 0.7842484155012712,
"learning_rate": 2.2674205887888386e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34598594903945923,
"step": 2225,
"valid_targets_mean": 2817.1,
"valid_targets_min": 1021
},
{
"epoch": 3.5909822866344605,
"grad_norm": 0.7553985888978503,
"learning_rate": 2.259459909894742e-05,
"loss": 0.3366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3397219777107239,
"step": 2230,
"valid_targets_mean": 3038.3,
"valid_targets_min": 1150
},
{
"epoch": 3.5990338164251208,
"grad_norm": 0.6631101299213469,
"learning_rate": 2.2514950477706657e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2631319761276245,
"step": 2235,
"valid_targets_mean": 3378.8,
"valid_targets_min": 1412
},
{
"epoch": 3.607085346215781,
"grad_norm": 0.6917879399712983,
"learning_rate": 2.2435261308327875e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2921825051307678,
"step": 2240,
"valid_targets_mean": 3375.1,
"valid_targets_min": 950
},
{
"epoch": 3.6151368760064413,
"grad_norm": 0.6646988908267994,
"learning_rate": 2.2355532875626612e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28387004137039185,
"step": 2245,
"valid_targets_mean": 3651.2,
"valid_targets_min": 938
},
{
"epoch": 3.6231884057971016,
"grad_norm": 0.7566641430033721,
"learning_rate": 2.2275766465051444e-05,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3653978705406189,
"step": 2250,
"valid_targets_mean": 3000.1,
"valid_targets_min": 937
},
{
"epoch": 3.631239935587762,
"grad_norm": 0.640762301083058,
"learning_rate": 2.2195963362663236e-05,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2885698080062866,
"step": 2255,
"valid_targets_mean": 4016.1,
"valid_targets_min": 1710
},
{
"epoch": 3.639291465378422,
"grad_norm": 0.7312405714684358,
"learning_rate": 2.211612485511446e-05,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3239280581474304,
"step": 2260,
"valid_targets_mean": 3113.6,
"valid_targets_min": 1036
},
{
"epoch": 3.6473429951690823,
"grad_norm": 0.6797552789086924,
"learning_rate": 2.2036252229628392e-05,
"loss": 0.3208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30023393034935,
"step": 2265,
"valid_targets_mean": 3113.1,
"valid_targets_min": 1421
},
{
"epoch": 3.6553945249597426,
"grad_norm": 0.7033890984196507,
"learning_rate": 2.19563467739784e-05,
"loss": 0.3128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33096373081207275,
"step": 2270,
"valid_targets_mean": 3861.4,
"valid_targets_min": 1570
},
{
"epoch": 3.6634460547504024,
"grad_norm": 0.693299418919331,
"learning_rate": 2.1876409776467165e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31812596321105957,
"step": 2275,
"valid_targets_mean": 3224.8,
"valid_targets_min": 1644
},
{
"epoch": 3.6714975845410627,
"grad_norm": 0.7050830766977225,
"learning_rate": 2.1796442525905923e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2968364953994751,
"step": 2280,
"valid_targets_mean": 3072.1,
"valid_targets_min": 1239
},
{
"epoch": 3.679549114331723,
"grad_norm": 0.7092053234510587,
"learning_rate": 2.171644631159366e-05,
"loss": 0.3251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33621740341186523,
"step": 2285,
"valid_targets_mean": 3552.6,
"valid_targets_min": 1180
},
{
"epoch": 3.687600644122383,
"grad_norm": 0.7327779149808457,
"learning_rate": 2.163642242329633e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3615042567253113,
"step": 2290,
"valid_targets_mean": 3199.9,
"valid_targets_min": 1402
},
{
"epoch": 3.6956521739130435,
"grad_norm": 0.6747000049468731,
"learning_rate": 2.1556372151226097e-05,
"loss": 0.3444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30473870038986206,
"step": 2295,
"valid_targets_mean": 3625.8,
"valid_targets_min": 1668
},
{
"epoch": 3.7037037037037037,
"grad_norm": 0.6905439473556321,
"learning_rate": 2.1476296786020502e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3153340816497803,
"step": 2300,
"valid_targets_mean": 3234.1,
"valid_targets_min": 1476
},
{
"epoch": 3.711755233494364,
"grad_norm": 0.757410046151389,
"learning_rate": 2.139619761872163e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32494598627090454,
"step": 2305,
"valid_targets_mean": 3108.1,
"valid_targets_min": 1329
},
{
"epoch": 3.7198067632850242,
"grad_norm": 0.6333814485490104,
"learning_rate": 2.1316075940755363e-05,
"loss": 0.3101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30045998096466064,
"step": 2310,
"valid_targets_mean": 4108.0,
"valid_targets_min": 1439
},
{
"epoch": 3.7278582930756845,
"grad_norm": 0.8569424628003814,
"learning_rate": 2.1235933043910488e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3410085439682007,
"step": 2315,
"valid_targets_mean": 2746.4,
"valid_targets_min": 965
},
{
"epoch": 3.7359098228663448,
"grad_norm": 0.7003250678607069,
"learning_rate": 2.1155770220317918e-05,
"loss": 0.3087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29915452003479004,
"step": 2320,
"valid_targets_mean": 3250.2,
"valid_targets_min": 1373
},
{
"epoch": 3.7439613526570046,
"grad_norm": 0.731064940807403,
"learning_rate": 2.107558876242983e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.330859899520874,
"step": 2325,
"valid_targets_mean": 3688.2,
"valid_targets_min": 1267
},
{
"epoch": 3.752012882447665,
"grad_norm": 0.6231472245606579,
"learning_rate": 2.0995389962998845e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20000654458999634,
"step": 2330,
"valid_targets_mean": 4773.8,
"valid_targets_min": 1417
},
{
"epoch": 3.760064412238325,
"grad_norm": 1.1067173824667762,
"learning_rate": 2.091517511505719e-05,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1921842396259308,
"step": 2335,
"valid_targets_mean": 5335.0,
"valid_targets_min": 2383
},
{
"epoch": 3.7681159420289854,
"grad_norm": 0.4630108390914341,
"learning_rate": 2.0834945511895816e-05,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1726524531841278,
"step": 2340,
"valid_targets_mean": 5678.3,
"valid_targets_min": 2928
},
{
"epoch": 3.7761674718196456,
"grad_norm": 0.5122162205986636,
"learning_rate": 2.0754702447043585e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21546904742717743,
"step": 2345,
"valid_targets_mean": 6460.8,
"valid_targets_min": 2335
},
{
"epoch": 3.784219001610306,
"grad_norm": 0.43207305254475,
"learning_rate": 2.0674447214246394e-05,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15075618028640747,
"step": 2350,
"valid_targets_mean": 6145.8,
"valid_targets_min": 3540
},
{
"epoch": 3.792270531400966,
"grad_norm": 0.4774154606281994,
"learning_rate": 2.059418110744633e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17323094606399536,
"step": 2355,
"valid_targets_mean": 5129.8,
"valid_targets_min": 3650
},
{
"epoch": 3.8003220611916264,
"grad_norm": 0.46983051174721563,
"learning_rate": 2.0513905420760798e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1917821168899536,
"step": 2360,
"valid_targets_mean": 6283.1,
"valid_targets_min": 3367
},
{
"epoch": 3.8083735909822867,
"grad_norm": 0.4902336033194191,
"learning_rate": 2.043362144846164e-05,
"loss": 0.1973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25147587060928345,
"step": 2365,
"valid_targets_mean": 5965.1,
"valid_targets_min": 3021
},
{
"epoch": 3.816425120772947,
"grad_norm": 0.42280694124833545,
"learning_rate": 2.035333048495431e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20615729689598083,
"step": 2370,
"valid_targets_mean": 7093.3,
"valid_targets_min": 2985
},
{
"epoch": 3.824476650563607,
"grad_norm": 0.4889232418853953,
"learning_rate": 2.0273033824756964e-05,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2106115221977234,
"step": 2375,
"valid_targets_mean": 5944.9,
"valid_targets_min": 3130
},
{
"epoch": 3.8325281803542675,
"grad_norm": 0.4486166262691516,
"learning_rate": 2.0192732762479616e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20369920134544373,
"step": 2380,
"valid_targets_mean": 6768.1,
"valid_targets_min": 2346
},
{
"epoch": 3.8405797101449277,
"grad_norm": 0.5052893828675203,
"learning_rate": 2.011242859280325e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20773877203464508,
"step": 2385,
"valid_targets_mean": 5635.4,
"valid_targets_min": 3421
},
{
"epoch": 3.848631239935588,
"grad_norm": 0.552069432523759,
"learning_rate": 2.0032122610458947e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16113221645355225,
"step": 2390,
"valid_targets_mean": 4650.4,
"valid_targets_min": 2970
},
{
"epoch": 3.8566827697262482,
"grad_norm": 0.524046615447888,
"learning_rate": 1.9951816110207004e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20094186067581177,
"step": 2395,
"valid_targets_mean": 5519.9,
"valid_targets_min": 3054
},
{
"epoch": 3.864734299516908,
"grad_norm": 0.48693523721557375,
"learning_rate": 1.9871510386816103e-05,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18589508533477783,
"step": 2400,
"valid_targets_mean": 6197.9,
"valid_targets_min": 3424
},
{
"epoch": 3.8727858293075683,
"grad_norm": 0.49674650842025453,
"learning_rate": 1.979120673504235e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16874763369560242,
"step": 2405,
"valid_targets_mean": 5672.4,
"valid_targets_min": 3860
},
{
"epoch": 3.8808373590982286,
"grad_norm": 0.5935011533211295,
"learning_rate": 1.9710906449608498e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16884219646453857,
"step": 2410,
"valid_targets_mean": 5892.7,
"valid_targets_min": 2898
},
{
"epoch": 3.888888888888889,
"grad_norm": 0.4678758596506749,
"learning_rate": 1.9630610825182992e-05,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1843390017747879,
"step": 2415,
"valid_targets_mean": 5762.8,
"valid_targets_min": 3670
},
{
"epoch": 3.896940418679549,
"grad_norm": 0.466433159436347,
"learning_rate": 1.955032115635915e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16634991765022278,
"step": 2420,
"valid_targets_mean": 6079.9,
"valid_targets_min": 3135
},
{
"epoch": 3.9049919484702094,
"grad_norm": 0.4703450305531825,
"learning_rate": 1.9470038737634257e-05,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18430741131305695,
"step": 2425,
"valid_targets_mean": 5954.4,
"valid_targets_min": 2502
},
{
"epoch": 3.9130434782608696,
"grad_norm": 0.4988164707549782,
"learning_rate": 1.9389764863388706e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18756403028964996,
"step": 2430,
"valid_targets_mean": 5311.7,
"valid_targets_min": 3278
},
{
"epoch": 3.92109500805153,
"grad_norm": 0.4630341885874764,
"learning_rate": 1.9309500827865136e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15896305441856384,
"step": 2435,
"valid_targets_mean": 5995.9,
"valid_targets_min": 2819
},
{
"epoch": 3.92914653784219,
"grad_norm": 0.4913791539120621,
"learning_rate": 1.9229247925147553e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16495642066001892,
"step": 2440,
"valid_targets_mean": 5220.8,
"valid_targets_min": 3358
},
{
"epoch": 3.9371980676328504,
"grad_norm": 0.46392543060132874,
"learning_rate": 1.9149007449140462e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17253006994724274,
"step": 2445,
"valid_targets_mean": 4946.7,
"valid_targets_min": 2665
},
{
"epoch": 3.9452495974235102,
"grad_norm": 0.4222579875698941,
"learning_rate": 1.906878069354804e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16640131175518036,
"step": 2450,
"valid_targets_mean": 6109.9,
"valid_targets_min": 2762
},
{
"epoch": 3.9533011272141705,
"grad_norm": 0.5936694712109022,
"learning_rate": 1.898856895185322e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1677541732788086,
"step": 2455,
"valid_targets_mean": 5266.1,
"valid_targets_min": 3731
},
{
"epoch": 3.9613526570048307,
"grad_norm": 0.5089530035696851,
"learning_rate": 1.8908373517296888e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17881962656974792,
"step": 2460,
"valid_targets_mean": 6246.1,
"valid_targets_min": 2970
},
{
"epoch": 3.969404186795491,
"grad_norm": 0.4163908705213259,
"learning_rate": 1.882819568285701e-05,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16383564472198486,
"step": 2465,
"valid_targets_mean": 6126.9,
"valid_targets_min": 3345
},
{
"epoch": 3.9774557165861513,
"grad_norm": 0.5352174387805062,
"learning_rate": 1.874803674122778e-05,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1686192899942398,
"step": 2470,
"valid_targets_mean": 5409.5,
"valid_targets_min": 2785
},
{
"epoch": 3.9855072463768115,
"grad_norm": 0.5174379593558874,
"learning_rate": 1.8667897984798804e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20292040705680847,
"step": 2475,
"valid_targets_mean": 6526.0,
"valid_targets_min": 3724
},
{
"epoch": 3.993558776167472,
"grad_norm": 0.46174047001815965,
"learning_rate": 1.858778070563422e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1856258511543274,
"step": 2480,
"valid_targets_mean": 5751.2,
"valid_targets_min": 3683
},
{
"epoch": 4.001610305958132,
"grad_norm": 0.486458689377258,
"learning_rate": 1.8507686195451918e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22269584238529205,
"step": 2485,
"valid_targets_mean": 6743.1,
"valid_targets_min": 2494
},
{
"epoch": 4.009661835748792,
"grad_norm": 0.49067053864038795,
"learning_rate": 1.8427615745602667e-05,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24867583811283112,
"step": 2490,
"valid_targets_mean": 6679.0,
"valid_targets_min": 2802
},
{
"epoch": 4.017713365539453,
"grad_norm": 0.48082700217324775,
"learning_rate": 1.834757064704933e-05,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2587515413761139,
"step": 2495,
"valid_targets_mean": 6534.6,
"valid_targets_min": 2100
},
{
"epoch": 4.025764895330113,
"grad_norm": 0.463238335944571,
"learning_rate": 1.826755219034603e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24451354146003723,
"step": 2500,
"valid_targets_mean": 6190.5,
"valid_targets_min": 2430
},
{
"epoch": 4.033816425120773,
"grad_norm": 0.47115946029794054,
"learning_rate": 1.818756166561733e-05,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2353125512599945,
"step": 2505,
"valid_targets_mean": 6432.6,
"valid_targets_min": 1969
},
{
"epoch": 4.041867954911433,
"grad_norm": 0.5556347094263723,
"learning_rate": 1.8107600362537473e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25839778780937195,
"step": 2510,
"valid_targets_mean": 4996.2,
"valid_targets_min": 695
},
{
"epoch": 4.049919484702094,
"grad_norm": 0.4828357803593343,
"learning_rate": 1.8027669570309572e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28702059388160706,
"step": 2515,
"valid_targets_mean": 7438.4,
"valid_targets_min": 3650
},
{
"epoch": 4.057971014492754,
"grad_norm": 0.4732689439450728,
"learning_rate": 1.7947770577644787e-05,
"loss": 0.2576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24621464312076569,
"step": 2520,
"valid_targets_mean": 5771.1,
"valid_targets_min": 2778
},
{
"epoch": 4.066022544283414,
"grad_norm": 0.51704075854913,
"learning_rate": 1.786790467274161e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27112066745758057,
"step": 2525,
"valid_targets_mean": 6732.4,
"valid_targets_min": 880
},
{
"epoch": 4.074074074074074,
"grad_norm": 0.4888484890427802,
"learning_rate": 1.778807314326505e-05,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2849244475364685,
"step": 2530,
"valid_targets_mean": 6322.0,
"valid_targets_min": 2822
},
{
"epoch": 4.082125603864735,
"grad_norm": 0.5118382404505906,
"learning_rate": 1.7708277276325886e-05,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2283010631799698,
"step": 2535,
"valid_targets_mean": 6036.7,
"valid_targets_min": 1334
},
{
"epoch": 4.090177133655395,
"grad_norm": 0.47873074069899385,
"learning_rate": 1.762851835845992e-05,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20961812138557434,
"step": 2540,
"valid_targets_mean": 5966.9,
"valid_targets_min": 3109
},
{
"epoch": 4.098228663446055,
"grad_norm": 0.5079150029764018,
"learning_rate": 1.754879767560723e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23400455713272095,
"step": 2545,
"valid_targets_mean": 5874.7,
"valid_targets_min": 2080
},
{
"epoch": 4.106280193236715,
"grad_norm": 0.4709937790052201,
"learning_rate": 1.746911651309144e-05,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23563805222511292,
"step": 2550,
"valid_targets_mean": 5984.3,
"valid_targets_min": 2278
},
{
"epoch": 4.114331723027375,
"grad_norm": 0.5582460016862327,
"learning_rate": 1.7389476155598974e-05,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261229932308197,
"step": 2555,
"valid_targets_mean": 4817.7,
"valid_targets_min": 1991
},
{
"epoch": 4.122383252818035,
"grad_norm": 0.4613472981940905,
"learning_rate": 1.7309877887158388e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22766956686973572,
"step": 2560,
"valid_targets_mean": 6135.9,
"valid_targets_min": 1736
},
{
"epoch": 4.130434782608695,
"grad_norm": 0.5809580379347714,
"learning_rate": 1.723032299111964e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2500440180301666,
"step": 2565,
"valid_targets_mean": 5818.6,
"valid_targets_min": 2083
},
{
"epoch": 4.138486312399356,
"grad_norm": 0.9151207208782325,
"learning_rate": 1.7150812750133382e-05,
"loss": 0.3601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3996202051639557,
"step": 2570,
"valid_targets_mean": 3210.2,
"valid_targets_min": 1526
},
{
"epoch": 4.146537842190016,
"grad_norm": 0.8283372169743392,
"learning_rate": 1.707134844613032e-05,
"loss": 0.3757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34221383929252625,
"step": 2575,
"valid_targets_mean": 2571.2,
"valid_targets_min": 1220
},
{
"epoch": 4.154589371980676,
"grad_norm": 0.7100117027673157,
"learning_rate": 1.699193136030052e-05,
"loss": 0.3546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34208422899246216,
"step": 2580,
"valid_targets_mean": 3851.6,
"valid_targets_min": 1610
},
{
"epoch": 4.162640901771336,
"grad_norm": 0.7684487763500514,
"learning_rate": 1.6912562773072765e-05,
"loss": 0.3701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3207693099975586,
"step": 2585,
"valid_targets_mean": 3207.0,
"valid_targets_min": 1232
},
{
"epoch": 4.170692431561997,
"grad_norm": 0.8557363619696622,
"learning_rate": 1.6833243964093877e-05,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3694392144680023,
"step": 2590,
"valid_targets_mean": 2929.4,
"valid_targets_min": 1174
},
{
"epoch": 4.178743961352657,
"grad_norm": 0.8161354731224225,
"learning_rate": 1.6753976212208137e-05,
"loss": 0.3345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3618141710758209,
"step": 2595,
"valid_targets_mean": 3058.9,
"valid_targets_min": 1415
},
{
"epoch": 4.186795491143317,
"grad_norm": 0.7945413438871889,
"learning_rate": 1.667476079543664e-05,
"loss": 0.3499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3769470155239105,
"step": 2600,
"valid_targets_mean": 3233.4,
"valid_targets_min": 910
},
{
"epoch": 4.194847020933977,
"grad_norm": 0.7506914826900978,
"learning_rate": 1.659559899095667e-05,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3336166739463806,
"step": 2605,
"valid_targets_mean": 3071.4,
"valid_targets_min": 1422
},
{
"epoch": 4.202898550724638,
"grad_norm": 0.8680474470245183,
"learning_rate": 1.651649207508114e-05,
"loss": 0.3423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3558621406555176,
"step": 2610,
"valid_targets_mean": 2435.2,
"valid_targets_min": 1299
},
{
"epoch": 4.210950080515298,
"grad_norm": 0.850673248513953,
"learning_rate": 1.643744132323801e-05,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3782421946525574,
"step": 2615,
"valid_targets_mean": 2803.0,
"valid_targets_min": 1129
},
{
"epoch": 4.219001610305958,
"grad_norm": 0.9623854143221985,
"learning_rate": 1.6358448009949714e-05,
"loss": 0.3289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3601483106613159,
"step": 2620,
"valid_targets_mean": 2628.6,
"valid_targets_min": 1147
},
{
"epoch": 4.2270531400966185,
"grad_norm": 0.7298752703256921,
"learning_rate": 1.6279513408812603e-05,
"loss": 0.3494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3530423641204834,
"step": 2625,
"valid_targets_mean": 3935.0,
"valid_targets_min": 1136
},
{
"epoch": 4.235104669887279,
"grad_norm": 0.7922927416603631,
"learning_rate": 1.620063879247643e-05,
"loss": 0.357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33408689498901367,
"step": 2630,
"valid_targets_mean": 2861.8,
"valid_targets_min": 1352
},
{
"epoch": 4.243156199677939,
"grad_norm": 0.8225640040752034,
"learning_rate": 1.6121825432623827e-05,
"loss": 0.3569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34123361110687256,
"step": 2635,
"valid_targets_mean": 2913.5,
"valid_targets_min": 1603
},
{
"epoch": 4.251207729468599,
"grad_norm": 0.862014730987376,
"learning_rate": 1.6043074599949785e-05,
"loss": 0.3476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35428357124328613,
"step": 2640,
"valid_targets_mean": 2604.4,
"valid_targets_min": 1216
},
{
"epoch": 4.2592592592592595,
"grad_norm": 0.8556648106440016,
"learning_rate": 1.5964387564141192e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.339069128036499,
"step": 2645,
"valid_targets_mean": 3359.8,
"valid_targets_min": 1454
},
{
"epoch": 4.26731078904992,
"grad_norm": 0.849595092751884,
"learning_rate": 1.588576559385635e-05,
"loss": 0.3321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3184316158294678,
"step": 2650,
"valid_targets_mean": 2601.7,
"valid_targets_min": 1398
},
{
"epoch": 4.27536231884058,
"grad_norm": 0.7834684766024429,
"learning_rate": 1.5807209956704505e-05,
"loss": 0.3522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3305340111255646,
"step": 2655,
"valid_targets_mean": 3171.8,
"valid_targets_min": 1293
},
{
"epoch": 4.28341384863124,
"grad_norm": 0.8658423398271352,
"learning_rate": 1.5728721919225428e-05,
"loss": 0.3447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35852861404418945,
"step": 2660,
"valid_targets_mean": 3561.2,
"valid_targets_min": 995
},
{
"epoch": 4.291465378421901,
"grad_norm": 0.7999552824406122,
"learning_rate": 1.5650302746869004e-05,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3435271978378296,
"step": 2665,
"valid_targets_mean": 3375.6,
"valid_targets_min": 1027
},
{
"epoch": 4.29951690821256,
"grad_norm": 0.8649636583204158,
"learning_rate": 1.5571953703974813e-05,
"loss": 0.3578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37238696217536926,
"step": 2670,
"valid_targets_mean": 2952.2,
"valid_targets_min": 1455
},
{
"epoch": 4.30756843800322,
"grad_norm": 0.8745862341667207,
"learning_rate": 1.5493676053751747e-05,
"loss": 0.328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36845505237579346,
"step": 2675,
"valid_targets_mean": 3117.5,
"valid_targets_min": 1411
},
{
"epoch": 4.3156199677938805,
"grad_norm": 0.9341881778545614,
"learning_rate": 1.5415471058257638e-05,
"loss": 0.329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37140941619873047,
"step": 2680,
"valid_targets_mean": 2730.5,
"valid_targets_min": 1549
},
{
"epoch": 4.323671497584541,
"grad_norm": 0.9405657665431416,
"learning_rate": 1.533733997837893e-05,
"loss": 0.3553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3740704655647278,
"step": 2685,
"valid_targets_mean": 2825.3,
"valid_targets_min": 1180
},
{
"epoch": 4.331723027375201,
"grad_norm": 0.7710353538662376,
"learning_rate": 1.5259284073810333e-05,
"loss": 0.3317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32604238390922546,
"step": 2690,
"valid_targets_mean": 3510.8,
"valid_targets_min": 1347
},
{
"epoch": 4.339774557165861,
"grad_norm": 0.781426537140954,
"learning_rate": 1.5181304603034513e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37608543038368225,
"step": 2695,
"valid_targets_mean": 3150.6,
"valid_targets_min": 877
},
{
"epoch": 4.3478260869565215,
"grad_norm": 0.7237047762120449,
"learning_rate": 1.5103402823301819e-05,
"loss": 0.34,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33800530433654785,
"step": 2700,
"valid_targets_mean": 3118.8,
"valid_targets_min": 1146
},
{
"epoch": 4.355877616747182,
"grad_norm": 0.7630896900796991,
"learning_rate": 1.5025579990609973e-05,
"loss": 0.3471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3303137421607971,
"step": 2705,
"valid_targets_mean": 3119.9,
"valid_targets_min": 1082
},
{
"epoch": 4.363929146537842,
"grad_norm": 0.8601788048234646,
"learning_rate": 1.4947837359683882e-05,
"loss": 0.3547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3552572727203369,
"step": 2710,
"valid_targets_mean": 2656.8,
"valid_targets_min": 1224
},
{
"epoch": 4.371980676328502,
"grad_norm": 0.7820969944556317,
"learning_rate": 1.487017618395534e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.309645414352417,
"step": 2715,
"valid_targets_mean": 3481.2,
"valid_targets_min": 1468
},
{
"epoch": 4.3800322061191626,
"grad_norm": 0.7637150424395313,
"learning_rate": 1.479259771554288e-05,
"loss": 0.3188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34639042615890503,
"step": 2720,
"valid_targets_mean": 3636.6,
"valid_targets_min": 784
},
{
"epoch": 4.388083735909823,
"grad_norm": 0.6908525532816608,
"learning_rate": 1.4715103205231545e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.327004075050354,
"step": 2725,
"valid_targets_mean": 4069.1,
"valid_targets_min": 1625
},
{
"epoch": 4.396135265700483,
"grad_norm": 0.6634760061573296,
"learning_rate": 1.463769390245273e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30868253111839294,
"step": 2730,
"valid_targets_mean": 4105.0,
"valid_targets_min": 1173
},
{
"epoch": 4.404186795491143,
"grad_norm": 0.6687824762796025,
"learning_rate": 1.4560371055264052e-05,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3181726336479187,
"step": 2735,
"valid_targets_mean": 4012.6,
"valid_targets_min": 2398
},
{
"epoch": 4.412238325281804,
"grad_norm": 0.7648132029162774,
"learning_rate": 1.448313591032922e-05,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30312180519104004,
"step": 2740,
"valid_targets_mean": 3146.2,
"valid_targets_min": 1247
},
{
"epoch": 4.420289855072464,
"grad_norm": 0.6458192190255184,
"learning_rate": 1.4405989712897923e-05,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30585235357284546,
"step": 2745,
"valid_targets_mean": 4329.4,
"valid_targets_min": 1125
},
{
"epoch": 4.428341384863124,
"grad_norm": 0.6550907118099679,
"learning_rate": 1.4328933706785782e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2688300609588623,
"step": 2750,
"valid_targets_mean": 3632.9,
"valid_targets_min": 1076
},
{
"epoch": 4.436392914653784,
"grad_norm": 0.7080323021524921,
"learning_rate": 1.4251969134354247e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29432380199432373,
"step": 2755,
"valid_targets_mean": 3553.6,
"valid_targets_min": 1094
},
{
"epoch": 4.444444444444445,
"grad_norm": 0.7541689777697117,
"learning_rate": 1.4175097236490627e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3119310438632965,
"step": 2760,
"valid_targets_mean": 3095.5,
"valid_targets_min": 1793
},
{
"epoch": 4.452495974235105,
"grad_norm": 0.7223929430673088,
"learning_rate": 1.409831925258805e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2738376259803772,
"step": 2765,
"valid_targets_mean": 3082.8,
"valid_targets_min": 1495
},
{
"epoch": 4.460547504025765,
"grad_norm": 0.7341114060579149,
"learning_rate": 1.4021636420525466e-05,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2992332875728607,
"step": 2770,
"valid_targets_mean": 2982.9,
"valid_targets_min": 1490
},
{
"epoch": 4.468599033816425,
"grad_norm": 0.7930767785136432,
"learning_rate": 1.3945049976647726e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3382141590118408,
"step": 2775,
"valid_targets_mean": 3224.7,
"valid_targets_min": 1414
},
{
"epoch": 4.476650563607086,
"grad_norm": 0.7051589780334897,
"learning_rate": 1.3868561155745628e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.302938848733902,
"step": 2780,
"valid_targets_mean": 4591.2,
"valid_targets_min": 1895
},
{
"epoch": 4.484702093397746,
"grad_norm": 0.776963321434189,
"learning_rate": 1.3792171191036001e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32361382246017456,
"step": 2785,
"valid_targets_mean": 3124.8,
"valid_targets_min": 987
},
{
"epoch": 4.492753623188406,
"grad_norm": 0.8112701248746712,
"learning_rate": 1.3715881314141835e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2923651337623596,
"step": 2790,
"valid_targets_mean": 2744.4,
"valid_targets_min": 1399
},
{
"epoch": 4.500805152979066,
"grad_norm": 0.7331706558443012,
"learning_rate": 1.3639692755072429e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3007197380065918,
"step": 2795,
"valid_targets_mean": 3716.5,
"valid_targets_min": 1383
},
{
"epoch": 4.508856682769727,
"grad_norm": 0.647744700371841,
"learning_rate": 1.3563606742203548e-05,
"loss": 0.2993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2892110347747803,
"step": 2800,
"valid_targets_mean": 4289.1,
"valid_targets_min": 1433
},
{
"epoch": 4.516908212560386,
"grad_norm": 0.9421850377075999,
"learning_rate": 1.3487624502257598e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3276273310184479,
"step": 2805,
"valid_targets_mean": 2789.2,
"valid_targets_min": 1322
},
{
"epoch": 4.524959742351046,
"grad_norm": 0.7188700197789585,
"learning_rate": 1.3411747260283905e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2845657765865326,
"step": 2810,
"valid_targets_mean": 3436.0,
"valid_targets_min": 1213
},
{
"epoch": 4.533011272141707,
"grad_norm": 0.7781869831067078,
"learning_rate": 1.333597623963892e-05,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29683226346969604,
"step": 2815,
"valid_targets_mean": 2580.9,
"valid_targets_min": 1280
},
{
"epoch": 4.541062801932367,
"grad_norm": 0.7012527244821464,
"learning_rate": 1.3260312661966487e-05,
"loss": 0.3125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30411043763160706,
"step": 2820,
"valid_targets_mean": 4231.2,
"valid_targets_min": 1381
},
{
"epoch": 4.549114331723027,
"grad_norm": 0.6896904130191109,
"learning_rate": 1.3184757747178187e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29390496015548706,
"step": 2825,
"valid_targets_mean": 3503.9,
"valid_targets_min": 1033
},
{
"epoch": 4.557165861513687,
"grad_norm": 0.696983130694775,
"learning_rate": 1.3109312713433642e-05,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31736573576927185,
"step": 2830,
"valid_targets_mean": 3569.1,
"valid_targets_min": 1245
},
{
"epoch": 4.565217391304348,
"grad_norm": 0.7902589844756526,
"learning_rate": 1.3033978777120861e-05,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30584877729415894,
"step": 2835,
"valid_targets_mean": 2826.0,
"valid_targets_min": 1012
},
{
"epoch": 4.573268921095008,
"grad_norm": 0.7274888924433361,
"learning_rate": 1.2958757152836671e-05,
"loss": 0.2881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25177866220474243,
"step": 2840,
"valid_targets_mean": 3450.6,
"valid_targets_min": 1486
},
{
"epoch": 4.581320450885668,
"grad_norm": 0.725180749478288,
"learning_rate": 1.2883649053367106e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2852326035499573,
"step": 2845,
"valid_targets_mean": 3446.2,
"valid_targets_min": 1140
},
{
"epoch": 4.5893719806763285,
"grad_norm": 0.8999719879391306,
"learning_rate": 1.2808655689667846e-05,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.386888325214386,
"step": 2850,
"valid_targets_mean": 3519.2,
"valid_targets_min": 1327
},
{
"epoch": 4.597423510466989,
"grad_norm": 0.7442219129910428,
"learning_rate": 1.2733778270844712e-05,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3202979862689972,
"step": 2855,
"valid_targets_mean": 3581.2,
"valid_targets_min": 1277
},
{
"epoch": 4.605475040257649,
"grad_norm": 0.7961958367210087,
"learning_rate": 1.265901800413416e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.289141982793808,
"step": 2860,
"valid_targets_mean": 3373.2,
"valid_targets_min": 1205
},
{
"epoch": 4.613526570048309,
"grad_norm": 0.7594348180961747,
"learning_rate": 1.2584376094883832e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29926833510398865,
"step": 2865,
"valid_targets_mean": 3217.2,
"valid_targets_min": 1432
},
{
"epoch": 4.6215780998389695,
"grad_norm": 0.7903300067618602,
"learning_rate": 1.250985374653311e-05,
"loss": 0.2729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2627432942390442,
"step": 2870,
"valid_targets_mean": 2827.8,
"valid_targets_min": 368
},
{
"epoch": 4.62962962962963,
"grad_norm": 0.746273737284161,
"learning_rate": 1.2435452160593698e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2513338625431061,
"step": 2875,
"valid_targets_mean": 3353.4,
"valid_targets_min": 1064
},
{
"epoch": 4.63768115942029,
"grad_norm": 0.7106900237367672,
"learning_rate": 1.2361172536630288e-05,
"loss": 0.2823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2939052879810333,
"step": 2880,
"valid_targets_mean": 4223.3,
"valid_targets_min": 1746
},
{
"epoch": 4.64573268921095,
"grad_norm": 0.6667954441747274,
"learning_rate": 1.2287016072241195e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2683846652507782,
"step": 2885,
"valid_targets_mean": 3858.1,
"valid_targets_min": 1327
},
{
"epoch": 4.6537842190016105,
"grad_norm": 0.9490652913436398,
"learning_rate": 1.221298396303904e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2613232135772705,
"step": 2890,
"valid_targets_mean": 2620.6,
"valid_targets_min": 1039
},
{
"epoch": 4.661835748792271,
"grad_norm": 0.7333762476710057,
"learning_rate": 1.2139077402631495e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2822628617286682,
"step": 2895,
"valid_targets_mean": 3479.4,
"valid_targets_min": 1238
},
{
"epoch": 4.669887278582931,
"grad_norm": 0.6515841944617482,
"learning_rate": 1.2065297582602037e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25587737560272217,
"step": 2900,
"valid_targets_mean": 3427.9,
"valid_targets_min": 1281
},
{
"epoch": 4.677938808373591,
"grad_norm": 0.8050654547421896,
"learning_rate": 1.199164569249071e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.299319863319397,
"step": 2905,
"valid_targets_mean": 2845.1,
"valid_targets_min": 991
},
{
"epoch": 4.685990338164252,
"grad_norm": 0.6708735466300162,
"learning_rate": 1.191812291977497e-05,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2744864225387573,
"step": 2910,
"valid_targets_mean": 4298.4,
"valid_targets_min": 1411
},
{
"epoch": 4.694041867954912,
"grad_norm": 0.7514813752903359,
"learning_rate": 1.1844730449850546e-05,
"loss": 0.33,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3047374486923218,
"step": 2915,
"valid_targets_mean": 3738.6,
"valid_targets_min": 1555
},
{
"epoch": 4.702093397745571,
"grad_norm": 0.8585820063404703,
"learning_rate": 1.1771469466012309e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.263333261013031,
"step": 2920,
"valid_targets_mean": 2371.1,
"valid_targets_min": 1181
},
{
"epoch": 4.710144927536232,
"grad_norm": 0.9084047054321588,
"learning_rate": 1.1698341149435196e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29706811904907227,
"step": 2925,
"valid_targets_mean": 3284.2,
"valid_targets_min": 1517
},
{
"epoch": 4.718196457326892,
"grad_norm": 0.7335312030781107,
"learning_rate": 1.1625346679155179e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2993118166923523,
"step": 2930,
"valid_targets_mean": 3596.9,
"valid_targets_min": 1119
},
{
"epoch": 4.726247987117552,
"grad_norm": 0.7645383662240981,
"learning_rate": 1.1552487232050242e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27383461594581604,
"step": 2935,
"valid_targets_mean": 3022.3,
"valid_targets_min": 1298
},
{
"epoch": 4.734299516908212,
"grad_norm": 0.7045343410442323,
"learning_rate": 1.1479763982821414e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30053383111953735,
"step": 2940,
"valid_targets_mean": 3824.2,
"valid_targets_min": 1978
},
{
"epoch": 4.7423510466988725,
"grad_norm": 0.7631623179378855,
"learning_rate": 1.1407178103973834e-05,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2785217761993408,
"step": 2945,
"valid_targets_mean": 3441.6,
"valid_targets_min": 1594
},
{
"epoch": 4.750402576489533,
"grad_norm": 0.6749936353133249,
"learning_rate": 1.1334730765797843e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28506165742874146,
"step": 2950,
"valid_targets_mean": 3849.7,
"valid_targets_min": 1650
},
{
"epoch": 4.758454106280193,
"grad_norm": 0.737322666574153,
"learning_rate": 1.1262423136350087e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.161736398935318,
"step": 2955,
"valid_targets_mean": 5966.6,
"valid_targets_min": 3184
},
{
"epoch": 4.766505636070853,
"grad_norm": 0.5423893032678805,
"learning_rate": 1.1190256381434738e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1538485288619995,
"step": 2960,
"valid_targets_mean": 5159.4,
"valid_targets_min": 3589
},
{
"epoch": 4.774557165861514,
"grad_norm": 0.5128933204704713,
"learning_rate": 1.1118231664584674e-05,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17879360914230347,
"step": 2965,
"valid_targets_mean": 6292.2,
"valid_targets_min": 3131
},
{
"epoch": 4.782608695652174,
"grad_norm": 0.5098998582752253,
"learning_rate": 1.1046350147042681e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15875032544136047,
"step": 2970,
"valid_targets_mean": 5304.0,
"valid_targets_min": 3117
},
{
"epoch": 4.790660225442834,
"grad_norm": 0.5044753740910969,
"learning_rate": 1.0974612987742807e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18598923087120056,
"step": 2975,
"valid_targets_mean": 6316.2,
"valid_targets_min": 3455
},
{
"epoch": 4.798711755233494,
"grad_norm": 0.4536792935375198,
"learning_rate": 1.0903021343291613e-05,
"loss": 0.1572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1645420491695404,
"step": 2980,
"valid_targets_mean": 6636.1,
"valid_targets_min": 3364
},
{
"epoch": 4.806763285024155,
"grad_norm": 1.0919493102135451,
"learning_rate": 1.0831576367949555e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1736430525779724,
"step": 2985,
"valid_targets_mean": 5804.9,
"valid_targets_min": 2579
},
{
"epoch": 4.814814814814815,
"grad_norm": 0.44890465909191923,
"learning_rate": 1.0760279213612362e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23404830694198608,
"step": 2990,
"valid_targets_mean": 6861.9,
"valid_targets_min": 2907
},
{
"epoch": 4.822866344605475,
"grad_norm": 0.5343037492936906,
"learning_rate": 1.068913102979248e-05,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1848660707473755,
"step": 2995,
"valid_targets_mean": 6218.1,
"valid_targets_min": 2748
},
{
"epoch": 4.830917874396135,
"grad_norm": 0.4771916103447067,
"learning_rate": 1.0618132963600507e-05,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1645662933588028,
"step": 3000,
"valid_targets_mean": 5813.8,
"valid_targets_min": 3623
},
{
"epoch": 4.838969404186796,
"grad_norm": 0.5572712759897953,
"learning_rate": 1.0547286159726743e-05,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15293219685554504,
"step": 3005,
"valid_targets_mean": 5563.2,
"valid_targets_min": 2843
},
{
"epoch": 4.847020933977456,
"grad_norm": 0.5223306827253792,
"learning_rate": 1.047659176042268e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16464412212371826,
"step": 3010,
"valid_targets_mean": 6044.7,
"valid_targets_min": 3602
},
{
"epoch": 4.855072463768116,
"grad_norm": 0.47001363201449686,
"learning_rate": 1.0406050905482647e-05,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.183122456073761,
"step": 3015,
"valid_targets_mean": 6674.1,
"valid_targets_min": 3783
},
{
"epoch": 4.8631239935587764,
"grad_norm": 0.5165001888223757,
"learning_rate": 1.033566473222539e-05,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18210646510124207,
"step": 3020,
"valid_targets_mean": 5845.1,
"valid_targets_min": 2402
},
{
"epoch": 4.871175523349437,
"grad_norm": 0.5031892171999971,
"learning_rate": 1.0265434375475744e-05,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17503511905670166,
"step": 3025,
"valid_targets_mean": 5448.2,
"valid_targets_min": 3720
},
{
"epoch": 4.879227053140097,
"grad_norm": 0.49986928711541884,
"learning_rate": 1.0195360967546342e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18064576387405396,
"step": 3030,
"valid_targets_mean": 5979.9,
"valid_targets_min": 2553
},
{
"epoch": 4.887278582930757,
"grad_norm": 0.5125587155597235,
"learning_rate": 1.0125445638219369e-05,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16748838126659393,
"step": 3035,
"valid_targets_mean": 6232.3,
"valid_targets_min": 2860
},
{
"epoch": 4.8953301127214175,
"grad_norm": 0.4616045885291346,
"learning_rate": 1.00556895147283e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.162489652633667,
"step": 3040,
"valid_targets_mean": 5831.9,
"valid_targets_min": 3564
},
{
"epoch": 4.903381642512077,
"grad_norm": 0.46322600369785283,
"learning_rate": 9.986093721739793e-06,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18634885549545288,
"step": 3045,
"valid_targets_mean": 6287.4,
"valid_targets_min": 2925
},
{
"epoch": 4.911433172302738,
"grad_norm": 0.46732093070548425,
"learning_rate": 9.916659381335524e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14257997274398804,
"step": 3050,
"valid_targets_mean": 5975.3,
"valid_targets_min": 2785
},
{
"epoch": 4.919484702093397,
"grad_norm": 0.49090695641865617,
"learning_rate": 9.847387612994065e-06,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1775178611278534,
"step": 3055,
"valid_targets_mean": 5815.7,
"valid_targets_min": 2991
},
{
"epoch": 4.927536231884058,
"grad_norm": 0.4936584974779153,
"learning_rate": 9.778279533572894e-06,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16541126370429993,
"step": 3060,
"valid_targets_mean": 6023.0,
"valid_targets_min": 3528
},
{
"epoch": 4.935587761674718,
"grad_norm": 0.4843782424726677,
"learning_rate": 9.70933625729035e-06,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17926865816116333,
"step": 3065,
"valid_targets_mean": 6609.0,
"valid_targets_min": 3348
},
{
"epoch": 4.943639291465378,
"grad_norm": 0.6642579622564159,
"learning_rate": 9.640558895707681e-06,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1745370775461197,
"step": 3070,
"valid_targets_mean": 5392.2,
"valid_targets_min": 2988
},
{
"epoch": 4.951690821256038,
"grad_norm": 0.5815282039563188,
"learning_rate": 9.571948557711104e-06,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16913628578186035,
"step": 3075,
"valid_targets_mean": 5687.4,
"valid_targets_min": 3662
},
{
"epoch": 4.959742351046699,
"grad_norm": 0.4644634261413639,
"learning_rate": 9.503506349493959e-06,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1633993536233902,
"step": 3080,
"valid_targets_mean": 5669.5,
"valid_targets_min": 2991
},
{
"epoch": 4.967793880837359,
"grad_norm": 0.5022295538466749,
"learning_rate": 9.435233374538848e-06,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15409933030605316,
"step": 3085,
"valid_targets_mean": 5877.1,
"valid_targets_min": 3272
},
{
"epoch": 4.975845410628019,
"grad_norm": 0.5467333590771565,
"learning_rate": 9.367130733599863e-06,
"loss": 0.1573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1819993257522583,
"step": 3090,
"valid_targets_mean": 5579.3,
"valid_targets_min": 2743
},
{
"epoch": 4.9838969404186795,
"grad_norm": 0.47589633784217944,
"learning_rate": 9.299199524684815e-06,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16169019043445587,
"step": 3095,
"valid_targets_mean": 6154.2,
"valid_targets_min": 3288
},
{
"epoch": 4.99194847020934,
"grad_norm": 0.4987072791545887,
"learning_rate": 9.23144084303756e-06,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14372682571411133,
"step": 3100,
"valid_targets_mean": 5617.6,
"valid_targets_min": 2206
},
{
"epoch": 5.0,
"grad_norm": 0.5420052690244692,
"learning_rate": 9.163855781120302e-06,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1929244101047516,
"step": 3105,
"valid_targets_mean": 6658.9,
"valid_targets_min": 2494
},
{
"epoch": 5.00805152979066,
"grad_norm": 0.5838464125620735,
"learning_rate": 9.096445428596026e-06,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26280146837234497,
"step": 3110,
"valid_targets_mean": 6454.3,
"valid_targets_min": 2941
},
{
"epoch": 5.0161030595813205,
"grad_norm": 0.5544032083369451,
"learning_rate": 9.029210872310884e-06,
"loss": 0.2334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2069273293018341,
"step": 3115,
"valid_targets_mean": 6041.3,
"valid_targets_min": 3050
},
{
"epoch": 5.024154589371981,
"grad_norm": 0.5060239859737673,
"learning_rate": 8.962153196276713e-06,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2327526956796646,
"step": 3120,
"valid_targets_mean": 6337.3,
"valid_targets_min": 3318
},
{
"epoch": 5.032206119162641,
"grad_norm": 0.5024924584087652,
"learning_rate": 8.895273481653527e-06,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2556541860103607,
"step": 3125,
"valid_targets_mean": 6536.2,
"valid_targets_min": 3943
},
{
"epoch": 5.040257648953301,
"grad_norm": 0.5532271429624148,
"learning_rate": 8.828572806732103e-06,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23633992671966553,
"step": 3130,
"valid_targets_mean": 6144.0,
"valid_targets_min": 1873
},
{
"epoch": 5.048309178743962,
"grad_norm": 0.5020434087339521,
"learning_rate": 8.76205224691659e-06,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.220601886510849,
"step": 3135,
"valid_targets_mean": 5658.6,
"valid_targets_min": 3195
},
{
"epoch": 5.056360708534622,
"grad_norm": 0.5004024186733302,
"learning_rate": 8.695712874707169e-06,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2531841993331909,
"step": 3140,
"valid_targets_mean": 5992.8,
"valid_targets_min": 3207
},
{
"epoch": 5.064412238325282,
"grad_norm": 0.5475537882143925,
"learning_rate": 8.629555759682756e-06,
"loss": 0.2285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2494160532951355,
"step": 3145,
"valid_targets_mean": 5498.4,
"valid_targets_min": 2385
},
{
"epoch": 5.072463768115942,
"grad_norm": 0.5809278130638802,
"learning_rate": 8.563581968483774e-06,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22677326202392578,
"step": 3150,
"valid_targets_mean": 6101.3,
"valid_targets_min": 2571
},
{
"epoch": 5.080515297906603,
"grad_norm": 0.5328987070977548,
"learning_rate": 8.497792564794935e-06,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23735421895980835,
"step": 3155,
"valid_targets_mean": 5591.6,
"valid_targets_min": 436
},
{
"epoch": 5.088566827697263,
"grad_norm": 0.4993503923966659,
"learning_rate": 8.432188609328112e-06,
"loss": 0.2315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28377091884613037,
"step": 3160,
"valid_targets_mean": 7175.1,
"valid_targets_min": 3309
},
{
"epoch": 5.096618357487923,
"grad_norm": 0.5672470270119984,
"learning_rate": 8.366771159805222e-06,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22815349698066711,
"step": 3165,
"valid_targets_mean": 5700.9,
"valid_targets_min": 1417
},
{
"epoch": 5.1046698872785825,
"grad_norm": 0.5110748498614881,
"learning_rate": 8.301541270941178e-06,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25175783038139343,
"step": 3170,
"valid_targets_mean": 6462.1,
"valid_targets_min": 3176
},
{
"epoch": 5.112721417069243,
"grad_norm": 0.5146196376849012,
"learning_rate": 8.236499994426886e-06,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2239510416984558,
"step": 3175,
"valid_targets_mean": 6671.4,
"valid_targets_min": 2978
},
{
"epoch": 5.120772946859903,
"grad_norm": 0.5276651861060871,
"learning_rate": 8.171648378912272e-06,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24736565351486206,
"step": 3180,
"valid_targets_mean": 5441.8,
"valid_targets_min": 2285
},
{
"epoch": 5.128824476650563,
"grad_norm": 0.5713617059940914,
"learning_rate": 8.1069874699894e-06,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21684984862804413,
"step": 3185,
"valid_targets_mean": 5118.4,
"valid_targets_min": 2205
},
{
"epoch": 5.1368760064412236,
"grad_norm": 0.9446935557315936,
"learning_rate": 8.042518310175607e-06,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3164033889770508,
"step": 3190,
"valid_targets_mean": 2431.5,
"valid_targets_min": 1052
},
{
"epoch": 5.144927536231884,
"grad_norm": 0.8102422471310984,
"learning_rate": 7.978241938896679e-06,
"loss": 0.3619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3511773347854614,
"step": 3195,
"valid_targets_mean": 3045.8,
"valid_targets_min": 1348
},
{
"epoch": 5.152979066022544,
"grad_norm": 0.8229058252512985,
"learning_rate": 7.914159392470118e-06,
"loss": 0.3316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3436507284641266,
"step": 3200,
"valid_targets_mean": 3644.5,
"valid_targets_min": 1127
},
{
"epoch": 5.161030595813204,
"grad_norm": 0.7911041242061355,
"learning_rate": 7.850271704088396e-06,
"loss": 0.3503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3280431628227234,
"step": 3205,
"valid_targets_mean": 2985.6,
"valid_targets_min": 1353
},
{
"epoch": 5.169082125603865,
"grad_norm": 0.7417281880292826,
"learning_rate": 7.786579903802342e-06,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3037336766719818,
"step": 3210,
"valid_targets_mean": 4235.5,
"valid_targets_min": 1153
},
{
"epoch": 5.177133655394525,
"grad_norm": 0.8043169878590806,
"learning_rate": 7.723085018504512e-06,
"loss": 0.3114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31899648904800415,
"step": 3215,
"valid_targets_mean": 3142.8,
"valid_targets_min": 1555
},
{
"epoch": 5.185185185185185,
"grad_norm": 0.7681103865645257,
"learning_rate": 7.659788071912612e-06,
"loss": 0.3224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3006795644760132,
"step": 3220,
"valid_targets_mean": 3279.6,
"valid_targets_min": 1283
},
{
"epoch": 5.193236714975845,
"grad_norm": 0.9279631678919613,
"learning_rate": 7.59669008455304e-06,
"loss": 0.3323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3557708263397217,
"step": 3225,
"valid_targets_mean": 2693.6,
"valid_targets_min": 1497
},
{
"epoch": 5.201288244766506,
"grad_norm": 0.8325517861916301,
"learning_rate": 7.533792073744395e-06,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29200559854507446,
"step": 3230,
"valid_targets_mean": 2785.3,
"valid_targets_min": 1343
},
{
"epoch": 5.209339774557166,
"grad_norm": 0.9000004067843751,
"learning_rate": 7.471095053581086e-06,
"loss": 0.3322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33962708711624146,
"step": 3235,
"valid_targets_mean": 2680.9,
"valid_targets_min": 1319
},
{
"epoch": 5.217391304347826,
"grad_norm": 0.7351616652174657,
"learning_rate": 7.4086000349169864e-06,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27437877655029297,
"step": 3240,
"valid_targets_mean": 3356.8,
"valid_targets_min": 1216
},
{
"epoch": 5.225442834138486,
"grad_norm": 0.8649092507616926,
"learning_rate": 7.346308025349138e-06,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3227480947971344,
"step": 3245,
"valid_targets_mean": 2648.8,
"valid_targets_min": 1013
},
{
"epoch": 5.233494363929147,
"grad_norm": 0.7894068022798766,
"learning_rate": 7.2842200292014805e-06,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2977900505065918,
"step": 3250,
"valid_targets_mean": 3610.2,
"valid_targets_min": 1346
},
{
"epoch": 5.241545893719807,
"grad_norm": 0.8348958744102947,
"learning_rate": 7.2223370475086896e-06,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31349635124206543,
"step": 3255,
"valid_targets_mean": 2815.4,
"valid_targets_min": 1085
},
{
"epoch": 5.249597423510467,
"grad_norm": 0.783279282550219,
"learning_rate": 7.160660078000028e-06,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31384730339050293,
"step": 3260,
"valid_targets_mean": 3536.7,
"valid_targets_min": 1598
},
{
"epoch": 5.2576489533011275,
"grad_norm": 0.8474474930539333,
"learning_rate": 7.099190115083259e-06,
"loss": 0.3117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2967156171798706,
"step": 3265,
"valid_targets_mean": 2561.4,
"valid_targets_min": 1339
},
{
"epoch": 5.265700483091788,
"grad_norm": 0.808644026983678,
"learning_rate": 7.037928149828608e-06,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2750012278556824,
"step": 3270,
"valid_targets_mean": 2889.4,
"valid_targets_min": 1076
},
{
"epoch": 5.273752012882448,
"grad_norm": 0.9194627850557411,
"learning_rate": 6.97687516995279e-06,
"loss": 0.3234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3373414874076843,
"step": 3275,
"valid_targets_mean": 2557.4,
"valid_targets_min": 1094
},
{
"epoch": 5.281803542673108,
"grad_norm": 0.822826899306057,
"learning_rate": 6.916032159803088e-06,
"loss": 0.3148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3265712857246399,
"step": 3280,
"valid_targets_mean": 3530.8,
"valid_targets_min": 1290
},
{
"epoch": 5.2898550724637685,
"grad_norm": 1.0801701198259575,
"learning_rate": 6.855400100341458e-06,
"loss": 0.3135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31815803050994873,
"step": 3285,
"valid_targets_mean": 2579.7,
"valid_targets_min": 1229
},
{
"epoch": 5.297906602254429,
"grad_norm": 0.9189668274655115,
"learning_rate": 6.794979969128755e-06,
"loss": 0.3284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35337209701538086,
"step": 3290,
"valid_targets_mean": 3024.5,
"valid_targets_min": 1126
},
{
"epoch": 5.305958132045088,
"grad_norm": 0.7830019148830716,
"learning_rate": 6.7347727403089325e-06,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3025501072406769,
"step": 3295,
"valid_targets_mean": 3523.4,
"valid_targets_min": 1277
},
{
"epoch": 5.314009661835748,
"grad_norm": 0.7973020737314889,
"learning_rate": 6.674779384593373e-06,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3119211196899414,
"step": 3300,
"valid_targets_mean": 3317.8,
"valid_targets_min": 1389
},
{
"epoch": 5.322061191626409,
"grad_norm": 0.8741442602989578,
"learning_rate": 6.61500086924519e-06,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32590872049331665,
"step": 3305,
"valid_targets_mean": 2728.8,
"valid_targets_min": 1062
},
{
"epoch": 5.330112721417069,
"grad_norm": 0.7121746609134123,
"learning_rate": 6.555438158063683e-06,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29646340012550354,
"step": 3310,
"valid_targets_mean": 3474.4,
"valid_targets_min": 1520
},
{
"epoch": 5.338164251207729,
"grad_norm": 0.8449323115888453,
"learning_rate": 6.4960922113687695e-06,
"loss": 0.3273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3494471311569214,
"step": 3315,
"valid_targets_mean": 2857.8,
"valid_targets_min": 1154
},
{
"epoch": 5.3462157809983895,
"grad_norm": 0.885312187387555,
"learning_rate": 6.4369639859855115e-06,
"loss": 0.3228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2813508212566376,
"step": 3320,
"valid_targets_mean": 2419.3,
"valid_targets_min": 1115
},
{
"epoch": 5.35426731078905,
"grad_norm": 0.9927190814901663,
"learning_rate": 6.378054435228671e-06,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34994691610336304,
"step": 3325,
"valid_targets_mean": 2817.8,
"valid_targets_min": 1383
},
{
"epoch": 5.36231884057971,
"grad_norm": 0.8385621560859085,
"learning_rate": 6.319364508887371e-06,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3212810456752777,
"step": 3330,
"valid_targets_mean": 2906.6,
"valid_targets_min": 1414
},
{
"epoch": 5.37037037037037,
"grad_norm": 0.9132443618507105,
"learning_rate": 6.260895153209763e-06,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3039951026439667,
"step": 3335,
"valid_targets_mean": 2699.4,
"valid_targets_min": 1140
},
{
"epoch": 5.3784219001610305,
"grad_norm": 0.7695295851549366,
"learning_rate": 6.202647310887764e-06,
"loss": 0.2929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2774300277233124,
"step": 3340,
"valid_targets_mean": 3474.1,
"valid_targets_min": 1060
},
{
"epoch": 5.386473429951691,
"grad_norm": 0.6668937071959811,
"learning_rate": 6.14462192104188e-06,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27856311202049255,
"step": 3345,
"valid_targets_mean": 4942.6,
"valid_targets_min": 1358
},
{
"epoch": 5.394524959742351,
"grad_norm": 0.8455706950790055,
"learning_rate": 6.086819919206051e-06,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30070313811302185,
"step": 3350,
"valid_targets_mean": 3203.9,
"valid_targets_min": 1109
},
{
"epoch": 5.402576489533011,
"grad_norm": 0.836900372814081,
"learning_rate": 6.029242237312554e-06,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2704571485519409,
"step": 3355,
"valid_targets_mean": 2741.4,
"valid_targets_min": 990
},
{
"epoch": 5.4106280193236715,
"grad_norm": 1.0931862207345193,
"learning_rate": 5.971889803676996e-06,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2953025698661804,
"step": 3360,
"valid_targets_mean": 2505.7,
"valid_targets_min": 1217
},
{
"epoch": 5.418679549114332,
"grad_norm": 0.7654117324257275,
"learning_rate": 5.914763542983355e-06,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26454564929008484,
"step": 3365,
"valid_targets_mean": 2908.2,
"valid_targets_min": 977
},
{
"epoch": 5.426731078904992,
"grad_norm": 0.7330273533335651,
"learning_rate": 5.857864376269051e-06,
"loss": 0.269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26756301522254944,
"step": 3370,
"valid_targets_mean": 3492.0,
"valid_targets_min": 1549
},
{
"epoch": 5.434782608695652,
"grad_norm": 0.8733408409541297,
"learning_rate": 5.801193220910108e-06,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26825398206710815,
"step": 3375,
"valid_targets_mean": 2432.0,
"valid_targets_min": 838
},
{
"epoch": 5.442834138486313,
"grad_norm": 0.7169076864712473,
"learning_rate": 5.744750990606356e-06,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24838054180145264,
"step": 3380,
"valid_targets_mean": 3069.9,
"valid_targets_min": 269
},
{
"epoch": 5.450885668276973,
"grad_norm": 0.7502178650889314,
"learning_rate": 5.688538595366706e-06,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31911134719848633,
"step": 3385,
"valid_targets_mean": 3644.1,
"valid_targets_min": 1308
},
{
"epoch": 5.458937198067633,
"grad_norm": 1.414216146795669,
"learning_rate": 5.632556941494482e-06,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25184541940689087,
"step": 3390,
"valid_targets_mean": 3538.7,
"valid_targets_min": 865
},
{
"epoch": 5.466988727858293,
"grad_norm": 0.8372271865966336,
"learning_rate": 5.5768069315727895e-06,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27714282274246216,
"step": 3395,
"valid_targets_mean": 2789.2,
"valid_targets_min": 1084
},
{
"epoch": 5.475040257648954,
"grad_norm": 0.8184499988808632,
"learning_rate": 5.521289464449975e-06,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2645953595638275,
"step": 3400,
"valid_targets_mean": 2663.7,
"valid_targets_min": 1007
},
{
"epoch": 5.483091787439614,
"grad_norm": 0.7185289726192565,
"learning_rate": 5.46600543522515e-06,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30967646837234497,
"step": 3405,
"valid_targets_mean": 3865.0,
"valid_targets_min": 556
},
{
"epoch": 5.491143317230274,
"grad_norm": 0.705180498725472,
"learning_rate": 5.410955735233736e-06,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2706761658191681,
"step": 3410,
"valid_targets_mean": 4117.5,
"valid_targets_min": 1094
},
{
"epoch": 5.499194847020934,
"grad_norm": 0.6957397872406959,
"learning_rate": 5.3561412520331025e-06,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23413681983947754,
"step": 3415,
"valid_targets_mean": 3565.3,
"valid_targets_min": 333
},
{
"epoch": 5.507246376811594,
"grad_norm": 0.7323699706744174,
"learning_rate": 5.30156286938826e-06,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27193206548690796,
"step": 3420,
"valid_targets_mean": 3507.9,
"valid_targets_min": 1135
},
{
"epoch": 5.515297906602254,
"grad_norm": 0.7948157490925247,
"learning_rate": 5.24722146725761e-06,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30066072940826416,
"step": 3425,
"valid_targets_mean": 3822.9,
"valid_targets_min": 428
},
{
"epoch": 5.523349436392914,
"grad_norm": 0.7330705322398546,
"learning_rate": 5.193117921778743e-06,
"loss": 0.2784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2574806809425354,
"step": 3430,
"valid_targets_mean": 2932.9,
"valid_targets_min": 1398
},
{
"epoch": 5.531400966183575,
"grad_norm": 0.737623162777766,
"learning_rate": 5.139253105254336e-06,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2380131632089615,
"step": 3435,
"valid_targets_mean": 3473.2,
"valid_targets_min": 1265
},
{
"epoch": 5.539452495974235,
"grad_norm": 0.872809824307193,
"learning_rate": 5.085627886138078e-06,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3099297881126404,
"step": 3440,
"valid_targets_mean": 2707.5,
"valid_targets_min": 1453
},
{
"epoch": 5.547504025764895,
"grad_norm": 0.698343107099745,
"learning_rate": 5.032243129020671e-06,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.263833224773407,
"step": 3445,
"valid_targets_mean": 3770.1,
"valid_targets_min": 1554
},
{
"epoch": 5.555555555555555,
"grad_norm": 0.7253845641200191,
"learning_rate": 4.9790996946158695e-06,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2566887438297272,
"step": 3450,
"valid_targets_mean": 3687.9,
"valid_targets_min": 1423
},
{
"epoch": 5.563607085346216,
"grad_norm": 0.7712918784806847,
"learning_rate": 4.926198439746641e-06,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26648885011672974,
"step": 3455,
"valid_targets_mean": 3580.0,
"valid_targets_min": 1778
},
{
"epoch": 5.571658615136876,
"grad_norm": 0.856414024782782,
"learning_rate": 4.873540217331325e-06,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2561458945274353,
"step": 3460,
"valid_targets_mean": 3154.2,
"valid_targets_min": 1070
},
{
"epoch": 5.579710144927536,
"grad_norm": 0.7683716866413719,
"learning_rate": 4.82112587636989e-06,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2730039358139038,
"step": 3465,
"valid_targets_mean": 3442.1,
"valid_targets_min": 1222
},
{
"epoch": 5.587761674718196,
"grad_norm": 0.8230430968296925,
"learning_rate": 4.768956261930233e-06,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27767133712768555,
"step": 3470,
"valid_targets_mean": 2991.2,
"valid_targets_min": 1344
},
{
"epoch": 5.595813204508857,
"grad_norm": 0.8004415970586688,
"learning_rate": 4.717032215134576e-06,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605861723423004,
"step": 3475,
"valid_targets_mean": 3584.1,
"valid_targets_min": 1080
},
{
"epoch": 5.603864734299517,
"grad_norm": 0.7353749562835018,
"learning_rate": 4.66535457314589e-06,
"loss": 0.2576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24795982241630554,
"step": 3480,
"valid_targets_mean": 3283.6,
"valid_targets_min": 1136
},
{
"epoch": 5.611916264090177,
"grad_norm": 0.7934788767299171,
"learning_rate": 4.613924169154406e-06,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2561984658241272,
"step": 3485,
"valid_targets_mean": 3267.1,
"valid_targets_min": 1469
},
{
"epoch": 5.6199677938808374,
"grad_norm": 0.6451673243838487,
"learning_rate": 4.5627418323641705e-06,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23117291927337646,
"step": 3490,
"valid_targets_mean": 4220.8,
"valid_targets_min": 1141
},
{
"epoch": 5.628019323671498,
"grad_norm": 0.7547471899894796,
"learning_rate": 4.51180838797969e-06,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2534325420856476,
"step": 3495,
"valid_targets_mean": 3403.3,
"valid_targets_min": 1315
},
{
"epoch": 5.636070853462158,
"grad_norm": 0.773278558835617,
"learning_rate": 4.461124657192612e-06,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26870912313461304,
"step": 3500,
"valid_targets_mean": 3994.0,
"valid_targets_min": 1243
},
{
"epoch": 5.644122383252818,
"grad_norm": 0.810555778973838,
"learning_rate": 4.410691457168488e-06,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28086018562316895,
"step": 3505,
"valid_targets_mean": 2728.6,
"valid_targets_min": 1205
},
{
"epoch": 5.6521739130434785,
"grad_norm": 0.8120077352409444,
"learning_rate": 4.3605096010336115e-06,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24294914305210114,
"step": 3510,
"valid_targets_mean": 2805.7,
"valid_targets_min": 1316
},
{
"epoch": 5.660225442834139,
"grad_norm": 0.8130325924281421,
"learning_rate": 4.310579897861902e-06,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28100401163101196,
"step": 3515,
"valid_targets_mean": 3165.5,
"valid_targets_min": 1339
},
{
"epoch": 5.668276972624799,
"grad_norm": 0.8162870406632708,
"learning_rate": 4.26090315266185e-06,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26572561264038086,
"step": 3520,
"valid_targets_mean": 2954.1,
"valid_targets_min": 1158
},
{
"epoch": 5.676328502415459,
"grad_norm": 0.6514530451354953,
"learning_rate": 4.2114801663635504e-06,
"loss": 0.2687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2698674201965332,
"step": 3525,
"valid_targets_mean": 4536.0,
"valid_targets_min": 1647
},
{
"epoch": 5.6843800322061195,
"grad_norm": 0.7583758417148468,
"learning_rate": 4.1623117358057865e-06,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24608030915260315,
"step": 3530,
"valid_targets_mean": 3440.9,
"valid_targets_min": 1237
},
{
"epoch": 5.692431561996779,
"grad_norm": 0.8068612199962942,
"learning_rate": 4.113398653723168e-06,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30153918266296387,
"step": 3535,
"valid_targets_mean": 3381.9,
"valid_targets_min": 1538
},
{
"epoch": 5.70048309178744,
"grad_norm": 0.6753881803646461,
"learning_rate": 4.0647417087333776e-06,
"loss": 0.2767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2815188765525818,
"step": 3540,
"valid_targets_mean": 4124.1,
"valid_targets_min": 1524
},
{
"epoch": 5.708534621578099,
"grad_norm": 0.7538186575725058,
"learning_rate": 4.0163416853244385e-06,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3041001558303833,
"step": 3545,
"valid_targets_mean": 3666.5,
"valid_targets_min": 1144
},
{
"epoch": 5.71658615136876,
"grad_norm": 0.7597861294821214,
"learning_rate": 3.968199363842056e-06,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28277167677879333,
"step": 3550,
"valid_targets_mean": 3813.6,
"valid_targets_min": 1150
},
{
"epoch": 5.72463768115942,
"grad_norm": 0.8692552896889315,
"learning_rate": 3.920315520477065e-06,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.290031373500824,
"step": 3555,
"valid_targets_mean": 3184.7,
"valid_targets_min": 1064
},
{
"epoch": 5.73268921095008,
"grad_norm": 0.725354422712945,
"learning_rate": 3.872690927252891e-06,
"loss": 0.2739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2602255642414093,
"step": 3560,
"valid_targets_mean": 3734.6,
"valid_targets_min": 1689
},
{
"epoch": 5.7407407407407405,
"grad_norm": 0.7906077868844616,
"learning_rate": 3.825326352013119e-06,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2873994708061218,
"step": 3565,
"valid_targets_mean": 3706.6,
"valid_targets_min": 1537
},
{
"epoch": 5.748792270531401,
"grad_norm": 0.7271200769973074,
"learning_rate": 3.7782225584091016e-06,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29486900568008423,
"step": 3570,
"valid_targets_mean": 3998.4,
"valid_targets_min": 1261
},
{
"epoch": 5.756843800322061,
"grad_norm": 0.6627264051632484,
"learning_rate": 3.731380305887644e-06,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17932528257369995,
"step": 3575,
"valid_targets_mean": 6379.5,
"valid_targets_min": 3100
},
{
"epoch": 5.764895330112721,
"grad_norm": 0.5856709563027361,
"learning_rate": 3.684800349678781e-06,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15101756155490875,
"step": 3580,
"valid_targets_mean": 5043.8,
"valid_targets_min": 2708
},
{
"epoch": 5.7729468599033815,
"grad_norm": 0.5383802419402726,
"learning_rate": 3.638483440783576e-06,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1619020700454712,
"step": 3585,
"valid_targets_mean": 5717.3,
"valid_targets_min": 3191
},
{
"epoch": 5.780998389694042,
"grad_norm": 0.5400164906310356,
"learning_rate": 3.5924303259620307e-06,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22362828254699707,
"step": 3590,
"valid_targets_mean": 6198.8,
"valid_targets_min": 2599
},
{
"epoch": 5.789049919484702,
"grad_norm": 0.49147798358688005,
"learning_rate": 3.546641747721036e-06,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16704602539539337,
"step": 3595,
"valid_targets_mean": 5880.9,
"valid_targets_min": 3427
},
{
"epoch": 5.797101449275362,
"grad_norm": 0.5344086768922587,
"learning_rate": 3.501118444302394e-06,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16091877222061157,
"step": 3600,
"valid_targets_mean": 5429.1,
"valid_targets_min": 3331
},
{
"epoch": 5.805152979066023,
"grad_norm": 0.5393969729072521,
"learning_rate": 3.4558611496709384e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1679922491312027,
"step": 3605,
"valid_targets_mean": 5318.9,
"valid_targets_min": 3176
},
{
"epoch": 5.813204508856683,
"grad_norm": 0.5476815168907639,
"learning_rate": 3.4108705935026685e-06,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21377882361412048,
"step": 3610,
"valid_targets_mean": 6334.5,
"valid_targets_min": 3200
},
{
"epoch": 5.821256038647343,
"grad_norm": 0.5454273677417246,
"learning_rate": 3.3661475011730206e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15195472538471222,
"step": 3615,
"valid_targets_mean": 5575.2,
"valid_targets_min": 2982
},
{
"epoch": 5.829307568438003,
"grad_norm": 0.487579490900084,
"learning_rate": 3.321692593745147e-06,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14653947949409485,
"step": 3620,
"valid_targets_mean": 5045.2,
"valid_targets_min": 2662
},
{
"epoch": 5.837359098228664,
"grad_norm": 0.46110914845574164,
"learning_rate": 3.2775065879582948e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14655046164989471,
"step": 3625,
"valid_targets_mean": 5929.9,
"valid_targets_min": 3640
},
{
"epoch": 5.845410628019324,
"grad_norm": 0.5371793623726028,
"learning_rate": 3.233590196216263e-06,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15916280448436737,
"step": 3630,
"valid_targets_mean": 5560.6,
"valid_targets_min": 3146
},
{
"epoch": 5.853462157809984,
"grad_norm": 0.5336623676265232,
"learning_rate": 3.1899441265759036e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17341580986976624,
"step": 3635,
"valid_targets_mean": 5438.9,
"valid_targets_min": 3095
},
{
"epoch": 5.861513687600644,
"grad_norm": 0.506978820179007,
"learning_rate": 3.1465690827356955e-06,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16827458143234253,
"step": 3640,
"valid_targets_mean": 6153.6,
"valid_targets_min": 3325
},
{
"epoch": 5.869565217391305,
"grad_norm": 0.48238153810687057,
"learning_rate": 3.103465764024438e-06,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1539824903011322,
"step": 3645,
"valid_targets_mean": 6176.7,
"valid_targets_min": 3690
},
{
"epoch": 5.877616747181965,
"grad_norm": 0.6316647612921683,
"learning_rate": 3.0606348653899288e-06,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14262428879737854,
"step": 3650,
"valid_targets_mean": 5253.8,
"valid_targets_min": 2926
},
{
"epoch": 5.885668276972625,
"grad_norm": 0.5087670946379775,
"learning_rate": 3.0180770773877866e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1334628015756607,
"step": 3655,
"valid_targets_mean": 6097.0,
"valid_targets_min": 3707
},
{
"epoch": 5.8937198067632846,
"grad_norm": 0.5000631591042055,
"learning_rate": 2.9757930861703223e-06,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16042768955230713,
"step": 3660,
"valid_targets_mean": 5931.1,
"valid_targets_min": 3697
},
{
"epoch": 5.901771336553946,
"grad_norm": 0.5448493291259932,
"learning_rate": 2.9337835734754504e-06,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15106025338172913,
"step": 3665,
"valid_targets_mean": 6370.6,
"valid_targets_min": 3665
},
{
"epoch": 5.909822866344605,
"grad_norm": 0.4904247806452323,
"learning_rate": 2.892049216615724e-06,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17938336730003357,
"step": 3670,
"valid_targets_mean": 6119.8,
"valid_targets_min": 2561
},
{
"epoch": 5.917874396135265,
"grad_norm": 0.5176054978636475,
"learning_rate": 2.850590688467405e-06,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1513424813747406,
"step": 3675,
"valid_targets_mean": 5352.8,
"valid_targets_min": 3838
},
{
"epoch": 5.925925925925926,
"grad_norm": 0.5014302674357601,
"learning_rate": 2.8094086574595934e-06,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16385960578918457,
"step": 3680,
"valid_targets_mean": 6064.1,
"valid_targets_min": 2800
},
{
"epoch": 5.933977455716586,
"grad_norm": 0.4897422253909219,
"learning_rate": 2.768503787563497e-06,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14840051531791687,
"step": 3685,
"valid_targets_mean": 6725.1,
"valid_targets_min": 4014
},
{
"epoch": 5.942028985507246,
"grad_norm": 0.527797846005594,
"learning_rate": 2.7278767382816828e-06,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15732444822788239,
"step": 3690,
"valid_targets_mean": 5340.4,
"valid_targets_min": 3261
},
{
"epoch": 5.950080515297906,
"grad_norm": 0.4537750452077363,
"learning_rate": 2.687528164637474e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15537717938423157,
"step": 3695,
"valid_targets_mean": 6194.7,
"valid_targets_min": 3579
},
{
"epoch": 5.958132045088567,
"grad_norm": 0.481130982772452,
"learning_rate": 2.647458717164357e-06,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1415160596370697,
"step": 3700,
"valid_targets_mean": 6527.8,
"valid_targets_min": 2379
},
{
"epoch": 5.966183574879227,
"grad_norm": 0.4971167453343456,
"learning_rate": 2.607669041895535e-06,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16012218594551086,
"step": 3705,
"valid_targets_mean": 6887.7,
"valid_targets_min": 3569
},
{
"epoch": 5.974235104669887,
"grad_norm": 0.47404245776286746,
"learning_rate": 2.568159780353476e-06,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.134698748588562,
"step": 3710,
"valid_targets_mean": 5398.8,
"valid_targets_min": 2580
},
{
"epoch": 5.982286634460547,
"grad_norm": 0.5394680793747297,
"learning_rate": 2.5289315695395834e-06,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1926458775997162,
"step": 3715,
"valid_targets_mean": 6136.1,
"valid_targets_min": 2610
},
{
"epoch": 5.990338164251208,
"grad_norm": 0.5073583213947698,
"learning_rate": 2.489985041923928e-06,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1339704990386963,
"step": 3720,
"valid_targets_mean": 5957.4,
"valid_targets_min": 2562
},
{
"epoch": 5.998389694041868,
"grad_norm": 0.5506968197613669,
"learning_rate": 2.4513208254350486e-06,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1555670201778412,
"step": 3725,
"valid_targets_mean": 5860.3,
"valid_targets_min": 2833
},
{
"epoch": 6.006441223832528,
"grad_norm": 0.6724494776596883,
"learning_rate": 2.412939543449828e-06,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2651374936103821,
"step": 3730,
"valid_targets_mean": 5898.7,
"valid_targets_min": 2769
},
{
"epoch": 6.0144927536231885,
"grad_norm": 0.5836006033084224,
"learning_rate": 2.3748418147834394e-06,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2323194146156311,
"step": 3735,
"valid_targets_mean": 6068.6,
"valid_targets_min": 2285
},
{
"epoch": 6.022544283413849,
"grad_norm": 0.5642017551180925,
"learning_rate": 2.337028253679381e-06,
"loss": 0.2429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26346156001091003,
"step": 3740,
"valid_targets_mean": 6519.8,
"valid_targets_min": 3314
},
{
"epoch": 6.030595813204509,
"grad_norm": 0.7066259408147071,
"learning_rate": 2.299499469799542e-06,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2269531935453415,
"step": 3745,
"valid_targets_mean": 6028.6,
"valid_targets_min": 2671
},
{
"epoch": 6.038647342995169,
"grad_norm": 0.5632095775983418,
"learning_rate": 2.262256068214421e-06,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2706316113471985,
"step": 3750,
"valid_targets_mean": 6266.9,
"valid_targets_min": 469
},
{
"epoch": 6.0466988727858295,
"grad_norm": 0.5348831735859538,
"learning_rate": 2.2252986493933237e-06,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21734777092933655,
"step": 3755,
"valid_targets_mean": 5759.1,
"valid_targets_min": 2568
},
{
"epoch": 6.05475040257649,
"grad_norm": 0.5569500892452331,
"learning_rate": 2.18862780919471e-06,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21391534805297852,
"step": 3760,
"valid_targets_mean": 5530.2,
"valid_targets_min": 611
},
{
"epoch": 6.06280193236715,
"grad_norm": 0.5382181428705697,
"learning_rate": 2.152244138856585e-06,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20388023555278778,
"step": 3765,
"valid_targets_mean": 5696.9,
"valid_targets_min": 2392
},
{
"epoch": 6.07085346215781,
"grad_norm": 0.6463190792326495,
"learning_rate": 2.1161482249869513e-06,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21541935205459595,
"step": 3770,
"valid_targets_mean": 5683.9,
"valid_targets_min": 1285
},
{
"epoch": 6.078904991948471,
"grad_norm": 0.4769019487796991,
"learning_rate": 2.080340649554369e-06,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1947912871837616,
"step": 3775,
"valid_targets_mean": 6331.4,
"valid_targets_min": 3356
},
{
"epoch": 6.086956521739131,
"grad_norm": 0.5260688671936042,
"learning_rate": 2.044821989878558e-06,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1972348690032959,
"step": 3780,
"valid_targets_mean": 5326.1,
"valid_targets_min": 1676
},
{
"epoch": 6.095008051529791,
"grad_norm": 0.5385684220997624,
"learning_rate": 2.0095928186210956e-06,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24432078003883362,
"step": 3785,
"valid_targets_mean": 6448.9,
"valid_targets_min": 2859
},
{
"epoch": 6.1030595813204505,
"grad_norm": 0.5134775076305466,
"learning_rate": 1.974653703776188e-06,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21769499778747559,
"step": 3790,
"valid_targets_mean": 5910.2,
"valid_targets_min": 1417
},
{
"epoch": 6.111111111111111,
"grad_norm": 0.500956162314828,
"learning_rate": 1.9400052086615153e-06,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26993608474731445,
"step": 3795,
"valid_targets_mean": 7141.1,
"valid_targets_min": 3571
},
{
"epoch": 6.119162640901771,
"grad_norm": 0.5451480445857494,
"learning_rate": 1.9056478919091236e-06,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23594680428504944,
"step": 3800,
"valid_targets_mean": 6492.9,
"valid_targets_min": 3446
},
{
"epoch": 6.127214170692431,
"grad_norm": 0.4970674059635784,
"learning_rate": 1.8715823074564587e-06,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18086868524551392,
"step": 3805,
"valid_targets_mean": 5447.6,
"valid_targets_min": 306
},
{
"epoch": 6.1352657004830915,
"grad_norm": 0.8407143099623481,
"learning_rate": 1.837809004537401e-06,
"loss": 0.278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31480419635772705,
"step": 3810,
"valid_targets_mean": 3657.8,
"valid_targets_min": 1050
},
{
"epoch": 6.143317230273752,
"grad_norm": 0.9619594700485488,
"learning_rate": 1.8043285276734334e-06,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3486429452896118,
"step": 3815,
"valid_targets_mean": 2673.1,
"valid_targets_min": 1309
},
{
"epoch": 6.151368760064412,
"grad_norm": 0.8500263557004369,
"learning_rate": 1.7711414166648365e-06,
"loss": 0.3224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3212417662143707,
"step": 3820,
"valid_targets_mean": 3209.7,
"valid_targets_min": 1155
},
{
"epoch": 6.159420289855072,
"grad_norm": 0.9189308209039743,
"learning_rate": 1.7382482065820138e-06,
"loss": 0.3419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35360682010650635,
"step": 3825,
"valid_targets_mean": 3054.8,
"valid_targets_min": 1099
},
{
"epoch": 6.1674718196457325,
"grad_norm": 0.843417341220929,
"learning_rate": 1.7056494277568503e-06,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28352683782577515,
"step": 3830,
"valid_targets_mean": 2978.8,
"valid_targets_min": 1175
},
{
"epoch": 6.175523349436393,
"grad_norm": 0.8163445646433484,
"learning_rate": 1.6733456057741592e-06,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2696455121040344,
"step": 3835,
"valid_targets_mean": 2849.6,
"valid_targets_min": 1295
},
{
"epoch": 6.183574879227053,
"grad_norm": 0.9881052112221266,
"learning_rate": 1.641337261463216e-06,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.332567423582077,
"step": 3840,
"valid_targets_mean": 2615.8,
"valid_targets_min": 1383
},
{
"epoch": 6.191626409017713,
"grad_norm": 0.8302563038314946,
"learning_rate": 1.6096249108893602e-06,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33189308643341064,
"step": 3845,
"valid_targets_mean": 3296.4,
"valid_targets_min": 1316
},
{
"epoch": 6.199677938808374,
"grad_norm": 0.8685755282410109,
"learning_rate": 1.5782090653456616e-06,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31094080209732056,
"step": 3850,
"valid_targets_mean": 3968.6,
"valid_targets_min": 1383
},
{
"epoch": 6.207729468599034,
"grad_norm": 0.9006410427832183,
"learning_rate": 1.547090231344699e-06,
"loss": 0.3111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37766462564468384,
"step": 3855,
"valid_targets_mean": 3078.5,
"valid_targets_min": 1174
},
{
"epoch": 6.215780998389694,
"grad_norm": 0.8145924540125793,
"learning_rate": 1.5162689106103746e-06,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.283829003572464,
"step": 3860,
"valid_targets_mean": 3417.5,
"valid_targets_min": 1252
},
{
"epoch": 6.223832528180354,
"grad_norm": 0.8259786070193814,
"learning_rate": 1.4857456000698366e-06,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3424111008644104,
"step": 3865,
"valid_targets_mean": 3427.6,
"valid_targets_min": 1218
},
{
"epoch": 6.231884057971015,
"grad_norm": 0.9647531902604716,
"learning_rate": 1.4555207918454662e-06,
"loss": 0.3322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37204068899154663,
"step": 3870,
"valid_targets_mean": 2875.2,
"valid_targets_min": 1123
},
{
"epoch": 6.239935587761675,
"grad_norm": 0.878124106513052,
"learning_rate": 1.4255949732469309e-06,
"loss": 0.3147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.326835960149765,
"step": 3875,
"valid_targets_mean": 2933.1,
"valid_targets_min": 1485
},
{
"epoch": 6.247987117552335,
"grad_norm": 0.9256224608559495,
"learning_rate": 1.3959686267633488e-06,
"loss": 0.3116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32315731048583984,
"step": 3880,
"valid_targets_mean": 2699.5,
"valid_targets_min": 1170
},
{
"epoch": 6.256038647342995,
"grad_norm": 0.7806676732625024,
"learning_rate": 1.3666422300554905e-06,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2884427607059479,
"step": 3885,
"valid_targets_mean": 3932.2,
"valid_targets_min": 1108
},
{
"epoch": 6.264090177133656,
"grad_norm": 0.8683190375235182,
"learning_rate": 1.3376162559480822e-06,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3049579858779907,
"step": 3890,
"valid_targets_mean": 2747.4,
"valid_targets_min": 1205
},
{
"epoch": 6.272141706924316,
"grad_norm": 0.8710255989708383,
"learning_rate": 1.308891172422193e-06,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33199816942214966,
"step": 3895,
"valid_targets_mean": 3029.8,
"valid_targets_min": 1355
},
{
"epoch": 6.280193236714976,
"grad_norm": 0.8477552990968392,
"learning_rate": 1.2804674426076757e-06,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.325872540473938,
"step": 3900,
"valid_targets_mean": 3227.2,
"valid_targets_min": 1427
},
{
"epoch": 6.2882447665056365,
"grad_norm": 0.7965348453218628,
"learning_rate": 1.2523455247757088e-06,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30131930112838745,
"step": 3905,
"valid_targets_mean": 3224.4,
"valid_targets_min": 1045
},
{
"epoch": 6.296296296296296,
"grad_norm": 0.7395568722630161,
"learning_rate": 1.224525872331408e-06,
"loss": 0.3113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3066796660423279,
"step": 3910,
"valid_targets_mean": 4021.2,
"valid_targets_min": 1118
},
{
"epoch": 6.304347826086957,
"grad_norm": 0.8162687764572345,
"learning_rate": 1.1970089338065071e-06,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2592276334762573,
"step": 3915,
"valid_targets_mean": 3145.9,
"valid_targets_min": 977
},
{
"epoch": 6.312399355877616,
"grad_norm": 0.8944188897503945,
"learning_rate": 1.1697951528521422e-06,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3102479875087738,
"step": 3920,
"valid_targets_mean": 2583.8,
"valid_targets_min": 1167
},
{
"epoch": 6.320450885668277,
"grad_norm": 0.8873873245958489,
"learning_rate": 1.1428849682316766e-06,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2901550829410553,
"step": 3925,
"valid_targets_mean": 3109.6,
"valid_targets_min": 1268
},
{
"epoch": 6.328502415458937,
"grad_norm": 0.8886136259904959,
"learning_rate": 1.116278813813647e-06,
"loss": 0.3118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2849825918674469,
"step": 3930,
"valid_targets_mean": 2516.6,
"valid_targets_min": 1159
},
{
"epoch": 6.336553945249597,
"grad_norm": 0.8340658998428512,
"learning_rate": 1.08997711856476e-06,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31567925214767456,
"step": 3935,
"valid_targets_mean": 4016.8,
"valid_targets_min": 1642
},
{
"epoch": 6.344605475040257,
"grad_norm": 0.8397362085202228,
"learning_rate": 1.0639803065429755e-06,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3202289938926697,
"step": 3940,
"valid_targets_mean": 3258.7,
"valid_targets_min": 1158
},
{
"epoch": 6.352657004830918,
"grad_norm": 0.8392706087036921,
"learning_rate": 1.0382887968906718e-06,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3209483027458191,
"step": 3945,
"valid_targets_mean": 3767.5,
"valid_targets_min": 1430
},
{
"epoch": 6.360708534621578,
"grad_norm": 0.8201489913983286,
"learning_rate": 1.012903003827883e-06,
"loss": 0.3229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3404323160648346,
"step": 3950,
"valid_targets_mean": 3205.4,
"valid_targets_min": 977
},
{
"epoch": 6.368760064412238,
"grad_norm": 0.811177676991476,
"learning_rate": 9.87823336645628e-07,
"loss": 0.2924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27225881814956665,
"step": 3955,
"valid_targets_mean": 3383.2,
"valid_targets_min": 1706
},
{
"epoch": 6.3768115942028984,
"grad_norm": 0.858309663982121,
"learning_rate": 9.630501996993091e-07,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2884863018989563,
"step": 3960,
"valid_targets_mean": 2897.8,
"valid_targets_min": 1102
},
{
"epoch": 6.384863123993559,
"grad_norm": 0.9879313892597844,
"learning_rate": 9.385839924021844e-07,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3102876842021942,
"step": 3965,
"valid_targets_mean": 2376.7,
"valid_targets_min": 1197
},
{
"epoch": 6.392914653784219,
"grad_norm": 0.8341622182276683,
"learning_rate": 9.144251092189416e-07,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29059672355651855,
"step": 3970,
"valid_targets_mean": 3869.4,
"valid_targets_min": 1445
},
{
"epoch": 6.400966183574879,
"grad_norm": 0.6305412459076566,
"learning_rate": 8.905739396593316e-07,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2593904137611389,
"step": 3975,
"valid_targets_mean": 4852.6,
"valid_targets_min": 1536
},
{
"epoch": 6.4090177133655395,
"grad_norm": 0.8415630056656381,
"learning_rate": 8.670308682718853e-07,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30260005593299866,
"step": 3980,
"valid_targets_mean": 3675.9,
"valid_targets_min": 1260
},
{
"epoch": 6.4170692431562,
"grad_norm": 0.7289917763669883,
"learning_rate": 8.437962746377204e-07,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25300300121307373,
"step": 3985,
"valid_targets_mean": 3460.8,
"valid_targets_min": 406
},
{
"epoch": 6.42512077294686,
"grad_norm": 0.8183662125493177,
"learning_rate": 8.208705333644129e-07,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27502337098121643,
"step": 3990,
"valid_targets_mean": 4104.0,
"valid_targets_min": 1569
},
{
"epoch": 6.43317230273752,
"grad_norm": 0.8025243264792566,
"learning_rate": 7.982540140799688e-07,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2634972333908081,
"step": 3995,
"valid_targets_mean": 3000.4,
"valid_targets_min": 1169
},
{
"epoch": 6.4412238325281805,
"grad_norm": 0.8460006631505339,
"learning_rate": 7.759470814268489e-07,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3205861449241638,
"step": 4000,
"valid_targets_mean": 3155.8,
"valid_targets_min": 1407
},
{
"epoch": 6.449275362318841,
"grad_norm": 0.8293418081000622,
"learning_rate": 7.539500950561063e-07,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261262983083725,
"step": 4005,
"valid_targets_mean": 2876.1,
"valid_targets_min": 1097
},
{
"epoch": 6.457326892109501,
"grad_norm": 0.8476655987165361,
"learning_rate": 7.322634096215831e-07,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2980925440788269,
"step": 4010,
"valid_targets_mean": 3099.4,
"valid_targets_min": 1258
},
{
"epoch": 6.465378421900161,
"grad_norm": 0.8876078091742649,
"learning_rate": 7.108873747741807e-07,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28537583351135254,
"step": 4015,
"valid_targets_mean": 2574.1,
"valid_targets_min": 1351
},
{
"epoch": 6.473429951690822,
"grad_norm": 0.8957582444852635,
"learning_rate": 6.898223351562405e-07,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32109585404396057,
"step": 4020,
"valid_targets_mean": 3223.3,
"valid_targets_min": 1314
},
{
"epoch": 6.481481481481482,
"grad_norm": 0.764077364410412,
"learning_rate": 6.690686303959748e-07,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2634509801864624,
"step": 4025,
"valid_targets_mean": 3132.0,
"valid_targets_min": 1272
},
{
"epoch": 6.489533011272142,
"grad_norm": 0.7443505087806759,
"learning_rate": 6.48626595101991e-07,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2569301724433899,
"step": 4030,
"valid_targets_mean": 3755.3,
"valid_targets_min": 1230
},
{
"epoch": 6.4975845410628015,
"grad_norm": 0.7930493772415029,
"learning_rate": 6.284965588579028e-07,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24235209822654724,
"step": 4035,
"valid_targets_mean": 3029.9,
"valid_targets_min": 1590
},
{
"epoch": 6.505636070853463,
"grad_norm": 0.7138369856169103,
"learning_rate": 6.08678846217019e-07,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27324530482292175,
"step": 4040,
"valid_targets_mean": 3930.0,
"valid_targets_min": 1734
},
{
"epoch": 6.513687600644122,
"grad_norm": 0.7841606768019419,
"learning_rate": 5.891737766970984e-07,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32244470715522766,
"step": 4045,
"valid_targets_mean": 3632.3,
"valid_targets_min": 1021
},
{
"epoch": 6.521739130434782,
"grad_norm": 0.761125195078748,
"learning_rate": 5.699816647752077e-07,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2867166996002197,
"step": 4050,
"valid_targets_mean": 3690.8,
"valid_targets_min": 1136
},
{
"epoch": 6.5297906602254425,
"grad_norm": 0.9595718427005088,
"learning_rate": 5.511028198826496e-07,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2752280831336975,
"step": 4055,
"valid_targets_mean": 2800.6,
"valid_targets_min": 485
},
{
"epoch": 6.537842190016103,
"grad_norm": 0.7724065995439069,
"learning_rate": 5.32537546399976e-07,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3199930787086487,
"step": 4060,
"valid_targets_mean": 3744.1,
"valid_targets_min": 1267
},
{
"epoch": 6.545893719806763,
"grad_norm": 0.7955896348465847,
"learning_rate": 5.142861436520763e-07,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26323774456977844,
"step": 4065,
"valid_targets_mean": 3365.1,
"valid_targets_min": 1014
},
{
"epoch": 6.553945249597423,
"grad_norm": 0.7123095433809674,
"learning_rate": 4.963489059033477e-07,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2584189176559448,
"step": 4070,
"valid_targets_mean": 3473.1,
"valid_targets_min": 1657
},
{
"epoch": 6.561996779388084,
"grad_norm": 0.8106421482681555,
"learning_rate": 4.787261223529616e-07,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26411914825439453,
"step": 4075,
"valid_targets_mean": 2840.8,
"valid_targets_min": 1494
},
{
"epoch": 6.570048309178744,
"grad_norm": 0.7944422290785246,
"learning_rate": 4.6141807713019793e-07,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28050708770751953,
"step": 4080,
"valid_targets_mean": 2815.1,
"valid_targets_min": 1208
},
{
"epoch": 6.578099838969404,
"grad_norm": 0.7829124652037258,
"learning_rate": 4.444250492898539e-07,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2613917589187622,
"step": 4085,
"valid_targets_mean": 3228.2,
"valid_targets_min": 1394
},
{
"epoch": 6.586151368760064,
"grad_norm": 0.785576038884685,
"learning_rate": 4.277473128077625e-07,
"loss": 0.2686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2885136008262634,
"step": 4090,
"valid_targets_mean": 3174.3,
"valid_targets_min": 1240
},
{
"epoch": 6.594202898550725,
"grad_norm": 0.7531252267510662,
"learning_rate": 4.113851365763544e-07,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605210542678833,
"step": 4095,
"valid_targets_mean": 3438.4,
"valid_targets_min": 1124
},
{
"epoch": 6.602254428341385,
"grad_norm": 0.8483462893898233,
"learning_rate": 3.953387844003431e-07,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24956530332565308,
"step": 4100,
"valid_targets_mean": 2587.6,
"valid_targets_min": 1218
},
{
"epoch": 6.610305958132045,
"grad_norm": 0.8250120431362822,
"learning_rate": 3.7960851499245554e-07,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2679558992385864,
"step": 4105,
"valid_targets_mean": 2969.8,
"valid_targets_min": 1309
},
{
"epoch": 6.618357487922705,
"grad_norm": 0.9900756494723584,
"learning_rate": 3.6419458196926825e-07,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.276964396238327,
"step": 4110,
"valid_targets_mean": 3475.1,
"valid_targets_min": 1128
},
{
"epoch": 6.626409017713366,
"grad_norm": 0.7872199755262294,
"learning_rate": 3.4909723384712436e-07,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2374078333377838,
"step": 4115,
"valid_targets_mean": 2925.9,
"valid_targets_min": 1311
},
{
"epoch": 6.634460547504026,
"grad_norm": 0.7593732626595731,
"learning_rate": 3.3431671403811207e-07,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2528577148914337,
"step": 4120,
"valid_targets_mean": 3369.0,
"valid_targets_min": 1109
},
{
"epoch": 6.642512077294686,
"grad_norm": 0.7712701520481997,
"learning_rate": 3.198532608461524e-07,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27561864256858826,
"step": 4125,
"valid_targets_mean": 3307.7,
"valid_targets_min": 1172
},
{
"epoch": 6.650563607085346,
"grad_norm": 0.8293254928497902,
"learning_rate": 3.0570710746314903e-07,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2669210433959961,
"step": 4130,
"valid_targets_mean": 2625.4,
"valid_targets_min": 1313
},
{
"epoch": 6.658615136876007,
"grad_norm": 0.9102984688640577,
"learning_rate": 2.9187848196524205e-07,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29154983162879944,
"step": 4135,
"valid_targets_mean": 3028.0,
"valid_targets_min": 1602
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.7950386744860756,
"learning_rate": 2.7836760730910464e-07,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2758431136608124,
"step": 4140,
"valid_targets_mean": 3680.5,
"valid_targets_min": 1441
},
{
"epoch": 6.674718196457327,
"grad_norm": 0.77773549922398,
"learning_rate": 2.6517470132838117e-07,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2587966322898865,
"step": 4145,
"valid_targets_mean": 3472.8,
"valid_targets_min": 1029
},
{
"epoch": 6.6827697262479875,
"grad_norm": 0.8232297238523694,
"learning_rate": 2.522999767301482e-07,
"loss": 0.2689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.251497745513916,
"step": 4150,
"valid_targets_mean": 3390.6,
"valid_targets_min": 1873
},
{
"epoch": 6.690821256038648,
"grad_norm": 0.8278987027552264,
"learning_rate": 2.3974364109149886e-07,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2831830382347107,
"step": 4155,
"valid_targets_mean": 3282.8,
"valid_targets_min": 588
},
{
"epoch": 6.698872785829307,
"grad_norm": 0.7184574441839767,
"learning_rate": 2.2750589685619495e-07,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29470086097717285,
"step": 4160,
"valid_targets_mean": 4544.4,
"valid_targets_min": 1616
},
{
"epoch": 6.706924315619968,
"grad_norm": 0.6991872186724033,
"learning_rate": 2.1558694133139823e-07,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2618224620819092,
"step": 4165,
"valid_targets_mean": 3384.4,
"valid_targets_min": 1236
},
{
"epoch": 6.714975845410628,
"grad_norm": 0.6730952845085181,
"learning_rate": 2.039869666844929e-07,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2868538200855255,
"step": 4170,
"valid_targets_mean": 4230.6,
"valid_targets_min": 1229
},
{
"epoch": 6.723027375201288,
"grad_norm": 0.8142353289352747,
"learning_rate": 1.9270615993998375e-07,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27020856738090515,
"step": 4175,
"valid_targets_mean": 3359.7,
"valid_targets_min": 1076
},
{
"epoch": 6.731078904991948,
"grad_norm": 0.6894366977045292,
"learning_rate": 1.817447029764874e-07,
"loss": 0.2735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2708439230918884,
"step": 4180,
"valid_targets_mean": 4327.3,
"valid_targets_min": 1075
},
{
"epoch": 6.739130434782608,
"grad_norm": 0.6974543175965264,
"learning_rate": 1.7110277252379238e-07,
"loss": 0.2652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23700222373008728,
"step": 4185,
"valid_targets_mean": 3812.0,
"valid_targets_min": 1142
},
{
"epoch": 6.747181964573269,
"grad_norm": 0.902579622282395,
"learning_rate": 1.607805401600149e-07,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28798216581344604,
"step": 4190,
"valid_targets_mean": 2473.6,
"valid_targets_min": 1208
},
{
"epoch": 6.755233494363929,
"grad_norm": 1.1198738028974389,
"learning_rate": 1.5077817230883419e-07,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24988670647144318,
"step": 4195,
"valid_targets_mean": 7490.2,
"valid_targets_min": 2721
},
{
"epoch": 6.763285024154589,
"grad_norm": 0.6445241702724612,
"learning_rate": 1.4109583023679706e-07,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19134119153022766,
"step": 4200,
"valid_targets_mean": 6344.0,
"valid_targets_min": 3073
},
{
"epoch": 6.7713365539452495,
"grad_norm": 0.6558044755460182,
"learning_rate": 1.3173367005073545e-07,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14993247389793396,
"step": 4205,
"valid_targets_mean": 5062.1,
"valid_targets_min": 2985
},
{
"epoch": 6.77938808373591,
"grad_norm": 0.6428349765980677,
"learning_rate": 1.2269184269523282e-07,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19283941388130188,
"step": 4210,
"valid_targets_mean": 5613.6,
"valid_targets_min": 2620
},
{
"epoch": 6.78743961352657,
"grad_norm": 0.6404100414290556,
"learning_rate": 1.1397049395020842e-07,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16561368107795715,
"step": 4215,
"valid_targets_mean": 6100.1,
"valid_targets_min": 3494
},
{
"epoch": 6.79549114331723,
"grad_norm": 0.5799011128340407,
"learning_rate": 1.0556976442854805e-07,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1338614821434021,
"step": 4220,
"valid_targets_mean": 5711.6,
"valid_targets_min": 3761
},
{
"epoch": 6.8035426731078905,
"grad_norm": 0.5831529495090866,
"learning_rate": 9.748978957385025e-08,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16792958974838257,
"step": 4225,
"valid_targets_mean": 5863.1,
"valid_targets_min": 3178
},
{
"epoch": 6.811594202898551,
"grad_norm": 0.5618368648500537,
"learning_rate": 8.9730699658237e-08,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15672558546066284,
"step": 4230,
"valid_targets_mean": 6090.8,
"valid_targets_min": 2870
},
{
"epoch": 6.819645732689211,
"grad_norm": 0.5753023449670881,
"learning_rate": 8.229261978025316e-08,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14445531368255615,
"step": 4235,
"valid_targets_mean": 5746.5,
"valid_targets_min": 3334
},
{
"epoch": 6.827697262479871,
"grad_norm": 0.6046612188056499,
"learning_rate": 7.517566986285474e-08,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16920645534992218,
"step": 4240,
"valid_targets_mean": 5464.9,
"valid_targets_min": 3204
},
{
"epoch": 6.835748792270532,
"grad_norm": 0.566160926164469,
"learning_rate": 6.837996465146823e-08,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1559247374534607,
"step": 4245,
"valid_targets_mean": 5526.6,
"valid_targets_min": 2793
},
{
"epoch": 6.843800322061192,
"grad_norm": 0.5934842203255924,
"learning_rate": 6.190561371214321e-08,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17836138606071472,
"step": 4250,
"valid_targets_mean": 6074.9,
"valid_targets_min": 3285
},
{
"epoch": 6.851851851851852,
"grad_norm": 0.5989111745239429,
"learning_rate": 5.575272142978927e-08,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14026236534118652,
"step": 4255,
"valid_targets_mean": 5260.6,
"valid_targets_min": 2292
},
{
"epoch": 6.859903381642512,
"grad_norm": 0.5852529999276449,
"learning_rate": 4.992138700649074e-08,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16409310698509216,
"step": 4260,
"valid_targets_mean": 5752.9,
"valid_targets_min": 4204
},
{
"epoch": 6.867954911433173,
"grad_norm": 0.6115217698676657,
"learning_rate": 4.4411704459903506e-08,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1484546661376953,
"step": 4265,
"valid_targets_mean": 4836.7,
"valid_targets_min": 2111
},
{
"epoch": 6.876006441223833,
"grad_norm": 0.6316569084859304,
"learning_rate": 3.92237626217451e-08,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18417194485664368,
"step": 4270,
"valid_targets_mean": 6021.0,
"valid_targets_min": 4439
},
{
"epoch": 6.884057971014493,
"grad_norm": 0.5659170506134107,
"learning_rate": 3.435764513635809e-08,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16125309467315674,
"step": 4275,
"valid_targets_mean": 5661.9,
"valid_targets_min": 3607
},
{
"epoch": 6.892109500805153,
"grad_norm": 0.6183161652818728,
"learning_rate": 2.9813430459364465e-08,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16375675797462463,
"step": 4280,
"valid_targets_mean": 5420.4,
"valid_targets_min": 3078
},
{
"epoch": 6.900161030595813,
"grad_norm": 0.598243453584514,
"learning_rate": 2.5591191856397802e-08,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15643054246902466,
"step": 4285,
"valid_targets_mean": 5750.4,
"valid_targets_min": 2491
},
{
"epoch": 6.908212560386474,
"grad_norm": 0.5759364478429377,
"learning_rate": 2.1690997401928593e-08,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14383944869041443,
"step": 4290,
"valid_targets_mean": 5996.6,
"valid_targets_min": 4004
},
{
"epoch": 6.916264090177133,
"grad_norm": 0.5552887684264204,
"learning_rate": 1.811290997815851e-08,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14651936292648315,
"step": 4295,
"valid_targets_mean": 6200.9,
"valid_targets_min": 3148
},
{
"epoch": 6.9243156199677935,
"grad_norm": 0.49927201422387957,
"learning_rate": 1.485698727400564e-08,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13894528150558472,
"step": 4300,
"valid_targets_mean": 6472.3,
"valid_targets_min": 3581
},
{
"epoch": 6.932367149758454,
"grad_norm": 0.6237894773842607,
"learning_rate": 1.1923281784185226e-08,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22623667120933533,
"step": 4305,
"valid_targets_mean": 7532.8,
"valid_targets_min": 3206
},
{
"epoch": 6.940418679549114,
"grad_norm": 0.5964161951339775,
"learning_rate": 9.311840808357009e-09,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1940787136554718,
"step": 4310,
"valid_targets_mean": 5952.9,
"valid_targets_min": 3304
},
{
"epoch": 6.948470209339774,
"grad_norm": 0.5723446720622757,
"learning_rate": 7.022706450354744e-09,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15612125396728516,
"step": 4315,
"valid_targets_mean": 5735.1,
"valid_targets_min": 3368
},
{
"epoch": 6.956521739130435,
"grad_norm": 0.6247370179630106,
"learning_rate": 5.055915617522278e-09,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16278734803199768,
"step": 4320,
"valid_targets_mean": 5506.7,
"valid_targets_min": 2908
},
{
"epoch": 6.964573268921095,
"grad_norm": 0.6002549871414108,
"learning_rate": 3.411500020109593e-09,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16616703569889069,
"step": 4325,
"valid_targets_mean": 5777.9,
"valid_targets_min": 3451
},
{
"epoch": 6.972624798711755,
"grad_norm": 0.4927861563779905,
"learning_rate": 2.08948617075988e-09,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13573740422725677,
"step": 4330,
"valid_targets_mean": 6045.9,
"valid_targets_min": 2967
},
{
"epoch": 6.980676328502415,
"grad_norm": 0.5443175862615581,
"learning_rate": 1.0898953840898786e-09,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1544107049703598,
"step": 4335,
"valid_targets_mean": 6113.4,
"valid_targets_min": 3912
},
{
"epoch": 6.988727858293076,
"grad_norm": 0.5346570746956858,
"learning_rate": 4.127437763390418e-10,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1397796869277954,
"step": 4340,
"valid_targets_mean": 5837.0,
"valid_targets_min": 3528
},
{
"epoch": 6.996779388083736,
"grad_norm": 0.5722567869143517,
"learning_rate": 5.804226511196831e-11,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16464683413505554,
"step": 4345,
"valid_targets_mean": 6356.6,
"valid_targets_min": 3725
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18215620517730713,
"step": 4347,
"total_flos": 1416797650550784.0,
"train_loss": 0.3156141554908915,
"train_runtime": 23294.0349,
"train_samples_per_second": 2.983,
"train_steps_per_second": 0.187,
"valid_targets_mean": 6658.9,
"valid_targets_min": 2494
}
],
"logging_steps": 5,
"max_steps": 4347,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1416797650550784.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}