a1-stack_ruby / trainer_state.json
EtashGuha's picture
Upload folder using huggingface_hub
1825d59 verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4347,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008051529790660225,
"grad_norm": 18.887031329342683,
"learning_rate": 3.6781609195402303e-07,
"loss": 0.7617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7170521020889282,
"step": 5,
"valid_targets_mean": 4721.3,
"valid_targets_min": 995
},
{
"epoch": 0.01610305958132045,
"grad_norm": 17.610592482733104,
"learning_rate": 8.275862068965518e-07,
"loss": 0.7308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7500532865524292,
"step": 10,
"valid_targets_mean": 4560.7,
"valid_targets_min": 1282
},
{
"epoch": 0.024154589371980676,
"grad_norm": 17.389455158716025,
"learning_rate": 1.2873563218390806e-06,
"loss": 0.719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7645566463470459,
"step": 15,
"valid_targets_mean": 4224.9,
"valid_targets_min": 1424
},
{
"epoch": 0.0322061191626409,
"grad_norm": 12.900467657800844,
"learning_rate": 1.7471264367816093e-06,
"loss": 0.6498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6394810676574707,
"step": 20,
"valid_targets_mean": 3705.6,
"valid_targets_min": 613
},
{
"epoch": 0.040257648953301126,
"grad_norm": 8.27577785552847,
"learning_rate": 2.206896551724138e-06,
"loss": 0.6021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6195220351219177,
"step": 25,
"valid_targets_mean": 4815.3,
"valid_targets_min": 1591
},
{
"epoch": 0.04830917874396135,
"grad_norm": 4.570129109709082,
"learning_rate": 2.666666666666667e-06,
"loss": 0.5337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4826958477497101,
"step": 30,
"valid_targets_mean": 4646.1,
"valid_targets_min": 1763
},
{
"epoch": 0.05636070853462158,
"grad_norm": 2.9815097303289773,
"learning_rate": 3.1264367816091956e-06,
"loss": 0.5145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5005267858505249,
"step": 35,
"valid_targets_mean": 4164.2,
"valid_targets_min": 1256
},
{
"epoch": 0.0644122383252818,
"grad_norm": 1.6024853481776866,
"learning_rate": 3.5862068965517243e-06,
"loss": 0.4877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43937644362449646,
"step": 40,
"valid_targets_mean": 4963.1,
"valid_targets_min": 1405
},
{
"epoch": 0.07246376811594203,
"grad_norm": 1.1550666348042289,
"learning_rate": 4.0459770114942535e-06,
"loss": 0.4836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45346975326538086,
"step": 45,
"valid_targets_mean": 5371.4,
"valid_targets_min": 1739
},
{
"epoch": 0.08051529790660225,
"grad_norm": 1.1056770926806292,
"learning_rate": 4.505747126436782e-06,
"loss": 0.4879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4831688106060028,
"step": 50,
"valid_targets_mean": 5321.5,
"valid_targets_min": 1966
},
{
"epoch": 0.08856682769726248,
"grad_norm": 0.9520259825035011,
"learning_rate": 4.965517241379311e-06,
"loss": 0.4173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43055927753448486,
"step": 55,
"valid_targets_mean": 4930.1,
"valid_targets_min": 1613
},
{
"epoch": 0.0966183574879227,
"grad_norm": 0.7379387322001421,
"learning_rate": 5.42528735632184e-06,
"loss": 0.4301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41147735714912415,
"step": 60,
"valid_targets_mean": 4576.1,
"valid_targets_min": 693
},
{
"epoch": 0.10466988727858294,
"grad_norm": 0.6751399532440802,
"learning_rate": 5.8850574712643685e-06,
"loss": 0.3953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40098029375076294,
"step": 65,
"valid_targets_mean": 4767.1,
"valid_targets_min": 1984
},
{
"epoch": 0.11272141706924316,
"grad_norm": 0.6451168287397513,
"learning_rate": 6.344827586206898e-06,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41312819719314575,
"step": 70,
"valid_targets_mean": 4322.2,
"valid_targets_min": 523
},
{
"epoch": 0.12077294685990338,
"grad_norm": 0.6097646247381094,
"learning_rate": 6.804597701149426e-06,
"loss": 0.4048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3773424029350281,
"step": 75,
"valid_targets_mean": 4922.2,
"valid_targets_min": 1736
},
{
"epoch": 0.1288244766505636,
"grad_norm": 0.6955263869864199,
"learning_rate": 7.264367816091955e-06,
"loss": 0.386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3395404815673828,
"step": 80,
"valid_targets_mean": 4326.2,
"valid_targets_min": 822
},
{
"epoch": 0.13687600644122383,
"grad_norm": 0.6047921080138658,
"learning_rate": 7.724137931034483e-06,
"loss": 0.373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33859458565711975,
"step": 85,
"valid_targets_mean": 4358.8,
"valid_targets_min": 2465
},
{
"epoch": 0.14492753623188406,
"grad_norm": 0.5884903953581806,
"learning_rate": 8.183908045977013e-06,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.323479026556015,
"step": 90,
"valid_targets_mean": 4712.4,
"valid_targets_min": 2373
},
{
"epoch": 0.1529790660225443,
"grad_norm": 0.5738600516460006,
"learning_rate": 8.643678160919541e-06,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33414769172668457,
"step": 95,
"valid_targets_mean": 4288.1,
"valid_targets_min": 1850
},
{
"epoch": 0.1610305958132045,
"grad_norm": 0.6365501852080249,
"learning_rate": 9.10344827586207e-06,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41237330436706543,
"step": 100,
"valid_targets_mean": 4589.5,
"valid_targets_min": 617
},
{
"epoch": 0.16908212560386474,
"grad_norm": 0.5810936825227695,
"learning_rate": 9.563218390804598e-06,
"loss": 0.3694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3179246783256531,
"step": 105,
"valid_targets_mean": 4583.3,
"valid_targets_min": 892
},
{
"epoch": 0.17713365539452497,
"grad_norm": 0.6085982104059682,
"learning_rate": 1.0022988505747126e-05,
"loss": 0.3688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3603907823562622,
"step": 110,
"valid_targets_mean": 3972.6,
"valid_targets_min": 529
},
{
"epoch": 0.18518518518518517,
"grad_norm": 0.6219836430762767,
"learning_rate": 1.0482758620689658e-05,
"loss": 0.3434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36107924580574036,
"step": 115,
"valid_targets_mean": 3626.8,
"valid_targets_min": 784
},
{
"epoch": 0.1932367149758454,
"grad_norm": 0.5706613275227181,
"learning_rate": 1.0942528735632186e-05,
"loss": 0.3638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35068589448928833,
"step": 120,
"valid_targets_mean": 4590.1,
"valid_targets_min": 708
},
{
"epoch": 0.20128824476650564,
"grad_norm": 0.5239098489712369,
"learning_rate": 1.1402298850574713e-05,
"loss": 0.3214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31050339341163635,
"step": 125,
"valid_targets_mean": 4365.3,
"valid_targets_min": 919
},
{
"epoch": 0.20933977455716588,
"grad_norm": 0.5408209063854124,
"learning_rate": 1.1862068965517241e-05,
"loss": 0.3312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.343374639749527,
"step": 130,
"valid_targets_mean": 4735.1,
"valid_targets_min": 502
},
{
"epoch": 0.21739130434782608,
"grad_norm": 0.5429590967253727,
"learning_rate": 1.2321839080459773e-05,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2973455786705017,
"step": 135,
"valid_targets_mean": 4331.6,
"valid_targets_min": 1580
},
{
"epoch": 0.22544283413848631,
"grad_norm": 0.5564263430607277,
"learning_rate": 1.2781609195402301e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33352577686309814,
"step": 140,
"valid_targets_mean": 4605.9,
"valid_targets_min": 973
},
{
"epoch": 0.23349436392914655,
"grad_norm": 0.59405705309966,
"learning_rate": 1.324137931034483e-05,
"loss": 0.3197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31183719635009766,
"step": 145,
"valid_targets_mean": 3893.1,
"valid_targets_min": 1253
},
{
"epoch": 0.24154589371980675,
"grad_norm": 0.5158909121745847,
"learning_rate": 1.3701149425287356e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2867949604988098,
"step": 150,
"valid_targets_mean": 4840.7,
"valid_targets_min": 1486
},
{
"epoch": 0.249597423510467,
"grad_norm": 0.6568765520342051,
"learning_rate": 1.4160919540229888e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3462482690811157,
"step": 155,
"valid_targets_mean": 3947.3,
"valid_targets_min": 1429
},
{
"epoch": 0.2576489533011272,
"grad_norm": 0.6071351268604575,
"learning_rate": 1.4620689655172416e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33247584104537964,
"step": 160,
"valid_targets_mean": 4600.6,
"valid_targets_min": 1925
},
{
"epoch": 0.26570048309178745,
"grad_norm": 0.538560909580689,
"learning_rate": 1.5080459770114944e-05,
"loss": 0.3158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31049293279647827,
"step": 165,
"valid_targets_mean": 5258.5,
"valid_targets_min": 1983
},
{
"epoch": 0.27375201288244766,
"grad_norm": 0.568539391929678,
"learning_rate": 1.5540229885057473e-05,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30851513147354126,
"step": 170,
"valid_targets_mean": 4449.2,
"valid_targets_min": 453
},
{
"epoch": 0.28180354267310787,
"grad_norm": 0.6078239781315768,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.302283376455307,
"step": 175,
"valid_targets_mean": 4618.0,
"valid_targets_min": 2377
},
{
"epoch": 0.2898550724637681,
"grad_norm": 0.5885746435904814,
"learning_rate": 1.645977011494253e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3404327630996704,
"step": 180,
"valid_targets_mean": 4848.8,
"valid_targets_min": 1075
},
{
"epoch": 0.29790660225442833,
"grad_norm": 0.6287600513879442,
"learning_rate": 1.691954022988506e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35874509811401367,
"step": 185,
"valid_targets_mean": 4003.5,
"valid_targets_min": 321
},
{
"epoch": 0.3059581320450886,
"grad_norm": 0.5118887113449945,
"learning_rate": 1.7379310344827586e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192656636238098,
"step": 190,
"valid_targets_mean": 5059.1,
"valid_targets_min": 2133
},
{
"epoch": 0.3140096618357488,
"grad_norm": 0.5676499502591437,
"learning_rate": 1.7839080459770116e-05,
"loss": 0.2746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2645234167575836,
"step": 195,
"valid_targets_mean": 4453.4,
"valid_targets_min": 1599
},
{
"epoch": 0.322061191626409,
"grad_norm": 0.5756721398531897,
"learning_rate": 1.8298850574712646e-05,
"loss": 0.3204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3237614631652832,
"step": 200,
"valid_targets_mean": 4916.9,
"valid_targets_min": 2747
},
{
"epoch": 0.33011272141706927,
"grad_norm": 0.661205961638061,
"learning_rate": 1.8758620689655173e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30946576595306396,
"step": 205,
"valid_targets_mean": 4202.1,
"valid_targets_min": 1793
},
{
"epoch": 0.33816425120772947,
"grad_norm": 0.5585042067771965,
"learning_rate": 1.9218390804597703e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30198991298675537,
"step": 210,
"valid_targets_mean": 4014.8,
"valid_targets_min": 1521
},
{
"epoch": 0.3462157809983897,
"grad_norm": 0.5364392722283728,
"learning_rate": 1.9678160919540233e-05,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3075558841228485,
"step": 215,
"valid_targets_mean": 4535.4,
"valid_targets_min": 736
},
{
"epoch": 0.35426731078904994,
"grad_norm": 0.5478504018061776,
"learning_rate": 2.013793103448276e-05,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30238276720046997,
"step": 220,
"valid_targets_mean": 4278.9,
"valid_targets_min": 506
},
{
"epoch": 0.36231884057971014,
"grad_norm": 0.5543366789399233,
"learning_rate": 2.059770114942529e-05,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31759655475616455,
"step": 225,
"valid_targets_mean": 5445.6,
"valid_targets_min": 1006
},
{
"epoch": 0.37037037037037035,
"grad_norm": 0.6286539962949731,
"learning_rate": 2.1057471264367816e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30352896451950073,
"step": 230,
"valid_targets_mean": 3805.3,
"valid_targets_min": 676
},
{
"epoch": 0.3784219001610306,
"grad_norm": 0.5644783614075699,
"learning_rate": 2.1517241379310346e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3186013102531433,
"step": 235,
"valid_targets_mean": 4621.7,
"valid_targets_min": 1571
},
{
"epoch": 0.3864734299516908,
"grad_norm": 0.5931980260785429,
"learning_rate": 2.1977011494252873e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28426745533943176,
"step": 240,
"valid_targets_mean": 4771.1,
"valid_targets_min": 2048
},
{
"epoch": 0.394524959742351,
"grad_norm": 0.5236909740791719,
"learning_rate": 2.2436781609195406e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2973197102546692,
"step": 245,
"valid_targets_mean": 4744.9,
"valid_targets_min": 1209
},
{
"epoch": 0.4025764895330113,
"grad_norm": 0.5306243392897267,
"learning_rate": 2.2896551724137933e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3088257312774658,
"step": 250,
"valid_targets_mean": 5178.1,
"valid_targets_min": 1966
},
{
"epoch": 0.4106280193236715,
"grad_norm": 0.48677773497495813,
"learning_rate": 2.3356321839080463e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26008594036102295,
"step": 255,
"valid_targets_mean": 5040.2,
"valid_targets_min": 1177
},
{
"epoch": 0.41867954911433175,
"grad_norm": 1.2774083864267622,
"learning_rate": 2.381609195402299e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2775506377220154,
"step": 260,
"valid_targets_mean": 4319.1,
"valid_targets_min": 570
},
{
"epoch": 0.42673107890499196,
"grad_norm": 0.6457594097564714,
"learning_rate": 2.427586206896552e-05,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2859913408756256,
"step": 265,
"valid_targets_mean": 3785.8,
"valid_targets_min": 284
},
{
"epoch": 0.43478260869565216,
"grad_norm": 0.5721794133457904,
"learning_rate": 2.4735632183908046e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2737387716770172,
"step": 270,
"valid_targets_mean": 4904.9,
"valid_targets_min": 1197
},
{
"epoch": 0.4428341384863124,
"grad_norm": 0.6155727873490212,
"learning_rate": 2.5195402298850576e-05,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.317902147769928,
"step": 275,
"valid_targets_mean": 3661.2,
"valid_targets_min": 818
},
{
"epoch": 0.45088566827697263,
"grad_norm": 0.6349757508130273,
"learning_rate": 2.5655172413793103e-05,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2630305290222168,
"step": 280,
"valid_targets_mean": 3326.7,
"valid_targets_min": 941
},
{
"epoch": 0.45893719806763283,
"grad_norm": 0.6148296415866233,
"learning_rate": 2.6114942528735636e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27396440505981445,
"step": 285,
"valid_targets_mean": 4434.6,
"valid_targets_min": 1038
},
{
"epoch": 0.4669887278582931,
"grad_norm": 0.5645172489838126,
"learning_rate": 2.6574712643678166e-05,
"loss": 0.2686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25225305557250977,
"step": 290,
"valid_targets_mean": 4993.3,
"valid_targets_min": 1962
},
{
"epoch": 0.4750402576489533,
"grad_norm": 0.5739342126572219,
"learning_rate": 2.7034482758620693e-05,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.340742826461792,
"step": 295,
"valid_targets_mean": 4796.8,
"valid_targets_min": 710
},
{
"epoch": 0.4830917874396135,
"grad_norm": 0.5587075968581772,
"learning_rate": 2.749425287356322e-05,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27218180894851685,
"step": 300,
"valid_targets_mean": 4788.8,
"valid_targets_min": 882
},
{
"epoch": 0.49114331723027377,
"grad_norm": 0.7790422573070022,
"learning_rate": 2.795402298850575e-05,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25361332297325134,
"step": 305,
"valid_targets_mean": 3807.0,
"valid_targets_min": 344
},
{
"epoch": 0.499194847020934,
"grad_norm": 0.5359108312034309,
"learning_rate": 2.8413793103448276e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24744702875614166,
"step": 310,
"valid_targets_mean": 4844.2,
"valid_targets_min": 1948
},
{
"epoch": 0.5072463768115942,
"grad_norm": 0.7694244503734501,
"learning_rate": 2.8873563218390806e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25962382555007935,
"step": 315,
"valid_targets_mean": 3957.3,
"valid_targets_min": 751
},
{
"epoch": 0.5152979066022544,
"grad_norm": 0.6998112569580612,
"learning_rate": 2.9333333333333333e-05,
"loss": 0.2823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.283919095993042,
"step": 320,
"valid_targets_mean": 4178.9,
"valid_targets_min": 1504
},
{
"epoch": 0.5233494363929146,
"grad_norm": 0.5572107376686236,
"learning_rate": 2.9793103448275866e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3307899236679077,
"step": 325,
"valid_targets_mean": 4934.9,
"valid_targets_min": 860
},
{
"epoch": 0.5314009661835749,
"grad_norm": 0.5601650228344617,
"learning_rate": 3.0252873563218396e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26864737272262573,
"step": 330,
"valid_targets_mean": 3976.2,
"valid_targets_min": 1313
},
{
"epoch": 0.5394524959742351,
"grad_norm": 0.6400241549564539,
"learning_rate": 3.071264367816092e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2869405746459961,
"step": 335,
"valid_targets_mean": 4011.7,
"valid_targets_min": 952
},
{
"epoch": 0.5475040257648953,
"grad_norm": 0.5021644926973708,
"learning_rate": 3.117241379310345e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2651926279067993,
"step": 340,
"valid_targets_mean": 5310.1,
"valid_targets_min": 692
},
{
"epoch": 0.5555555555555556,
"grad_norm": 0.819724946601287,
"learning_rate": 3.1632183908045976e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.297665536403656,
"step": 345,
"valid_targets_mean": 3748.9,
"valid_targets_min": 249
},
{
"epoch": 0.5636070853462157,
"grad_norm": 0.49635945683598137,
"learning_rate": 3.2091954022988506e-05,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27254384756088257,
"step": 350,
"valid_targets_mean": 4190.4,
"valid_targets_min": 380
},
{
"epoch": 0.571658615136876,
"grad_norm": 1.1643886506532481,
"learning_rate": 3.2551724137931036e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615281343460083,
"step": 355,
"valid_targets_mean": 3684.1,
"valid_targets_min": 304
},
{
"epoch": 0.5797101449275363,
"grad_norm": 0.5045131044975655,
"learning_rate": 3.3011494252873566e-05,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28446757793426514,
"step": 360,
"valid_targets_mean": 5213.9,
"valid_targets_min": 2518
},
{
"epoch": 0.5877616747181964,
"grad_norm": 0.5901966768401951,
"learning_rate": 3.3471264367816096e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2504952549934387,
"step": 365,
"valid_targets_mean": 4182.6,
"valid_targets_min": 691
},
{
"epoch": 0.5958132045088567,
"grad_norm": 0.620399649393727,
"learning_rate": 3.3931034482758626e-05,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2381853461265564,
"step": 370,
"valid_targets_mean": 4586.0,
"valid_targets_min": 1672
},
{
"epoch": 0.6038647342995169,
"grad_norm": 0.5417315383509183,
"learning_rate": 3.4390804597701156e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672516405582428,
"step": 375,
"valid_targets_mean": 4311.4,
"valid_targets_min": 1082
},
{
"epoch": 0.6119162640901772,
"grad_norm": 0.6433514192784039,
"learning_rate": 3.485057471264368e-05,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32015344500541687,
"step": 380,
"valid_targets_mean": 3902.9,
"valid_targets_min": 1623
},
{
"epoch": 0.6199677938808373,
"grad_norm": 0.4775998328542989,
"learning_rate": 3.531034482758621e-05,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24788491427898407,
"step": 385,
"valid_targets_mean": 4189.4,
"valid_targets_min": 713
},
{
"epoch": 0.6280193236714976,
"grad_norm": 0.5122265709609899,
"learning_rate": 3.577011494252874e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27622339129447937,
"step": 390,
"valid_targets_mean": 4446.6,
"valid_targets_min": 1670
},
{
"epoch": 0.6360708534621579,
"grad_norm": 0.659466553378636,
"learning_rate": 3.622988505747126e-05,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3116128742694855,
"step": 395,
"valid_targets_mean": 4667.6,
"valid_targets_min": 1070
},
{
"epoch": 0.644122383252818,
"grad_norm": 0.5849425616180388,
"learning_rate": 3.668965517241379e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27755099534988403,
"step": 400,
"valid_targets_mean": 4714.6,
"valid_targets_min": 995
},
{
"epoch": 0.6521739130434783,
"grad_norm": 0.5327108961779472,
"learning_rate": 3.714942528735633e-05,
"loss": 0.2745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27385851740837097,
"step": 405,
"valid_targets_mean": 5260.8,
"valid_targets_min": 2141
},
{
"epoch": 0.6602254428341385,
"grad_norm": 0.5998643197455865,
"learning_rate": 3.760919540229885e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3069554567337036,
"step": 410,
"valid_targets_mean": 4323.8,
"valid_targets_min": 831
},
{
"epoch": 0.6682769726247987,
"grad_norm": 0.5690712799581026,
"learning_rate": 3.806896551724138e-05,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29719623923301697,
"step": 415,
"valid_targets_mean": 4270.9,
"valid_targets_min": 1089
},
{
"epoch": 0.6763285024154589,
"grad_norm": 0.5754513117973928,
"learning_rate": 3.852873563218391e-05,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29911819100379944,
"step": 420,
"valid_targets_mean": 4512.4,
"valid_targets_min": 1988
},
{
"epoch": 0.6843800322061192,
"grad_norm": 0.6061703211904361,
"learning_rate": 3.898850574712644e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23556432127952576,
"step": 425,
"valid_targets_mean": 3921.6,
"valid_targets_min": 1217
},
{
"epoch": 0.6924315619967794,
"grad_norm": 0.5391890622955845,
"learning_rate": 3.9448275862068966e-05,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23832057416439056,
"step": 430,
"valid_targets_mean": 4345.2,
"valid_targets_min": 2090
},
{
"epoch": 0.7004830917874396,
"grad_norm": 0.6101927641358206,
"learning_rate": 3.9908045977011496e-05,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2649371325969696,
"step": 435,
"valid_targets_mean": 4433.6,
"valid_targets_min": 1317
},
{
"epoch": 0.7085346215780999,
"grad_norm": 0.5646390271799305,
"learning_rate": 3.9999896813789735e-05,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27699440717697144,
"step": 440,
"valid_targets_mean": 4894.1,
"valid_targets_min": 731
},
{
"epoch": 0.71658615136876,
"grad_norm": 0.5718807548846909,
"learning_rate": 3.999947762163533e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29374945163726807,
"step": 445,
"valid_targets_mean": 3907.8,
"valid_targets_min": 1022
},
{
"epoch": 0.7246376811594203,
"grad_norm": 0.5614682322405541,
"learning_rate": 3.999873598115203e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257183313369751,
"step": 450,
"valid_targets_mean": 4987.9,
"valid_targets_min": 1860
},
{
"epoch": 0.7326892109500805,
"grad_norm": 0.5300074790618707,
"learning_rate": 3.999767190429718e-05,
"loss": 0.2748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23682445287704468,
"step": 455,
"valid_targets_mean": 5225.4,
"valid_targets_min": 2450
},
{
"epoch": 0.7407407407407407,
"grad_norm": 0.6542049865844981,
"learning_rate": 3.99962854082267e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29080742597579956,
"step": 460,
"valid_targets_mean": 4597.2,
"valid_targets_min": 2222
},
{
"epoch": 0.748792270531401,
"grad_norm": 0.502946880278254,
"learning_rate": 3.9994576515294864e-05,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28522011637687683,
"step": 465,
"valid_targets_mean": 4706.1,
"valid_targets_min": 1773
},
{
"epoch": 0.7568438003220612,
"grad_norm": 0.5050040823394027,
"learning_rate": 3.999254525305386e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2506832480430603,
"step": 470,
"valid_targets_mean": 5194.9,
"valid_targets_min": 715
},
{
"epoch": 0.7648953301127214,
"grad_norm": 0.8322414020355918,
"learning_rate": 3.999019165425341e-05,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29580700397491455,
"step": 475,
"valid_targets_mean": 3748.2,
"valid_targets_min": 1077
},
{
"epoch": 0.7729468599033816,
"grad_norm": 0.5680386432970268,
"learning_rate": 3.99875157568402e-05,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2671373188495636,
"step": 480,
"valid_targets_mean": 4587.8,
"valid_targets_min": 775
},
{
"epoch": 0.7809983896940419,
"grad_norm": 0.5112203887556883,
"learning_rate": 3.998451760395729e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2868801951408386,
"step": 485,
"valid_targets_mean": 4774.4,
"valid_targets_min": 1792
},
{
"epoch": 0.789049919484702,
"grad_norm": 0.5606005265672219,
"learning_rate": 3.99811972439434e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2751631736755371,
"step": 490,
"valid_targets_mean": 4579.5,
"valid_targets_min": 1396
},
{
"epoch": 0.7971014492753623,
"grad_norm": 0.5467905444044749,
"learning_rate": 3.997755473033218e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2562072277069092,
"step": 495,
"valid_targets_mean": 3827.3,
"valid_targets_min": 1348
},
{
"epoch": 0.8051529790660226,
"grad_norm": 0.5387721194984708,
"learning_rate": 3.997359012185127e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2520545721054077,
"step": 500,
"valid_targets_mean": 4061.6,
"valid_targets_min": 547
},
{
"epoch": 0.8132045088566827,
"grad_norm": 0.5976518636156888,
"learning_rate": 3.996930348242141e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23626355826854706,
"step": 505,
"valid_targets_mean": 4540.9,
"valid_targets_min": 1484
},
{
"epoch": 0.821256038647343,
"grad_norm": 0.6166919816090995,
"learning_rate": 3.996469488115539e-05,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615845203399658,
"step": 510,
"valid_targets_mean": 4508.8,
"valid_targets_min": 1246
},
{
"epoch": 0.8293075684380032,
"grad_norm": 0.530813397454018,
"learning_rate": 3.995976439235694e-05,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2612318694591522,
"step": 515,
"valid_targets_mean": 4225.1,
"valid_targets_min": 1044
},
{
"epoch": 0.8373590982286635,
"grad_norm": 0.6517729260520128,
"learning_rate": 3.995451209551953e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23576730489730835,
"step": 520,
"valid_targets_mean": 5023.0,
"valid_targets_min": 1701
},
{
"epoch": 0.8454106280193237,
"grad_norm": 0.4740752251218264,
"learning_rate": 3.994893807532509e-05,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28204214572906494,
"step": 525,
"valid_targets_mean": 4959.8,
"valid_targets_min": 1081
},
{
"epoch": 0.8534621578099839,
"grad_norm": 0.5257899294040256,
"learning_rate": 3.994304242164265e-05,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2655045986175537,
"step": 530,
"valid_targets_mean": 4981.6,
"valid_targets_min": 2051
},
{
"epoch": 0.8615136876006442,
"grad_norm": 0.536523092714892,
"learning_rate": 3.9936825229526855e-05,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29214853048324585,
"step": 535,
"valid_targets_mean": 4368.4,
"valid_targets_min": 2191
},
{
"epoch": 0.8695652173913043,
"grad_norm": 0.5028299546325571,
"learning_rate": 3.9930286599216506e-05,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27183425426483154,
"step": 540,
"valid_targets_mean": 5098.8,
"valid_targets_min": 2186
},
{
"epoch": 0.8776167471819646,
"grad_norm": 0.5635419055915679,
"learning_rate": 3.9923426636132866e-05,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2873607277870178,
"step": 545,
"valid_targets_mean": 4578.5,
"valid_targets_min": 1671
},
{
"epoch": 0.8856682769726248,
"grad_norm": 0.5724413640787459,
"learning_rate": 3.991624545087801e-05,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27895426750183105,
"step": 550,
"valid_targets_mean": 3958.7,
"valid_targets_min": 1181
},
{
"epoch": 0.893719806763285,
"grad_norm": 0.5024007626126078,
"learning_rate": 3.9908743159233016e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20082515478134155,
"step": 555,
"valid_targets_mean": 4550.9,
"valid_targets_min": 1029
},
{
"epoch": 0.9017713365539453,
"grad_norm": 0.5485922659002295,
"learning_rate": 3.990091988215612e-05,
"loss": 0.2468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2621651887893677,
"step": 560,
"valid_targets_mean": 4163.2,
"valid_targets_min": 1507
},
{
"epoch": 0.9098228663446055,
"grad_norm": 0.5184933123196136,
"learning_rate": 3.989277574578074e-05,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20918220281600952,
"step": 565,
"valid_targets_mean": 3785.8,
"valid_targets_min": 990
},
{
"epoch": 0.9178743961352657,
"grad_norm": 0.5186343425685319,
"learning_rate": 3.9884310881413473e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2877514362335205,
"step": 570,
"valid_targets_mean": 5365.6,
"valid_targets_min": 956
},
{
"epoch": 0.9259259259259259,
"grad_norm": 0.5097833267576443,
"learning_rate": 3.987552542553194e-05,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23448419570922852,
"step": 575,
"valid_targets_mean": 4300.2,
"valid_targets_min": 1615
},
{
"epoch": 0.9339774557165862,
"grad_norm": 0.5183101791069704,
"learning_rate": 3.9866419519782636e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2744702696800232,
"step": 580,
"valid_targets_mean": 4674.6,
"valid_targets_min": 267
},
{
"epoch": 0.9420289855072463,
"grad_norm": 0.5621277031078485,
"learning_rate": 3.985699331097858e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2877187728881836,
"step": 585,
"valid_targets_mean": 4813.2,
"valid_targets_min": 720
},
{
"epoch": 0.9500805152979066,
"grad_norm": 0.6940945000218365,
"learning_rate": 3.984724695109702e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29620370268821716,
"step": 590,
"valid_targets_mean": 5132.4,
"valid_targets_min": 1631
},
{
"epoch": 0.9581320450885669,
"grad_norm": 0.6065162564844915,
"learning_rate": 3.983718059727693e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27759110927581787,
"step": 595,
"valid_targets_mean": 3982.5,
"valid_targets_min": 1549
},
{
"epoch": 0.966183574879227,
"grad_norm": 0.5059275833472612,
"learning_rate": 3.9826794411816495e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27101898193359375,
"step": 600,
"valid_targets_mean": 4788.5,
"valid_targets_min": 1713
},
{
"epoch": 0.9742351046698873,
"grad_norm": 0.4992312775195265,
"learning_rate": 3.981608856217049e-05,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23076659440994263,
"step": 605,
"valid_targets_mean": 4342.8,
"valid_targets_min": 1263
},
{
"epoch": 0.9822866344605475,
"grad_norm": 0.5353175524067539,
"learning_rate": 3.980506322094761e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2311723828315735,
"step": 610,
"valid_targets_mean": 4810.8,
"valid_targets_min": 570
},
{
"epoch": 0.9903381642512077,
"grad_norm": 0.6330855933495575,
"learning_rate": 3.979371856590762e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28571778535842896,
"step": 615,
"valid_targets_mean": 4376.3,
"valid_targets_min": 2240
},
{
"epoch": 0.998389694041868,
"grad_norm": 0.5397840170469355,
"learning_rate": 3.978205477995856e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24998024106025696,
"step": 620,
"valid_targets_mean": 4034.1,
"valid_targets_min": 1638
},
{
"epoch": 1.0064412238325282,
"grad_norm": 0.5507361899409122,
"learning_rate": 3.9770072051153754e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252638041973114,
"step": 625,
"valid_targets_mean": 4238.3,
"valid_targets_min": 1021
},
{
"epoch": 1.0144927536231885,
"grad_norm": 0.5602531648929935,
"learning_rate": 3.9757770572688786e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23810608685016632,
"step": 630,
"valid_targets_mean": 3836.5,
"valid_targets_min": 1569
},
{
"epoch": 1.0225442834138487,
"grad_norm": 0.5389828337838378,
"learning_rate": 3.9745150542898405e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20239052176475525,
"step": 635,
"valid_targets_mean": 3506.9,
"valid_targets_min": 1175
},
{
"epoch": 1.0305958132045088,
"grad_norm": 0.5471627213957879,
"learning_rate": 3.97322121652533e-05,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23700180649757385,
"step": 640,
"valid_targets_mean": 4167.8,
"valid_targets_min": 380
},
{
"epoch": 1.038647342995169,
"grad_norm": 0.5304941534687796,
"learning_rate": 3.971895564835683e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21442700922489166,
"step": 645,
"valid_targets_mean": 4103.1,
"valid_targets_min": 1034
},
{
"epoch": 1.0466988727858293,
"grad_norm": 0.5123253191465812,
"learning_rate": 3.970538120594166e-05,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22118300199508667,
"step": 650,
"valid_targets_mean": 4709.2,
"valid_targets_min": 1225
},
{
"epoch": 1.0547504025764896,
"grad_norm": 0.5144164225120834,
"learning_rate": 3.9691489056866324e-05,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2365712821483612,
"step": 655,
"valid_targets_mean": 4630.8,
"valid_targets_min": 862
},
{
"epoch": 1.0628019323671498,
"grad_norm": 0.6461651582671288,
"learning_rate": 3.9677279425111684e-05,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24799947440624237,
"step": 660,
"valid_targets_mean": 4166.1,
"valid_targets_min": 1309
},
{
"epoch": 1.07085346215781,
"grad_norm": 0.5024189972964114,
"learning_rate": 3.9662752539777314e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24382641911506653,
"step": 665,
"valid_targets_mean": 5176.7,
"valid_targets_min": 521
},
{
"epoch": 1.0789049919484701,
"grad_norm": 0.9391803347175582,
"learning_rate": 3.9647908635077845e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.277189165353775,
"step": 670,
"valid_targets_mean": 4315.8,
"valid_targets_min": 703
},
{
"epoch": 1.0869565217391304,
"grad_norm": 0.4882832004268316,
"learning_rate": 3.963274795033913e-05,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24163475632667542,
"step": 675,
"valid_targets_mean": 5134.3,
"valid_targets_min": 710
},
{
"epoch": 1.0950080515297906,
"grad_norm": 0.6167872996926629,
"learning_rate": 3.9617270729994436e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24507923424243927,
"step": 680,
"valid_targets_mean": 4063.7,
"valid_targets_min": 1058
},
{
"epoch": 1.103059581320451,
"grad_norm": 0.6232571737295083,
"learning_rate": 3.960147722358046e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23517994582653046,
"step": 685,
"valid_targets_mean": 3350.7,
"valid_targets_min": 736
},
{
"epoch": 1.1111111111111112,
"grad_norm": 0.5205417579091651,
"learning_rate": 3.958536768573335e-05,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25678330659866333,
"step": 690,
"valid_targets_mean": 4774.0,
"valid_targets_min": 1681
},
{
"epoch": 1.1191626409017714,
"grad_norm": 0.5540696760333587,
"learning_rate": 3.956894237618456e-05,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2578514814376831,
"step": 695,
"valid_targets_mean": 3721.6,
"valid_targets_min": 543
},
{
"epoch": 1.1272141706924317,
"grad_norm": 0.5703134217215095,
"learning_rate": 3.955220155975669e-05,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27087417244911194,
"step": 700,
"valid_targets_mean": 4647.0,
"valid_targets_min": 1837
},
{
"epoch": 1.1352657004830917,
"grad_norm": 0.5281006763450222,
"learning_rate": 3.9535145506359206e-05,
"loss": 0.2431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2202616184949875,
"step": 705,
"valid_targets_mean": 4643.4,
"valid_targets_min": 548
},
{
"epoch": 1.143317230273752,
"grad_norm": 0.4639603789841704,
"learning_rate": 3.951777449098408e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2633700966835022,
"step": 710,
"valid_targets_mean": 5459.8,
"valid_targets_min": 2264
},
{
"epoch": 1.1513687600644122,
"grad_norm": 0.469137374700247,
"learning_rate": 3.9500088793701387e-05,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19833050668239594,
"step": 715,
"valid_targets_mean": 4964.5,
"valid_targets_min": 2160
},
{
"epoch": 1.1594202898550725,
"grad_norm": 0.4905202669992282,
"learning_rate": 3.948208869965473e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24042034149169922,
"step": 720,
"valid_targets_mean": 4569.5,
"valid_targets_min": 776
},
{
"epoch": 1.1674718196457328,
"grad_norm": 0.5271378070562325,
"learning_rate": 3.946377449905672e-05,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24370059370994568,
"step": 725,
"valid_targets_mean": 4409.8,
"valid_targets_min": 1705
},
{
"epoch": 1.1755233494363928,
"grad_norm": 0.48816490928722517,
"learning_rate": 3.9445146487184226e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23395568132400513,
"step": 730,
"valid_targets_mean": 4742.6,
"valid_targets_min": 1740
},
{
"epoch": 1.183574879227053,
"grad_norm": 0.508703086089454,
"learning_rate": 3.942620496437366e-05,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2787438929080963,
"step": 735,
"valid_targets_mean": 5090.3,
"valid_targets_min": 720
},
{
"epoch": 1.1916264090177133,
"grad_norm": 0.5274435230388868,
"learning_rate": 3.940695023601612e-05,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23083099722862244,
"step": 740,
"valid_targets_mean": 4942.7,
"valid_targets_min": 1747
},
{
"epoch": 1.1996779388083736,
"grad_norm": 0.48187263788077117,
"learning_rate": 3.938738261255247e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21453389525413513,
"step": 745,
"valid_targets_mean": 4564.6,
"valid_targets_min": 1401
},
{
"epoch": 1.2077294685990339,
"grad_norm": 0.7495259641509139,
"learning_rate": 3.9367502409468315e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21770915389060974,
"step": 750,
"valid_targets_mean": 4150.0,
"valid_targets_min": 848
},
{
"epoch": 1.2157809983896941,
"grad_norm": 0.513119058591006,
"learning_rate": 3.934730994728893e-05,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2321898341178894,
"step": 755,
"valid_targets_mean": 3742.6,
"valid_targets_min": 1247
},
{
"epoch": 1.2238325281803544,
"grad_norm": 0.5088681345844467,
"learning_rate": 3.932680555157413e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2543366551399231,
"step": 760,
"valid_targets_mean": 4571.6,
"valid_targets_min": 745
},
{
"epoch": 1.2318840579710144,
"grad_norm": 0.5212074947311489,
"learning_rate": 3.9305989552912936e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24161793291568756,
"step": 765,
"valid_targets_mean": 4267.8,
"valid_targets_min": 2059
},
{
"epoch": 1.2399355877616747,
"grad_norm": 0.6379814909420424,
"learning_rate": 3.928486228691831e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25767624378204346,
"step": 770,
"valid_targets_mean": 4049.4,
"valid_targets_min": 1596
},
{
"epoch": 1.247987117552335,
"grad_norm": 0.5355001588932113,
"learning_rate": 3.926342409422175e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23288603127002716,
"step": 775,
"valid_targets_mean": 3844.3,
"valid_targets_min": 823
},
{
"epoch": 1.2560386473429952,
"grad_norm": 0.5212100454034752,
"learning_rate": 3.924167532046773e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24769359827041626,
"step": 780,
"valid_targets_mean": 4338.0,
"valid_targets_min": 1507
},
{
"epoch": 1.2640901771336555,
"grad_norm": 0.5991969877035959,
"learning_rate": 3.9219616316308215e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23935574293136597,
"step": 785,
"valid_targets_mean": 4815.1,
"valid_targets_min": 1755
},
{
"epoch": 1.2721417069243155,
"grad_norm": 0.5852623692737184,
"learning_rate": 3.919724743739694e-05,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2316393107175827,
"step": 790,
"valid_targets_mean": 4748.1,
"valid_targets_min": 1010
},
{
"epoch": 1.2801932367149758,
"grad_norm": 0.5400353515222852,
"learning_rate": 3.91745690443837e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24360281229019165,
"step": 795,
"valid_targets_mean": 4905.1,
"valid_targets_min": 1697
},
{
"epoch": 1.288244766505636,
"grad_norm": 0.5161454582163929,
"learning_rate": 3.915158150290855e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2185833752155304,
"step": 800,
"valid_targets_mean": 4708.6,
"valid_targets_min": 1210
},
{
"epoch": 1.2962962962962963,
"grad_norm": 0.5421912889681342,
"learning_rate": 3.912828518359588e-05,
"loss": 0.2361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24869637191295624,
"step": 805,
"valid_targets_mean": 5677.7,
"valid_targets_min": 2666
},
{
"epoch": 1.3043478260869565,
"grad_norm": 0.5587294675034205,
"learning_rate": 3.910468046204846e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.240371972322464,
"step": 810,
"valid_targets_mean": 3585.4,
"valid_targets_min": 677
},
{
"epoch": 1.3123993558776168,
"grad_norm": 0.5803843717029648,
"learning_rate": 3.908076771884139e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23448866605758667,
"step": 815,
"valid_targets_mean": 4076.1,
"valid_targets_min": 1353
},
{
"epoch": 1.320450885668277,
"grad_norm": 0.6615696992092541,
"learning_rate": 3.905654733951595e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24138154089450836,
"step": 820,
"valid_targets_mean": 3298.6,
"valid_targets_min": 713
},
{
"epoch": 1.3285024154589373,
"grad_norm": 0.48424332287717764,
"learning_rate": 3.9032019714573366e-05,
"loss": 0.2274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2244749665260315,
"step": 825,
"valid_targets_mean": 4370.7,
"valid_targets_min": 1299
},
{
"epoch": 1.3365539452495974,
"grad_norm": 0.5116233310783836,
"learning_rate": 3.9007185239468554e-05,
"loss": 0.2523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2363509237766266,
"step": 830,
"valid_targets_mean": 4251.2,
"valid_targets_min": 1057
},
{
"epoch": 1.3446054750402576,
"grad_norm": 0.5726251093172268,
"learning_rate": 3.8982044314603725e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25756919384002686,
"step": 835,
"valid_targets_mean": 4103.4,
"valid_targets_min": 818
},
{
"epoch": 1.3526570048309179,
"grad_norm": 0.5399551753973628,
"learning_rate": 3.8956597345321927e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23214933276176453,
"step": 840,
"valid_targets_mean": 3571.1,
"valid_targets_min": 997
},
{
"epoch": 1.3607085346215781,
"grad_norm": 0.5153551957359142,
"learning_rate": 3.893084474190051e-05,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24375241994857788,
"step": 845,
"valid_targets_mean": 4158.2,
"valid_targets_min": 952
},
{
"epoch": 1.3687600644122382,
"grad_norm": 0.48984930240931984,
"learning_rate": 3.890478691954452e-05,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2558751702308655,
"step": 850,
"valid_targets_mean": 4738.9,
"valid_targets_min": 656
},
{
"epoch": 1.3768115942028984,
"grad_norm": 0.5179307198966028,
"learning_rate": 3.8878424298379996e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22707146406173706,
"step": 855,
"valid_targets_mean": 4074.3,
"valid_targets_min": 1101
},
{
"epoch": 1.3848631239935587,
"grad_norm": 0.6293401724856043,
"learning_rate": 3.885175730344718e-05,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24598611891269684,
"step": 860,
"valid_targets_mean": 4331.4,
"valid_targets_min": 1429
},
{
"epoch": 1.392914653784219,
"grad_norm": 0.5429776165767362,
"learning_rate": 3.882478636469372e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25051477551460266,
"step": 865,
"valid_targets_mean": 4375.6,
"valid_targets_min": 1616
},
{
"epoch": 1.4009661835748792,
"grad_norm": 0.5668228228210831,
"learning_rate": 3.879751191696766e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2403651624917984,
"step": 870,
"valid_targets_mean": 3847.9,
"valid_targets_min": 656
},
{
"epoch": 1.4090177133655395,
"grad_norm": 0.4916125568229993,
"learning_rate": 3.8769934400010506e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23794618248939514,
"step": 875,
"valid_targets_mean": 4820.1,
"valid_targets_min": 284
},
{
"epoch": 1.4170692431561998,
"grad_norm": 0.48401044866312015,
"learning_rate": 3.8742054258450085e-05,
"loss": 0.2435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25705933570861816,
"step": 880,
"valid_targets_mean": 4531.7,
"valid_targets_min": 1442
},
{
"epoch": 1.42512077294686,
"grad_norm": 0.5305875988771065,
"learning_rate": 3.871387194179338e-05,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20840579271316528,
"step": 885,
"valid_targets_mean": 4164.4,
"valid_targets_min": 2047
},
{
"epoch": 1.43317230273752,
"grad_norm": 0.5592288973797526,
"learning_rate": 3.868538790441931e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24872620403766632,
"step": 890,
"valid_targets_mean": 4424.3,
"valid_targets_min": 1035
},
{
"epoch": 1.4412238325281803,
"grad_norm": 0.46555566538841864,
"learning_rate": 3.865660260557138e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21978382766246796,
"step": 895,
"valid_targets_mean": 4317.1,
"valid_targets_min": 2278
},
{
"epoch": 1.4492753623188406,
"grad_norm": 0.5185263723338586,
"learning_rate": 3.8627516509350286e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2476550042629242,
"step": 900,
"valid_targets_mean": 3795.6,
"valid_targets_min": 1701
},
{
"epoch": 1.4573268921095008,
"grad_norm": 0.5514262995566678,
"learning_rate": 3.859813008470644e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24102932214736938,
"step": 905,
"valid_targets_mean": 3926.9,
"valid_targets_min": 1209
},
{
"epoch": 1.465378421900161,
"grad_norm": 0.4713138062680591,
"learning_rate": 3.856844380543239e-05,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23857206106185913,
"step": 910,
"valid_targets_mean": 4829.1,
"valid_targets_min": 1822
},
{
"epoch": 1.4734299516908211,
"grad_norm": 0.46745151947518565,
"learning_rate": 3.8538458150155186e-05,
"loss": 0.2337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21306023001670837,
"step": 915,
"valid_targets_mean": 5670.3,
"valid_targets_min": 1223
},
{
"epoch": 1.4814814814814814,
"grad_norm": 0.5399378076969245,
"learning_rate": 3.850817360232869e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23806512355804443,
"step": 920,
"valid_targets_mean": 5083.9,
"valid_targets_min": 2183
},
{
"epoch": 1.4895330112721417,
"grad_norm": 0.6208023209932018,
"learning_rate": 3.8477590650225735e-05,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26910722255706787,
"step": 925,
"valid_targets_mean": 4777.4,
"valid_targets_min": 1044
},
{
"epoch": 1.497584541062802,
"grad_norm": 0.5213298121096795,
"learning_rate": 3.8446709786930305e-05,
"loss": 0.2341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24538570642471313,
"step": 930,
"valid_targets_mean": 4161.3,
"valid_targets_min": 1399
},
{
"epoch": 1.5056360708534622,
"grad_norm": 0.5236314811464815,
"learning_rate": 3.841553151032953e-05,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23516438901424408,
"step": 935,
"valid_targets_mean": 5095.7,
"valid_targets_min": 1027
},
{
"epoch": 1.5136876006441224,
"grad_norm": 0.44460197327326756,
"learning_rate": 3.8384056323105695e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23193703591823578,
"step": 940,
"valid_targets_mean": 5266.9,
"valid_targets_min": 1863
},
{
"epoch": 1.5217391304347827,
"grad_norm": 0.6021732933768308,
"learning_rate": 3.835228473272814e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2238101363182068,
"step": 945,
"valid_targets_mean": 4458.2,
"valid_targets_min": 751
},
{
"epoch": 1.529790660225443,
"grad_norm": 0.5548844712586349,
"learning_rate": 3.832021725144506e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2418593019247055,
"step": 950,
"valid_targets_mean": 4469.2,
"valid_targets_min": 1717
},
{
"epoch": 1.537842190016103,
"grad_norm": 0.46334027352601115,
"learning_rate": 3.828785439627523e-05,
"loss": 0.2517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24094292521476746,
"step": 955,
"valid_targets_mean": 5478.1,
"valid_targets_min": 1745
},
{
"epoch": 1.5458937198067633,
"grad_norm": 0.5074800565232367,
"learning_rate": 3.825519668899972e-05,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25097841024398804,
"step": 960,
"valid_targets_mean": 5015.4,
"valid_targets_min": 1369
},
{
"epoch": 1.5539452495974235,
"grad_norm": 0.5212941157766611,
"learning_rate": 3.8222244656153444e-05,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2439125031232834,
"step": 965,
"valid_targets_mean": 4481.0,
"valid_targets_min": 973
},
{
"epoch": 1.5619967793880838,
"grad_norm": 0.5111240156665687,
"learning_rate": 3.818899882901666e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22901548445224762,
"step": 970,
"valid_targets_mean": 4092.8,
"valid_targets_min": 1591
},
{
"epoch": 1.5700483091787438,
"grad_norm": 0.512770693439504,
"learning_rate": 3.815545974360644e-05,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23196808993816376,
"step": 975,
"valid_targets_mean": 4075.3,
"valid_targets_min": 1956
},
{
"epoch": 1.578099838969404,
"grad_norm": 0.5042161332697872,
"learning_rate": 3.812162794066802e-05,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25058242678642273,
"step": 980,
"valid_targets_mean": 4614.4,
"valid_targets_min": 339
},
{
"epoch": 1.5861513687600644,
"grad_norm": 0.4846950795943882,
"learning_rate": 3.8087503965666057e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2251492440700531,
"step": 985,
"valid_targets_mean": 4310.9,
"valid_targets_min": 1978
},
{
"epoch": 1.5942028985507246,
"grad_norm": 0.49445825909902524,
"learning_rate": 3.805308836877586e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2309640347957611,
"step": 990,
"valid_targets_mean": 4083.0,
"valid_targets_min": 688
},
{
"epoch": 1.6022544283413849,
"grad_norm": 0.522939331982219,
"learning_rate": 3.80183817048745e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23157933354377747,
"step": 995,
"valid_targets_mean": 3599.1,
"valid_targets_min": 358
},
{
"epoch": 1.6103059581320451,
"grad_norm": 0.5144792659864994,
"learning_rate": 3.7983384533531894e-05,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2594456374645233,
"step": 1000,
"valid_targets_mean": 4572.1,
"valid_targets_min": 1116
},
{
"epoch": 1.6183574879227054,
"grad_norm": 0.514940069429718,
"learning_rate": 3.7948097419001736e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23250789940357208,
"step": 1005,
"valid_targets_mean": 4625.0,
"valid_targets_min": 350
},
{
"epoch": 1.6264090177133657,
"grad_norm": 0.52221869816674,
"learning_rate": 3.7912520930212445e-05,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21590971946716309,
"step": 1010,
"valid_targets_mean": 4035.4,
"valid_targets_min": 1483
},
{
"epoch": 1.634460547504026,
"grad_norm": 0.42946813411877144,
"learning_rate": 3.7876655640757974e-05,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23158404231071472,
"step": 1015,
"valid_targets_mean": 5336.1,
"valid_targets_min": 979
},
{
"epoch": 1.642512077294686,
"grad_norm": 0.4983259472306404,
"learning_rate": 3.784050212888857e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2527810335159302,
"step": 1020,
"valid_targets_mean": 5022.8,
"valid_targets_min": 2939
},
{
"epoch": 1.6505636070853462,
"grad_norm": 0.46712880691077496,
"learning_rate": 3.780406097750141e-05,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22650480270385742,
"step": 1025,
"valid_targets_mean": 4311.5,
"valid_targets_min": 1275
},
{
"epoch": 1.6586151368760065,
"grad_norm": 0.5417140597671484,
"learning_rate": 3.776733277413127e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.195145845413208,
"step": 1030,
"valid_targets_mean": 4207.8,
"valid_targets_min": 1043
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.4883088038596097,
"learning_rate": 3.7730318110941004e-05,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21643765270709991,
"step": 1035,
"valid_targets_mean": 4391.3,
"valid_targets_min": 2660
},
{
"epoch": 1.6747181964573268,
"grad_norm": 0.5289568127223118,
"learning_rate": 3.7693017584712013e-05,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23360106348991394,
"step": 1040,
"valid_targets_mean": 4826.2,
"valid_targets_min": 2011
},
{
"epoch": 1.682769726247987,
"grad_norm": 0.5576792989418248,
"learning_rate": 3.765543179683462e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24486708641052246,
"step": 1045,
"valid_targets_mean": 3934.4,
"valid_targets_min": 1683
},
{
"epoch": 1.6908212560386473,
"grad_norm": 0.5017617827412163,
"learning_rate": 3.7617561353298395e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24896810948848724,
"step": 1050,
"valid_targets_mean": 4011.8,
"valid_targets_min": 321
},
{
"epoch": 1.6988727858293076,
"grad_norm": 0.4860709875293544,
"learning_rate": 3.7579406864682327e-05,
"loss": 0.2264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24139925837516785,
"step": 1055,
"valid_targets_mean": 4299.9,
"valid_targets_min": 667
},
{
"epoch": 1.7069243156199678,
"grad_norm": 0.5345894675911452,
"learning_rate": 3.7540968946145036e-05,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2598978877067566,
"step": 1060,
"valid_targets_mean": 4928.6,
"valid_targets_min": 1283
},
{
"epoch": 1.714975845410628,
"grad_norm": 0.5465814570656329,
"learning_rate": 3.750224821741486e-05,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2219647765159607,
"step": 1065,
"valid_targets_mean": 5155.9,
"valid_targets_min": 1303
},
{
"epoch": 1.7230273752012883,
"grad_norm": 0.5300553470904004,
"learning_rate": 3.7463245302779795e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28267112374305725,
"step": 1070,
"valid_targets_mean": 3852.3,
"valid_targets_min": 599
},
{
"epoch": 1.7310789049919486,
"grad_norm": 0.4624218505703108,
"learning_rate": 3.742396083107751e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21661648154258728,
"step": 1075,
"valid_targets_mean": 4283.7,
"valid_targets_min": 1147
},
{
"epoch": 1.7391304347826086,
"grad_norm": 0.4993979746767997,
"learning_rate": 3.7384395435685166e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21909837424755096,
"step": 1080,
"valid_targets_mean": 4359.1,
"valid_targets_min": 2250
},
{
"epoch": 1.747181964573269,
"grad_norm": 0.5407067040296573,
"learning_rate": 3.7344549754509196e-05,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22699233889579773,
"step": 1085,
"valid_targets_mean": 3677.0,
"valid_targets_min": 892
},
{
"epoch": 1.7552334943639292,
"grad_norm": 0.4642737834973646,
"learning_rate": 3.7304424429975046e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22292137145996094,
"step": 1090,
"valid_targets_mean": 5690.0,
"valid_targets_min": 782
},
{
"epoch": 1.7632850241545892,
"grad_norm": 0.5671519558623886,
"learning_rate": 3.726402010901681e-05,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21334418654441833,
"step": 1095,
"valid_targets_mean": 4616.9,
"valid_targets_min": 1898
},
{
"epoch": 1.7713365539452495,
"grad_norm": 0.5083634785423456,
"learning_rate": 3.722333744306678e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21738044917583466,
"step": 1100,
"valid_targets_mean": 5448.9,
"valid_targets_min": 1726
},
{
"epoch": 1.7793880837359097,
"grad_norm": 0.8896163020318464,
"learning_rate": 3.7182377088044984e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22921855747699738,
"step": 1105,
"valid_targets_mean": 4703.8,
"valid_targets_min": 1508
},
{
"epoch": 1.78743961352657,
"grad_norm": 0.5450639925225488,
"learning_rate": 3.7141139704348576e-05,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21833300590515137,
"step": 1110,
"valid_targets_mean": 3445.8,
"valid_targets_min": 1099
},
{
"epoch": 1.7954911433172303,
"grad_norm": 0.6520638172384545,
"learning_rate": 3.7099625956841175e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25272321701049805,
"step": 1115,
"valid_targets_mean": 3248.3,
"valid_targets_min": 617
},
{
"epoch": 1.8035426731078905,
"grad_norm": 0.4493969588039246,
"learning_rate": 3.70578365148422e-05,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23505555093288422,
"step": 1120,
"valid_targets_mean": 5024.8,
"valid_targets_min": 1833
},
{
"epoch": 1.8115942028985508,
"grad_norm": 0.4827090106067237,
"learning_rate": 3.701577205211604e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535856366157532,
"step": 1125,
"valid_targets_mean": 4428.5,
"valid_targets_min": 990
},
{
"epoch": 1.819645732689211,
"grad_norm": 0.6263613356926185,
"learning_rate": 3.697343324686119e-05,
"loss": 0.2272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23104625940322876,
"step": 1130,
"valid_targets_mean": 4673.7,
"valid_targets_min": 1449
},
{
"epoch": 1.8276972624798713,
"grad_norm": 0.5298323694554691,
"learning_rate": 3.693082078169933e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24033012986183167,
"step": 1135,
"valid_targets_mean": 4732.1,
"valid_targets_min": 1605
},
{
"epoch": 1.8357487922705316,
"grad_norm": 0.4783853550563579,
"learning_rate": 3.68879353436643e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2028733789920807,
"step": 1140,
"valid_targets_mean": 4867.9,
"valid_targets_min": 2154
},
{
"epoch": 1.8438003220611916,
"grad_norm": 0.4595078299986765,
"learning_rate": 3.684477762419108e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.215766042470932,
"step": 1145,
"valid_targets_mean": 4522.2,
"valid_targets_min": 2208
},
{
"epoch": 1.8518518518518519,
"grad_norm": 0.5149239335560051,
"learning_rate": 3.6801348319104546e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2230435311794281,
"step": 1150,
"valid_targets_mean": 3680.6,
"valid_targets_min": 434
},
{
"epoch": 1.8599033816425121,
"grad_norm": 0.42919344493593076,
"learning_rate": 3.675764812860833e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20287317037582397,
"step": 1155,
"valid_targets_mean": 5642.9,
"valid_targets_min": 2036
},
{
"epoch": 1.8679549114331722,
"grad_norm": 0.4884349396198345,
"learning_rate": 3.671367775727353e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24478939175605774,
"step": 1160,
"valid_targets_mean": 4762.1,
"valid_targets_min": 775
},
{
"epoch": 1.8760064412238324,
"grad_norm": 0.49953971630838795,
"learning_rate": 3.666943791402726e-05,
"loss": 0.2527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2292686104774475,
"step": 1165,
"valid_targets_mean": 4543.8,
"valid_targets_min": 1026
},
{
"epoch": 1.8840579710144927,
"grad_norm": 0.4644474561197982,
"learning_rate": 3.662492931214137e-05,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2597373127937317,
"step": 1170,
"valid_targets_mean": 5243.1,
"valid_targets_min": 1246
},
{
"epoch": 1.892109500805153,
"grad_norm": 0.5180686308684069,
"learning_rate": 3.6580152669220784e-05,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606375813484192,
"step": 1175,
"valid_targets_mean": 4800.7,
"valid_targets_min": 2456
},
{
"epoch": 1.9001610305958132,
"grad_norm": 0.42092491518373576,
"learning_rate": 3.6535108707192053e-05,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22271546721458435,
"step": 1180,
"valid_targets_mean": 5251.3,
"valid_targets_min": 1616
},
{
"epoch": 1.9082125603864735,
"grad_norm": 0.5826394657065203,
"learning_rate": 3.648979815229167e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20627357065677643,
"step": 1185,
"valid_targets_mean": 3834.6,
"valid_targets_min": 693
},
{
"epoch": 1.9162640901771337,
"grad_norm": 0.7082935353213954,
"learning_rate": 3.644422173505433e-05,
"loss": 0.2517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24815203249454498,
"step": 1190,
"valid_targets_mean": 4642.2,
"valid_targets_min": 338
},
{
"epoch": 1.924315619967794,
"grad_norm": 0.5088420525828131,
"learning_rate": 3.639838019030123e-05,
"loss": 0.2303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23133976757526398,
"step": 1195,
"valid_targets_mean": 4064.8,
"valid_targets_min": 1849
},
{
"epoch": 1.9323671497584543,
"grad_norm": 0.4807696052913685,
"learning_rate": 3.635227425712812e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24485018849372864,
"step": 1200,
"valid_targets_mean": 5358.3,
"valid_targets_min": 1956
},
{
"epoch": 1.9404186795491143,
"grad_norm": 0.5374569252336697,
"learning_rate": 3.6305904678893504e-05,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23684567213058472,
"step": 1205,
"valid_targets_mean": 4465.9,
"valid_targets_min": 2036
},
{
"epoch": 1.9484702093397746,
"grad_norm": 0.4315082896253737,
"learning_rate": 3.6259272203206535e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20846745371818542,
"step": 1210,
"valid_targets_mean": 5167.9,
"valid_targets_min": 1434
},
{
"epoch": 1.9565217391304348,
"grad_norm": 0.5262891588589963,
"learning_rate": 3.621237758191505e-05,
"loss": 0.2385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24596351385116577,
"step": 1215,
"valid_targets_mean": 3761.8,
"valid_targets_min": 1066
},
{
"epoch": 1.9645732689210949,
"grad_norm": 0.49628184032222405,
"learning_rate": 3.616522157109342e-05,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21257467567920685,
"step": 1220,
"valid_targets_mean": 4065.5,
"valid_targets_min": 1897
},
{
"epoch": 1.9726247987117551,
"grad_norm": 0.4787291955056688,
"learning_rate": 3.6117804931030324e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2495032548904419,
"step": 1225,
"valid_targets_mean": 4767.3,
"valid_targets_min": 930
},
{
"epoch": 1.9806763285024154,
"grad_norm": 0.4952065016883059,
"learning_rate": 3.607012842621657e-05,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23980122804641724,
"step": 1230,
"valid_targets_mean": 4069.4,
"valid_targets_min": 1260
},
{
"epoch": 1.9887278582930756,
"grad_norm": 0.5230866628171786,
"learning_rate": 3.602219282533269e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2368500828742981,
"step": 1235,
"valid_targets_mean": 4682.7,
"valid_targets_min": 2343
},
{
"epoch": 1.996779388083736,
"grad_norm": 0.5246193826991147,
"learning_rate": 3.597399890123659e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21333156526088715,
"step": 1240,
"valid_targets_mean": 4692.2,
"valid_targets_min": 2047
},
{
"epoch": 2.004830917874396,
"grad_norm": 0.505863313320365,
"learning_rate": 3.5925547430951094e-05,
"loss": 0.2099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20909734070301056,
"step": 1245,
"valid_targets_mean": 4637.2,
"valid_targets_min": 989
},
{
"epoch": 2.0128824476650564,
"grad_norm": 0.43133643927265986,
"learning_rate": 3.587683919565136e-05,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19329163432121277,
"step": 1250,
"valid_targets_mean": 5283.4,
"valid_targets_min": 1835
},
{
"epoch": 2.0209339774557167,
"grad_norm": 0.4837745442669591,
"learning_rate": 3.582787498065237e-05,
"loss": 0.2031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20409853756427765,
"step": 1255,
"valid_targets_mean": 4767.1,
"valid_targets_min": 1074
},
{
"epoch": 2.028985507246377,
"grad_norm": 0.6452848255637806,
"learning_rate": 3.577865557539621e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1907821148633957,
"step": 1260,
"valid_targets_mean": 4763.1,
"valid_targets_min": 392
},
{
"epoch": 2.037037037037037,
"grad_norm": 0.5867010578619666,
"learning_rate": 3.572918177343935e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1922091245651245,
"step": 1265,
"valid_targets_mean": 4118.4,
"valid_targets_min": 631
},
{
"epoch": 2.0450885668276975,
"grad_norm": 0.48474397713094575,
"learning_rate": 3.567945437243987e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19150424003601074,
"step": 1270,
"valid_targets_mean": 4600.4,
"valid_targets_min": 1066
},
{
"epoch": 2.0531400966183573,
"grad_norm": 0.5113649508317663,
"learning_rate": 3.5629474174144564e-05,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.253940224647522,
"step": 1275,
"valid_targets_mean": 5131.0,
"valid_targets_min": 2438
},
{
"epoch": 2.0611916264090175,
"grad_norm": 0.491663340986429,
"learning_rate": 3.5579241984376065e-05,
"loss": 0.217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22499999403953552,
"step": 1280,
"valid_targets_mean": 3951.9,
"valid_targets_min": 1010
},
{
"epoch": 2.069243156199678,
"grad_norm": 0.520462248826658,
"learning_rate": 3.5528758613019804e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19735172390937805,
"step": 1285,
"valid_targets_mean": 3831.2,
"valid_targets_min": 1088
},
{
"epoch": 2.077294685990338,
"grad_norm": 0.5206723700369398,
"learning_rate": 3.547802487401097e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23212730884552002,
"step": 1290,
"valid_targets_mean": 5061.6,
"valid_targets_min": 2180
},
{
"epoch": 2.0853462157809983,
"grad_norm": 0.577226384156968,
"learning_rate": 3.54270415853214e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20443934202194214,
"step": 1295,
"valid_targets_mean": 3395.8,
"valid_targets_min": 627
},
{
"epoch": 2.0933977455716586,
"grad_norm": 0.4423746810496331,
"learning_rate": 3.537580956894638e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21375350654125214,
"step": 1300,
"valid_targets_mean": 5160.8,
"valid_targets_min": 1507
},
{
"epoch": 2.101449275362319,
"grad_norm": 0.5548629803187833,
"learning_rate": 3.532432965089138e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22949251532554626,
"step": 1305,
"valid_targets_mean": 5229.6,
"valid_targets_min": 2557
},
{
"epoch": 2.109500805152979,
"grad_norm": 0.4906711255865245,
"learning_rate": 3.527260266115876e-05,
"loss": 0.2215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2087794542312622,
"step": 1310,
"valid_targets_mean": 5409.4,
"valid_targets_min": 2349
},
{
"epoch": 2.1175523349436394,
"grad_norm": 0.6560805934109221,
"learning_rate": 3.522062943373438e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17596739530563354,
"step": 1315,
"valid_targets_mean": 4226.9,
"valid_targets_min": 1025
},
{
"epoch": 2.1256038647342996,
"grad_norm": 0.7107665752653891,
"learning_rate": 3.516841080657413e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23091405630111694,
"step": 1320,
"valid_targets_mean": 4053.8,
"valid_targets_min": 689
},
{
"epoch": 2.13365539452496,
"grad_norm": 0.5185713231757747,
"learning_rate": 3.511594762159046e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20578667521476746,
"step": 1325,
"valid_targets_mean": 4018.0,
"valid_targets_min": 978
},
{
"epoch": 2.14170692431562,
"grad_norm": 0.463159581350649,
"learning_rate": 3.506324072463878e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1929136961698532,
"step": 1330,
"valid_targets_mean": 4945.8,
"valid_targets_min": 2099
},
{
"epoch": 2.14975845410628,
"grad_norm": 0.5447005808188629,
"learning_rate": 3.5010290965503826e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23045824468135834,
"step": 1335,
"valid_targets_mean": 4698.5,
"valid_targets_min": 1716
},
{
"epoch": 2.1578099838969402,
"grad_norm": 0.4595107321034477,
"learning_rate": 3.495709919788597e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18875578045845032,
"step": 1340,
"valid_targets_mean": 4457.4,
"valid_targets_min": 755
},
{
"epoch": 2.1658615136876005,
"grad_norm": 0.6481051628858272,
"learning_rate": 3.490366627938742e-05,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22552573680877686,
"step": 1345,
"valid_targets_mean": 4907.9,
"valid_targets_min": 1381
},
{
"epoch": 2.1739130434782608,
"grad_norm": 0.8255339190022734,
"learning_rate": 3.484999307149846e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20174431800842285,
"step": 1350,
"valid_targets_mean": 3897.0,
"valid_targets_min": 979
},
{
"epoch": 2.181964573268921,
"grad_norm": 0.47550594396325907,
"learning_rate": 3.47960804395835e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21997377276420593,
"step": 1355,
"valid_targets_mean": 4916.5,
"valid_targets_min": 990
},
{
"epoch": 2.1900161030595813,
"grad_norm": 0.5142914581894688,
"learning_rate": 3.474192925286714e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2234359234571457,
"step": 1360,
"valid_targets_mean": 4057.0,
"valid_targets_min": 554
},
{
"epoch": 2.1980676328502415,
"grad_norm": 0.5135241141747307,
"learning_rate": 3.468754038442017e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21173028647899628,
"step": 1365,
"valid_targets_mean": 4122.8,
"valid_targets_min": 963
},
{
"epoch": 2.206119162640902,
"grad_norm": 0.5281981416757465,
"learning_rate": 3.463291471114548e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2580035328865051,
"step": 1370,
"valid_targets_mean": 4534.7,
"valid_targets_min": 1253
},
{
"epoch": 2.214170692431562,
"grad_norm": 0.546080448981762,
"learning_rate": 3.4578053113763936e-05,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2357328236103058,
"step": 1375,
"valid_targets_mean": 4083.2,
"valid_targets_min": 1119
},
{
"epoch": 2.2222222222222223,
"grad_norm": 0.43510725221723323,
"learning_rate": 3.452295647680014e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.210770383477211,
"step": 1380,
"valid_targets_mean": 5021.1,
"valid_targets_min": 1913
},
{
"epoch": 2.2302737520128826,
"grad_norm": 0.45576706352160945,
"learning_rate": 3.4467625688568245e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20456649363040924,
"step": 1385,
"valid_targets_mean": 4813.6,
"valid_targets_min": 1879
},
{
"epoch": 2.238325281803543,
"grad_norm": 0.4605011820162796,
"learning_rate": 3.4412061641157546e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1862925887107849,
"step": 1390,
"valid_targets_mean": 5375.2,
"valid_targets_min": 1405
},
{
"epoch": 2.246376811594203,
"grad_norm": 0.5067717085593049,
"learning_rate": 3.435626523041815e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20806747674942017,
"step": 1395,
"valid_targets_mean": 4125.7,
"valid_targets_min": 2104
},
{
"epoch": 2.2544283413848634,
"grad_norm": 0.503211076543084,
"learning_rate": 3.430023735594653e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23167727887630463,
"step": 1400,
"valid_targets_mean": 4897.6,
"valid_targets_min": 344
},
{
"epoch": 2.262479871175523,
"grad_norm": 0.5252844399823857,
"learning_rate": 3.4243978921071005e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18407735228538513,
"step": 1405,
"valid_targets_mean": 4546.8,
"valid_targets_min": 1908
},
{
"epoch": 2.2705314009661834,
"grad_norm": 0.5703046217142366,
"learning_rate": 3.418749083283719e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23428402841091156,
"step": 1410,
"valid_targets_mean": 4894.1,
"valid_targets_min": 1720
},
{
"epoch": 2.2785829307568437,
"grad_norm": 0.45360806117795466,
"learning_rate": 3.413077400199334e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16744893789291382,
"step": 1415,
"valid_targets_mean": 4128.2,
"valid_targets_min": 1177
},
{
"epoch": 2.286634460547504,
"grad_norm": 0.48066382062291113,
"learning_rate": 3.407382934297571e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21223318576812744,
"step": 1420,
"valid_targets_mean": 4697.8,
"valid_targets_min": 1982
},
{
"epoch": 2.2946859903381642,
"grad_norm": 0.4623146781727566,
"learning_rate": 3.4016657773893785e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.186685249209404,
"step": 1425,
"valid_targets_mean": 5018.8,
"valid_targets_min": 1843
},
{
"epoch": 2.3027375201288245,
"grad_norm": 0.5051350867881649,
"learning_rate": 3.3959260216515495e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1981533169746399,
"step": 1430,
"valid_targets_mean": 4461.0,
"valid_targets_min": 1264
},
{
"epoch": 2.3107890499194848,
"grad_norm": 0.547928503478585,
"learning_rate": 3.3901637596252325e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20269712805747986,
"step": 1435,
"valid_targets_mean": 4606.9,
"valid_targets_min": 216
},
{
"epoch": 2.318840579710145,
"grad_norm": 0.5050671980985264,
"learning_rate": 3.384379084214443e-05,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21335461735725403,
"step": 1440,
"valid_targets_mean": 3892.7,
"valid_targets_min": 1209
},
{
"epoch": 2.3268921095008053,
"grad_norm": 0.48909304735454484,
"learning_rate": 3.378572088684562e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19523759186267853,
"step": 1445,
"valid_targets_mean": 4354.8,
"valid_targets_min": 1308
},
{
"epoch": 2.3349436392914655,
"grad_norm": 0.6388146830801954,
"learning_rate": 3.372742866660836e-05,
"loss": 0.2178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.198106050491333,
"step": 1450,
"valid_targets_mean": 4365.9,
"valid_targets_min": 713
},
{
"epoch": 2.342995169082126,
"grad_norm": 0.5410396103360308,
"learning_rate": 3.3668915121268636e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23412463068962097,
"step": 1455,
"valid_targets_mean": 4374.0,
"valid_targets_min": 547
},
{
"epoch": 2.3510466988727856,
"grad_norm": 0.5291219901130383,
"learning_rate": 3.361018119423085e-05,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2332005500793457,
"step": 1460,
"valid_targets_mean": 3958.9,
"valid_targets_min": 1381
},
{
"epoch": 2.359098228663446,
"grad_norm": 0.5100995870174685,
"learning_rate": 3.3551227832452555e-05,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2195730209350586,
"step": 1465,
"valid_targets_mean": 4228.3,
"valid_targets_min": 2352
},
{
"epoch": 2.367149758454106,
"grad_norm": 0.5322099118621038,
"learning_rate": 3.3492055986429235e-05,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22615352272987366,
"step": 1470,
"valid_targets_mean": 4539.8,
"valid_targets_min": 296
},
{
"epoch": 2.3752012882447664,
"grad_norm": 0.4656836442072764,
"learning_rate": 3.3432666610178936e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17955255508422852,
"step": 1475,
"valid_targets_mean": 4149.8,
"valid_targets_min": 1631
},
{
"epoch": 2.3832528180354267,
"grad_norm": 0.5493172940293227,
"learning_rate": 3.3373060661226944e-05,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23940381407737732,
"step": 1480,
"valid_targets_mean": 4181.2,
"valid_targets_min": 2011
},
{
"epoch": 2.391304347826087,
"grad_norm": 0.49597904545260957,
"learning_rate": 3.331323910059027e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24300578236579895,
"step": 1485,
"valid_targets_mean": 3967.4,
"valid_targets_min": 677
},
{
"epoch": 2.399355877616747,
"grad_norm": 0.5003561031279338,
"learning_rate": 3.3253202892762244e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1889512538909912,
"step": 1490,
"valid_targets_mean": 4254.9,
"valid_targets_min": 1570
},
{
"epoch": 2.4074074074074074,
"grad_norm": 0.4683723297524737,
"learning_rate": 3.319295300569686e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22197048366069794,
"step": 1495,
"valid_targets_mean": 5005.4,
"valid_targets_min": 857
},
{
"epoch": 2.4154589371980677,
"grad_norm": 0.5071114785034765,
"learning_rate": 3.3132490410793294e-05,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20913785696029663,
"step": 1500,
"valid_targets_mean": 4472.4,
"valid_targets_min": 1073
},
{
"epoch": 2.423510466988728,
"grad_norm": 0.4572009276147089,
"learning_rate": 3.3071816082880115e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19436806440353394,
"step": 1505,
"valid_targets_mean": 4905.2,
"valid_targets_min": 1404
},
{
"epoch": 2.4315619967793882,
"grad_norm": 0.5338897691126591,
"learning_rate": 3.3010931000199674e-05,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22107122838497162,
"step": 1510,
"valid_targets_mean": 4076.6,
"valid_targets_min": 1904
},
{
"epoch": 2.4396135265700485,
"grad_norm": 0.49724905678619213,
"learning_rate": 3.2949836144392256e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22516636550426483,
"step": 1515,
"valid_targets_mean": 5009.3,
"valid_targets_min": 1353
},
{
"epoch": 2.4476650563607087,
"grad_norm": 0.5108239733431804,
"learning_rate": 3.28885325004803e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23558905720710754,
"step": 1520,
"valid_targets_mean": 4774.4,
"valid_targets_min": 1731
},
{
"epoch": 2.455716586151369,
"grad_norm": 0.4908585219445986,
"learning_rate": 3.282702105685251e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22913925349712372,
"step": 1525,
"valid_targets_mean": 5611.8,
"valid_targets_min": 2104
},
{
"epoch": 2.463768115942029,
"grad_norm": 0.4523927665088012,
"learning_rate": 3.2765302805247885e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20795124769210815,
"step": 1530,
"valid_targets_mean": 4889.2,
"valid_targets_min": 2184
},
{
"epoch": 2.471819645732689,
"grad_norm": 0.5485354909981668,
"learning_rate": 3.270337874073977e-05,
"loss": 0.217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2317976951599121,
"step": 1535,
"valid_targets_mean": 5319.1,
"valid_targets_min": 1932
},
{
"epoch": 2.4798711755233493,
"grad_norm": 0.5061836838324374,
"learning_rate": 3.264124986171981e-05,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25826138257980347,
"step": 1540,
"valid_targets_mean": 4537.9,
"valid_targets_min": 453
},
{
"epoch": 2.4879227053140096,
"grad_norm": 0.47633311927326305,
"learning_rate": 3.2578917169881816e-05,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22371219098567963,
"step": 1545,
"valid_targets_mean": 4426.5,
"valid_targets_min": 1435
},
{
"epoch": 2.49597423510467,
"grad_norm": 0.528382297311333,
"learning_rate": 3.2516381670205665e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22219571471214294,
"step": 1550,
"valid_targets_mean": 4377.4,
"valid_targets_min": 812
},
{
"epoch": 2.50402576489533,
"grad_norm": 0.496647756887993,
"learning_rate": 3.245364437094105e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22214139997959137,
"step": 1555,
"valid_targets_mean": 4800.2,
"valid_targets_min": 1516
},
{
"epoch": 2.5120772946859904,
"grad_norm": 0.5176776733548973,
"learning_rate": 3.239070628359126e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2536792755126953,
"step": 1560,
"valid_targets_mean": 4532.4,
"valid_targets_min": 420
},
{
"epoch": 2.5201288244766507,
"grad_norm": 0.4521203535869814,
"learning_rate": 3.232756842289685e-05,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1837652325630188,
"step": 1565,
"valid_targets_mean": 4955.4,
"valid_targets_min": 1611
},
{
"epoch": 2.528180354267311,
"grad_norm": 0.48332269443651105,
"learning_rate": 3.2264231806819286e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18321290612220764,
"step": 1570,
"valid_targets_mean": 4541.4,
"valid_targets_min": 1371
},
{
"epoch": 2.536231884057971,
"grad_norm": 0.5203474071856915,
"learning_rate": 3.220069745652456e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2053850144147873,
"step": 1575,
"valid_targets_mean": 4024.7,
"valid_targets_min": 380
},
{
"epoch": 2.544283413848631,
"grad_norm": 0.46470085704874836,
"learning_rate": 3.213696639636666e-05,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19794431328773499,
"step": 1580,
"valid_targets_mean": 4241.2,
"valid_targets_min": 756
},
{
"epoch": 2.5523349436392913,
"grad_norm": 0.4921456777251355,
"learning_rate": 3.207303965387114e-05,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2276471108198166,
"step": 1585,
"valid_targets_mean": 4376.2,
"valid_targets_min": 327
},
{
"epoch": 2.5603864734299515,
"grad_norm": 0.5461925808616269,
"learning_rate": 3.200891825971846e-05,
"loss": 0.2148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2170354425907135,
"step": 1590,
"valid_targets_mean": 4376.3,
"valid_targets_min": 1624
},
{
"epoch": 2.5684380032206118,
"grad_norm": 0.45331868338223147,
"learning_rate": 3.194460324772746e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17769229412078857,
"step": 1595,
"valid_targets_mean": 4559.6,
"valid_targets_min": 1717
},
{
"epoch": 2.576489533011272,
"grad_norm": 0.5481556666487605,
"learning_rate": 3.188009565483861e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21930727362632751,
"step": 1600,
"valid_targets_mean": 3786.7,
"valid_targets_min": 627
},
{
"epoch": 2.5845410628019323,
"grad_norm": 0.5306078402232887,
"learning_rate": 3.1815396521097376e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22777387499809265,
"step": 1605,
"valid_targets_mean": 4098.1,
"valid_targets_min": 581
},
{
"epoch": 2.5925925925925926,
"grad_norm": 0.6396015312802733,
"learning_rate": 3.1750506889637366e-05,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606090009212494,
"step": 1610,
"valid_targets_mean": 4573.8,
"valid_targets_min": 513
},
{
"epoch": 2.600644122383253,
"grad_norm": 0.5139629491463821,
"learning_rate": 3.1685427806663574e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22717058658599854,
"step": 1615,
"valid_targets_mean": 4616.6,
"valid_targets_min": 2109
},
{
"epoch": 2.608695652173913,
"grad_norm": 0.4896772812229126,
"learning_rate": 3.1620160321435475e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2393844723701477,
"step": 1620,
"valid_targets_mean": 4748.1,
"valid_targets_min": 1671
},
{
"epoch": 2.6167471819645733,
"grad_norm": 0.5123496934824213,
"learning_rate": 3.155470548625014e-05,
"loss": 0.2257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2570544481277466,
"step": 1625,
"valid_targets_mean": 4746.9,
"valid_targets_min": 1642
},
{
"epoch": 2.6247987117552336,
"grad_norm": 0.5011886008293388,
"learning_rate": 3.1489064356425235e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21146038174629211,
"step": 1630,
"valid_targets_mean": 4106.5,
"valid_targets_min": 1263
},
{
"epoch": 2.632850241545894,
"grad_norm": 0.4918629952935143,
"learning_rate": 3.142323799028204e-05,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.205857515335083,
"step": 1635,
"valid_targets_mean": 4128.4,
"valid_targets_min": 713
},
{
"epoch": 2.640901771336554,
"grad_norm": 0.4975884336977351,
"learning_rate": 3.135722744912836e-05,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19787558913230896,
"step": 1640,
"valid_targets_mean": 5678.5,
"valid_targets_min": 886
},
{
"epoch": 2.6489533011272144,
"grad_norm": 0.48481732390442694,
"learning_rate": 3.129103379724143e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1850062608718872,
"step": 1645,
"valid_targets_mean": 3477.6,
"valid_targets_min": 752
},
{
"epoch": 2.6570048309178746,
"grad_norm": 0.4665528515319807,
"learning_rate": 3.122465810185075e-05,
"loss": 0.2172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21181383728981018,
"step": 1650,
"valid_targets_mean": 4864.5,
"valid_targets_min": 1598
},
{
"epoch": 2.6650563607085345,
"grad_norm": 0.5077396920276867,
"learning_rate": 3.1158101433120863e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19636741280555725,
"step": 1655,
"valid_targets_mean": 3697.4,
"valid_targets_min": 339
},
{
"epoch": 2.6731078904991947,
"grad_norm": 0.5055566499587948,
"learning_rate": 3.1091364864134136e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20249465107917786,
"step": 1660,
"valid_targets_mean": 4576.9,
"valid_targets_min": 543
},
{
"epoch": 2.681159420289855,
"grad_norm": 0.49702037708190555,
"learning_rate": 3.102444947087342e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17359226942062378,
"step": 1665,
"valid_targets_mean": 3802.2,
"valid_targets_min": 1850
},
{
"epoch": 2.6892109500805152,
"grad_norm": 0.543548482081646,
"learning_rate": 3.0957356332204745e-05,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21617215871810913,
"step": 1670,
"valid_targets_mean": 5324.2,
"valid_targets_min": 1401
},
{
"epoch": 2.6972624798711755,
"grad_norm": 0.473211339207569,
"learning_rate": 3.089008652985989e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20709389448165894,
"step": 1675,
"valid_targets_mean": 4730.4,
"valid_targets_min": 1283
},
{
"epoch": 2.7053140096618358,
"grad_norm": 0.48495909325226566,
"learning_rate": 3.082264114841892e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19697055220603943,
"step": 1680,
"valid_targets_mean": 4703.1,
"valid_targets_min": 1393
},
{
"epoch": 2.713365539452496,
"grad_norm": 0.525234042627054,
"learning_rate": 3.07550212752928e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21602725982666016,
"step": 1685,
"valid_targets_mean": 4527.6,
"valid_targets_min": 728
},
{
"epoch": 2.7214170692431563,
"grad_norm": 0.49507933380428965,
"learning_rate": 3.068722800070574e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23652076721191406,
"step": 1690,
"valid_targets_mean": 3893.8,
"valid_targets_min": 1490
},
{
"epoch": 2.7294685990338166,
"grad_norm": 0.478229441737468,
"learning_rate": 3.0619262417677695e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20760485529899597,
"step": 1695,
"valid_targets_mean": 4375.8,
"valid_targets_min": 1930
},
{
"epoch": 2.7375201288244764,
"grad_norm": 0.4760382784479069,
"learning_rate": 3.055112562200673e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20306912064552307,
"step": 1700,
"valid_targets_mean": 4093.1,
"valid_targets_min": 892
},
{
"epoch": 2.7455716586151366,
"grad_norm": 0.567194545288659,
"learning_rate": 3.0482818712251318e-05,
"loss": 0.2031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22697149217128754,
"step": 1705,
"valid_targets_mean": 5224.9,
"valid_targets_min": 679
},
{
"epoch": 2.753623188405797,
"grad_norm": 0.7966562099200152,
"learning_rate": 3.0414342789712675e-05,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644144296646118,
"step": 1710,
"valid_targets_mean": 3641.8,
"valid_targets_min": 267
},
{
"epoch": 2.761674718196457,
"grad_norm": 0.5194781986137333,
"learning_rate": 3.034569895841699e-05,
"loss": 0.2012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20732516050338745,
"step": 1715,
"valid_targets_mean": 4665.7,
"valid_targets_min": 1796
},
{
"epoch": 2.7697262479871174,
"grad_norm": 0.5139542297559575,
"learning_rate": 3.0276888325097583e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2747165858745575,
"step": 1720,
"valid_targets_mean": 5593.7,
"valid_targets_min": 863
},
{
"epoch": 2.7777777777777777,
"grad_norm": 0.5017349754200195,
"learning_rate": 3.020791199917713e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19357708096504211,
"step": 1725,
"valid_targets_mean": 4411.8,
"valid_targets_min": 775
},
{
"epoch": 2.785829307568438,
"grad_norm": 0.47883623225450245,
"learning_rate": 3.0138771092749722e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21340464055538177,
"step": 1730,
"valid_targets_mean": 4259.2,
"valid_targets_min": 702
},
{
"epoch": 2.793880837359098,
"grad_norm": 0.5042451347947459,
"learning_rate": 3.006946672056297e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20300012826919556,
"step": 1735,
"valid_targets_mean": 4185.3,
"valid_targets_min": 1004
},
{
"epoch": 2.8019323671497585,
"grad_norm": 0.5599312568052899,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22356563806533813,
"step": 1740,
"valid_targets_mean": 4172.1,
"valid_targets_min": 1019
},
{
"epoch": 2.8099838969404187,
"grad_norm": 0.5188094581424917,
"learning_rate": 2.993037205106147e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21803626418113708,
"step": 1745,
"valid_targets_mean": 4445.8,
"valid_targets_min": 1772
},
{
"epoch": 2.818035426731079,
"grad_norm": 0.48903765537814037,
"learning_rate": 2.9860583996347495e-05,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21702814102172852,
"step": 1750,
"valid_targets_mean": 4806.7,
"valid_targets_min": 1671
},
{
"epoch": 2.8260869565217392,
"grad_norm": 0.48803716906398215,
"learning_rate": 2.9790636961039524e-05,
"loss": 0.2193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22425541281700134,
"step": 1755,
"valid_targets_mean": 4643.0,
"valid_targets_min": 1506
},
{
"epoch": 2.8341384863123995,
"grad_norm": 0.48749480729575717,
"learning_rate": 2.9720532072882268e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19417119026184082,
"step": 1760,
"valid_targets_mean": 4002.8,
"valid_targets_min": 1522
},
{
"epoch": 2.8421900161030598,
"grad_norm": 0.45848716202240636,
"learning_rate": 2.965027046216544e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1857365071773529,
"step": 1765,
"valid_targets_mean": 4783.7,
"valid_targets_min": 1919
},
{
"epoch": 2.85024154589372,
"grad_norm": 0.6718800164601025,
"learning_rate": 2.9579853261705573e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23533181846141815,
"step": 1770,
"valid_targets_mean": 4673.9,
"valid_targets_min": 1311
},
{
"epoch": 2.8582930756843803,
"grad_norm": 0.4660110391421861,
"learning_rate": 2.950928160682775e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19263693690299988,
"step": 1775,
"valid_targets_mean": 4255.1,
"valid_targets_min": 1076
},
{
"epoch": 2.86634460547504,
"grad_norm": 0.5145254890484248,
"learning_rate": 2.943855663534731e-05,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23376551270484924,
"step": 1780,
"valid_targets_mean": 4397.2,
"valid_targets_min": 1787
},
{
"epoch": 2.8743961352657004,
"grad_norm": 0.4906091551370421,
"learning_rate": 2.9367679487551473e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20546765625476837,
"step": 1785,
"valid_targets_mean": 3990.4,
"valid_targets_min": 1477
},
{
"epoch": 2.8824476650563606,
"grad_norm": 0.5093898731159036,
"learning_rate": 2.929665130618098e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22851824760437012,
"step": 1790,
"valid_targets_mean": 5522.1,
"valid_targets_min": 1762
},
{
"epoch": 2.890499194847021,
"grad_norm": 0.4518802511006292,
"learning_rate": 2.9225473236411655e-05,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18847951292991638,
"step": 1795,
"valid_targets_mean": 4818.7,
"valid_targets_min": 1111
},
{
"epoch": 2.898550724637681,
"grad_norm": 0.6937426790422542,
"learning_rate": 2.915414642583596e-05,
"loss": 0.2148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20088736712932587,
"step": 1800,
"valid_targets_mean": 3600.9,
"valid_targets_min": 848
},
{
"epoch": 2.9066022544283414,
"grad_norm": 0.46521668715049397,
"learning_rate": 2.9082672024444485e-05,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22432249784469604,
"step": 1805,
"valid_targets_mean": 4322.0,
"valid_targets_min": 1358
},
{
"epoch": 2.9146537842190017,
"grad_norm": 0.436860595041999,
"learning_rate": 2.901105118460737e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1966436803340912,
"step": 1810,
"valid_targets_mean": 4940.1,
"valid_targets_min": 1944
},
{
"epoch": 2.922705314009662,
"grad_norm": 0.5361044008606226,
"learning_rate": 2.8939285061055807e-05,
"loss": 0.2146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2078220695257187,
"step": 1815,
"valid_targets_mean": 3302.5,
"valid_targets_min": 609
},
{
"epoch": 2.930756843800322,
"grad_norm": 0.49990872670719105,
"learning_rate": 2.8867374810863325e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2396693229675293,
"step": 1820,
"valid_targets_mean": 4933.6,
"valid_targets_min": 1197
},
{
"epoch": 2.938808373590982,
"grad_norm": 0.4676050983632418,
"learning_rate": 2.8795321593427227e-05,
"loss": 0.2105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21761463582515717,
"step": 1825,
"valid_targets_mean": 4473.9,
"valid_targets_min": 1740
},
{
"epoch": 2.9468599033816423,
"grad_norm": 0.4579800892905144,
"learning_rate": 2.8723126570449813e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22557538747787476,
"step": 1830,
"valid_targets_mean": 4990.2,
"valid_targets_min": 1104
},
{
"epoch": 2.9549114331723025,
"grad_norm": 0.521039627014324,
"learning_rate": 2.8650790905919724e-05,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21462702751159668,
"step": 1835,
"valid_targets_mean": 4125.9,
"valid_targets_min": 1187
},
{
"epoch": 2.962962962962963,
"grad_norm": 0.5446614093095541,
"learning_rate": 2.8578315766093133e-05,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22720134258270264,
"step": 1840,
"valid_targets_mean": 4199.9,
"valid_targets_min": 379
},
{
"epoch": 2.971014492753623,
"grad_norm": 0.5085501802829419,
"learning_rate": 2.850570231947493e-05,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20165984332561493,
"step": 1845,
"valid_targets_mean": 4610.2,
"valid_targets_min": 745
},
{
"epoch": 2.9790660225442833,
"grad_norm": 0.4995531673717949,
"learning_rate": 2.8432951736799933e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21701423823833466,
"step": 1850,
"valid_targets_mean": 4243.4,
"valid_targets_min": 1952
},
{
"epoch": 2.9871175523349436,
"grad_norm": 0.5654118721016965,
"learning_rate": 2.8360065191013967e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22924692928791046,
"step": 1855,
"valid_targets_mean": 3948.6,
"valid_targets_min": 1818
},
{
"epoch": 2.995169082125604,
"grad_norm": 0.5368747366497263,
"learning_rate": 2.8287043857254957e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18569841980934143,
"step": 1860,
"valid_targets_mean": 4243.3,
"valid_targets_min": 944
},
{
"epoch": 3.003220611916264,
"grad_norm": 0.5308612324214572,
"learning_rate": 2.8213888912834026e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20392943918704987,
"step": 1865,
"valid_targets_mean": 5240.9,
"valid_targets_min": 3176
},
{
"epoch": 3.0112721417069244,
"grad_norm": 0.5850366317547473,
"learning_rate": 2.814060153721644e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22741422057151794,
"step": 1870,
"valid_targets_mean": 4518.1,
"valid_targets_min": 1313
},
{
"epoch": 3.0193236714975846,
"grad_norm": 0.5456534322958014,
"learning_rate": 2.8067182912002663e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19902676343917847,
"step": 1875,
"valid_targets_mean": 4697.9,
"valid_targets_min": 1401
},
{
"epoch": 3.027375201288245,
"grad_norm": 0.5866691020588805,
"learning_rate": 2.7993634220909254e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17653107643127441,
"step": 1880,
"valid_targets_mean": 5312.7,
"valid_targets_min": 1668
},
{
"epoch": 3.035426731078905,
"grad_norm": 0.4839014869325985,
"learning_rate": 2.7919956649749826e-05,
"loss": 0.2012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.207495778799057,
"step": 1885,
"valid_targets_mean": 4792.9,
"valid_targets_min": 1475
},
{
"epoch": 3.0434782608695654,
"grad_norm": 0.5792725572749162,
"learning_rate": 2.784615138641588e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2462862730026245,
"step": 1890,
"valid_targets_mean": 3582.7,
"valid_targets_min": 1264
},
{
"epoch": 3.0515297906602252,
"grad_norm": 0.5471292037490801,
"learning_rate": 2.7772219620857685e-05,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2000941038131714,
"step": 1895,
"valid_targets_mean": 4260.8,
"valid_targets_min": 1662
},
{
"epoch": 3.0595813204508855,
"grad_norm": 0.5418789392536902,
"learning_rate": 2.769816254506509e-05,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17109820246696472,
"step": 1900,
"valid_targets_mean": 4285.0,
"valid_targets_min": 688
},
{
"epoch": 3.0676328502415457,
"grad_norm": 0.5696873068816691,
"learning_rate": 2.76239813530483e-05,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17864085733890533,
"step": 1905,
"valid_targets_mean": 3839.0,
"valid_targets_min": 356
},
{
"epoch": 3.075684380032206,
"grad_norm": 0.5257872930167539,
"learning_rate": 2.7549677240818628e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20962268114089966,
"step": 1910,
"valid_targets_mean": 4587.1,
"valid_targets_min": 854
},
{
"epoch": 3.0837359098228663,
"grad_norm": 0.5648446285032245,
"learning_rate": 2.7475251406369197e-05,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20219004154205322,
"step": 1915,
"valid_targets_mean": 4792.9,
"valid_targets_min": 1897
},
{
"epoch": 3.0917874396135265,
"grad_norm": 0.454963234903237,
"learning_rate": 2.740070504965565e-05,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1661757528781891,
"step": 1920,
"valid_targets_mean": 5107.2,
"valid_targets_min": 1842
},
{
"epoch": 3.099838969404187,
"grad_norm": 0.5802646506856157,
"learning_rate": 2.7326039372576782e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20974227786064148,
"step": 1925,
"valid_targets_mean": 4211.8,
"valid_targets_min": 1850
},
{
"epoch": 3.107890499194847,
"grad_norm": 0.5115859872263251,
"learning_rate": 2.7251255578955186e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.191048726439476,
"step": 1930,
"valid_targets_mean": 4847.3,
"valid_targets_min": 2149
},
{
"epoch": 3.1159420289855073,
"grad_norm": 0.4838092911137751,
"learning_rate": 2.7176354874517805e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18548092246055603,
"step": 1935,
"valid_targets_mean": 4928.9,
"valid_targets_min": 1746
},
{
"epoch": 3.1239935587761676,
"grad_norm": 0.6716396355587732,
"learning_rate": 2.7101338466876542e-05,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17967697978019714,
"step": 1940,
"valid_targets_mean": 3838.4,
"valid_targets_min": 933
},
{
"epoch": 3.132045088566828,
"grad_norm": 0.5175526656495621,
"learning_rate": 2.702620756550874e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18851426243782043,
"step": 1945,
"valid_targets_mean": 4249.6,
"valid_targets_min": 1164
},
{
"epoch": 3.140096618357488,
"grad_norm": 0.5292721987453661,
"learning_rate": 2.6950963381737728e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20516784489154816,
"step": 1950,
"valid_targets_mean": 4134.1,
"valid_targets_min": 1487
},
{
"epoch": 3.148148148148148,
"grad_norm": 0.5429459342739271,
"learning_rate": 2.687560712871325e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19477809965610504,
"step": 1955,
"valid_targets_mean": 4617.6,
"valid_targets_min": 321
},
{
"epoch": 3.156199677938808,
"grad_norm": 0.5204990053162142,
"learning_rate": 2.6800140021391933e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2121405303478241,
"step": 1960,
"valid_targets_mean": 5504.8,
"valid_targets_min": 2133
},
{
"epoch": 3.1642512077294684,
"grad_norm": 0.5107603352588185,
"learning_rate": 2.6724563276517697e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.217079758644104,
"step": 1965,
"valid_targets_mean": 4874.7,
"valid_targets_min": 578
},
{
"epoch": 3.1723027375201287,
"grad_norm": 0.5709422965320798,
"learning_rate": 2.6648878112602115e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20290029048919678,
"step": 1970,
"valid_targets_mean": 4168.8,
"valid_targets_min": 537
},
{
"epoch": 3.180354267310789,
"grad_norm": 0.5236384072204857,
"learning_rate": 2.6573085749904784e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18646635115146637,
"step": 1975,
"valid_targets_mean": 5792.3,
"valid_targets_min": 3148
},
{
"epoch": 3.1884057971014492,
"grad_norm": 0.4931013592583483,
"learning_rate": 2.6497187410413676e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16621598601341248,
"step": 1980,
"valid_targets_mean": 4182.5,
"valid_targets_min": 626
},
{
"epoch": 3.1964573268921095,
"grad_norm": 0.513477571797092,
"learning_rate": 2.642118431782537e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19758376479148865,
"step": 1985,
"valid_targets_mean": 4814.4,
"valid_targets_min": 841
},
{
"epoch": 3.2045088566827697,
"grad_norm": 0.5208664241436397,
"learning_rate": 2.6345077697525394e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2036036252975464,
"step": 1990,
"valid_targets_mean": 4699.8,
"valid_targets_min": 1314
},
{
"epoch": 3.21256038647343,
"grad_norm": 0.48590086014586165,
"learning_rate": 2.6268868776568416e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1840904951095581,
"step": 1995,
"valid_targets_mean": 4029.8,
"valid_targets_min": 2119
},
{
"epoch": 3.2206119162640903,
"grad_norm": 0.48975245964069325,
"learning_rate": 2.619255878365849e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19650408625602722,
"step": 2000,
"valid_targets_mean": 4923.2,
"valid_targets_min": 2035
},
{
"epoch": 3.2286634460547505,
"grad_norm": 0.4730736998762011,
"learning_rate": 2.6116148949129237e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19848835468292236,
"step": 2005,
"valid_targets_mean": 5154.9,
"valid_targets_min": 862
},
{
"epoch": 3.236714975845411,
"grad_norm": 0.49293775625702296,
"learning_rate": 2.603964050492401e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1910780966281891,
"step": 2010,
"valid_targets_mean": 5177.5,
"valid_targets_min": 1035
},
{
"epoch": 3.244766505636071,
"grad_norm": 0.4352279629169526,
"learning_rate": 2.5963034684576024e-05,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1654304563999176,
"step": 2015,
"valid_targets_mean": 4889.2,
"valid_targets_min": 755
},
{
"epoch": 3.2528180354267313,
"grad_norm": 0.48928557887722884,
"learning_rate": 2.5886332723188484e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17599686980247498,
"step": 2020,
"valid_targets_mean": 3929.6,
"valid_targets_min": 627
},
{
"epoch": 3.260869565217391,
"grad_norm": 0.4602375034247986,
"learning_rate": 2.5809535857414637e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19927427172660828,
"step": 2025,
"valid_targets_mean": 4907.2,
"valid_targets_min": 700
},
{
"epoch": 3.2689210950080514,
"grad_norm": 0.45533522839686313,
"learning_rate": 2.573264532543788e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1822260171175003,
"step": 2030,
"valid_targets_mean": 4557.0,
"valid_targets_min": 2401
},
{
"epoch": 3.2769726247987117,
"grad_norm": 0.5432317512688624,
"learning_rate": 2.5655662366951778e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1943272203207016,
"step": 2035,
"valid_targets_mean": 3990.8,
"valid_targets_min": 1026
},
{
"epoch": 3.285024154589372,
"grad_norm": 0.5340485828335133,
"learning_rate": 2.557858822314007e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2411888986825943,
"step": 2040,
"valid_targets_mean": 4090.6,
"valid_targets_min": 1032
},
{
"epoch": 3.293075684380032,
"grad_norm": 0.5155182145466647,
"learning_rate": 2.5501424136656635e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2276889681816101,
"step": 2045,
"valid_targets_mean": 4593.6,
"valid_targets_min": 574
},
{
"epoch": 3.3011272141706924,
"grad_norm": 0.5465406153378882,
"learning_rate": 2.5424171351605518e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17450806498527527,
"step": 2050,
"valid_targets_mean": 4325.6,
"valid_targets_min": 1283
},
{
"epoch": 3.3091787439613527,
"grad_norm": 0.5652814304177497,
"learning_rate": 2.5346831113520827e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21284984052181244,
"step": 2055,
"valid_targets_mean": 4811.6,
"valid_targets_min": 1066
},
{
"epoch": 3.317230273752013,
"grad_norm": 0.5717869882020237,
"learning_rate": 2.526940466934664e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19881507754325867,
"step": 2060,
"valid_targets_mean": 3001.5,
"valid_targets_min": 350
},
{
"epoch": 3.325281803542673,
"grad_norm": 0.5193991609655757,
"learning_rate": 2.5191893267416964e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19282767176628113,
"step": 2065,
"valid_targets_mean": 4379.1,
"valid_targets_min": 943
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.5087654352874541,
"learning_rate": 2.5114298157435526e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22454917430877686,
"step": 2070,
"valid_targets_mean": 5994.5,
"valid_targets_min": 1253
},
{
"epoch": 3.3413848631239937,
"grad_norm": 0.4773374743223842,
"learning_rate": 2.503662059045568e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19372783601284027,
"step": 2075,
"valid_targets_mean": 4415.6,
"valid_targets_min": 1046
},
{
"epoch": 3.3494363929146536,
"grad_norm": 0.5211750691881805,
"learning_rate": 2.4958861818860217e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20317870378494263,
"step": 2080,
"valid_targets_mean": 4938.8,
"valid_targets_min": 1053
},
{
"epoch": 3.357487922705314,
"grad_norm": 0.580769513908195,
"learning_rate": 2.488102309634119e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17012670636177063,
"step": 2085,
"valid_targets_mean": 3300.9,
"valid_targets_min": 570
},
{
"epoch": 3.365539452495974,
"grad_norm": 0.4677262023270228,
"learning_rate": 2.480310567787967e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21143823862075806,
"step": 2090,
"valid_targets_mean": 4960.4,
"valid_targets_min": 1486
},
{
"epoch": 3.3735909822866343,
"grad_norm": 0.498695274074395,
"learning_rate": 2.4725110819725542e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19077152013778687,
"step": 2095,
"valid_targets_mean": 4409.8,
"valid_targets_min": 1603
},
{
"epoch": 3.3816425120772946,
"grad_norm": 0.6606944270313985,
"learning_rate": 2.464703977937723e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2209235429763794,
"step": 2100,
"valid_targets_mean": 5160.9,
"valid_targets_min": 2260
},
{
"epoch": 3.389694041867955,
"grad_norm": 0.48392843927081547,
"learning_rate": 2.456889381556144e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1707090586423874,
"step": 2105,
"valid_targets_mean": 4587.8,
"valid_targets_min": 1717
},
{
"epoch": 3.397745571658615,
"grad_norm": 0.4875147573168212,
"learning_rate": 2.449067418821285e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18568046391010284,
"step": 2110,
"valid_targets_mean": 4881.9,
"valid_targets_min": 2069
},
{
"epoch": 3.4057971014492754,
"grad_norm": 0.5240738697697526,
"learning_rate": 2.4412382158453807e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17656230926513672,
"step": 2115,
"valid_targets_mean": 4386.1,
"valid_targets_min": 1483
},
{
"epoch": 3.4138486312399356,
"grad_norm": 0.5359424822294189,
"learning_rate": 2.4334018988573983e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22453176975250244,
"step": 2120,
"valid_targets_mean": 4363.1,
"valid_targets_min": 2099
},
{
"epoch": 3.421900161030596,
"grad_norm": 0.7044397785288949,
"learning_rate": 2.425558594201004e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17415092885494232,
"step": 2125,
"valid_targets_mean": 4853.5,
"valid_targets_min": 1658
},
{
"epoch": 3.429951690821256,
"grad_norm": 0.7313542515268883,
"learning_rate": 2.417708428332525e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18305009603500366,
"step": 2130,
"valid_targets_mean": 4156.8,
"valid_targets_min": 317
},
{
"epoch": 3.4380032206119164,
"grad_norm": 0.4738591164631795,
"learning_rate": 2.4098515278189097e-05,
"loss": 0.192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1723197102546692,
"step": 2135,
"valid_targets_mean": 4533.4,
"valid_targets_min": 1353
},
{
"epoch": 3.4460547504025767,
"grad_norm": 0.5276265701938105,
"learning_rate": 2.4019880193356902e-05,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17899435758590698,
"step": 2140,
"valid_targets_mean": 4434.9,
"valid_targets_min": 675
},
{
"epoch": 3.454106280193237,
"grad_norm": 0.5632489582281142,
"learning_rate": 2.3941180296649348e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22366738319396973,
"step": 2145,
"valid_targets_mean": 3995.8,
"valid_targets_min": 1400
},
{
"epoch": 3.4621578099838968,
"grad_norm": 0.5526994009194625,
"learning_rate": 2.3862416856932087e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19457975029945374,
"step": 2150,
"valid_targets_mean": 3929.9,
"valid_targets_min": 1593
},
{
"epoch": 3.470209339774557,
"grad_norm": 0.5417281294909433,
"learning_rate": 2.378359114409527e-05,
"loss": 0.2146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20209567248821259,
"step": 2155,
"valid_targets_mean": 4491.2,
"valid_targets_min": 1771
},
{
"epoch": 3.4782608695652173,
"grad_norm": 0.5283860783665116,
"learning_rate": 2.370470442903306e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2074143886566162,
"step": 2160,
"valid_targets_mean": 3453.6,
"valid_targets_min": 656
},
{
"epoch": 3.4863123993558776,
"grad_norm": 0.5596014550678241,
"learning_rate": 2.362575798362315e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20553532242774963,
"step": 2165,
"valid_targets_mean": 3728.8,
"valid_targets_min": 1291
},
{
"epoch": 3.494363929146538,
"grad_norm": 0.47388886907429295,
"learning_rate": 2.3546753080706242e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2011997401714325,
"step": 2170,
"valid_targets_mean": 4747.0,
"valid_targets_min": 1499
},
{
"epoch": 3.502415458937198,
"grad_norm": 0.5433473628742698,
"learning_rate": 2.346769099406557e-05,
"loss": 0.2048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22939231991767883,
"step": 2175,
"valid_targets_mean": 3726.4,
"valid_targets_min": 824
},
{
"epoch": 3.5104669887278583,
"grad_norm": 0.4457288216134543,
"learning_rate": 2.33885729984063e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1754472553730011,
"step": 2180,
"valid_targets_mean": 5101.0,
"valid_targets_min": 1832
},
{
"epoch": 3.5185185185185186,
"grad_norm": 0.511189888500102,
"learning_rate": 2.3309400369335033e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18584825098514557,
"step": 2185,
"valid_targets_mean": 4445.9,
"valid_targets_min": 1920
},
{
"epoch": 3.526570048309179,
"grad_norm": 0.5632502133321703,
"learning_rate": 2.3230174383339196e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2198297381401062,
"step": 2190,
"valid_targets_mean": 4171.1,
"valid_targets_min": 758
},
{
"epoch": 3.534621578099839,
"grad_norm": 0.4874975024015211,
"learning_rate": 2.3150896317766505e-05,
"loss": 0.1896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1995978057384491,
"step": 2195,
"valid_targets_mean": 4628.1,
"valid_targets_min": 1282
},
{
"epoch": 3.542673107890499,
"grad_norm": 0.47843928271386893,
"learning_rate": 2.3071567450804325e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1690368950366974,
"step": 2200,
"valid_targets_mean": 4314.7,
"valid_targets_min": 1529
},
{
"epoch": 3.550724637681159,
"grad_norm": 0.5030690747235215,
"learning_rate": 2.299218906145909e-05,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17591848969459534,
"step": 2205,
"valid_targets_mean": 4831.5,
"valid_targets_min": 1692
},
{
"epoch": 3.5587761674718195,
"grad_norm": 0.4445594459012944,
"learning_rate": 2.2912762429535684e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2045142650604248,
"step": 2210,
"valid_targets_mean": 5075.3,
"valid_targets_min": 1787
},
{
"epoch": 3.5668276972624797,
"grad_norm": 0.5066371584429301,
"learning_rate": 2.2833288835616784e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20660072565078735,
"step": 2215,
"valid_targets_mean": 4255.6,
"valid_targets_min": 978
},
{
"epoch": 3.57487922705314,
"grad_norm": 0.5314312269324657,
"learning_rate": 2.2753769561042235e-05,
"loss": 0.2013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1856955885887146,
"step": 2220,
"valid_targets_mean": 4382.4,
"valid_targets_min": 306
},
{
"epoch": 3.5829307568438002,
"grad_norm": 0.594664193968932,
"learning_rate": 2.2674205887888386e-05,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22779573500156403,
"step": 2225,
"valid_targets_mean": 4177.1,
"valid_targets_min": 581
},
{
"epoch": 3.5909822866344605,
"grad_norm": 0.4922219770303433,
"learning_rate": 2.259459909894742e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22328010201454163,
"step": 2230,
"valid_targets_mean": 5152.0,
"valid_targets_min": 851
},
{
"epoch": 3.5990338164251208,
"grad_norm": 0.48869544172575563,
"learning_rate": 2.2514950477706657e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20914164185523987,
"step": 2235,
"valid_targets_mean": 5138.6,
"valid_targets_min": 1484
},
{
"epoch": 3.607085346215781,
"grad_norm": 0.6963749789958893,
"learning_rate": 2.2435261308327875e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1746867597103119,
"step": 2240,
"valid_targets_mean": 4765.4,
"valid_targets_min": 1839
},
{
"epoch": 3.6151368760064413,
"grad_norm": 0.5367886666270889,
"learning_rate": 2.2355532875626612e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18968860805034637,
"step": 2245,
"valid_targets_mean": 3609.9,
"valid_targets_min": 1136
},
{
"epoch": 3.6231884057971016,
"grad_norm": 0.5074205448750082,
"learning_rate": 2.2275766465051444e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20984122157096863,
"step": 2250,
"valid_targets_mean": 4557.3,
"valid_targets_min": 818
},
{
"epoch": 3.631239935587762,
"grad_norm": 0.5328336917497768,
"learning_rate": 2.2195963362663236e-05,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1873650997877121,
"step": 2255,
"valid_targets_mean": 4251.6,
"valid_targets_min": 1417
},
{
"epoch": 3.639291465378422,
"grad_norm": 0.5279031470689559,
"learning_rate": 2.211612485511446e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19223317503929138,
"step": 2260,
"valid_targets_mean": 4547.8,
"valid_targets_min": 989
},
{
"epoch": 3.6473429951690823,
"grad_norm": 0.4807142652014487,
"learning_rate": 2.2036252229628392e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17448017001152039,
"step": 2265,
"valid_targets_mean": 4428.8,
"valid_targets_min": 1791
},
{
"epoch": 3.6553945249597426,
"grad_norm": 0.46162214621632697,
"learning_rate": 2.19563467739784e-05,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15724977850914001,
"step": 2270,
"valid_targets_mean": 4100.6,
"valid_targets_min": 1856
},
{
"epoch": 3.6634460547504024,
"grad_norm": 0.437259128811763,
"learning_rate": 2.1876409776467165e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19419334828853607,
"step": 2275,
"valid_targets_mean": 5604.3,
"valid_targets_min": 1799
},
{
"epoch": 3.6714975845410627,
"grad_norm": 0.509046081849507,
"learning_rate": 2.1796442525905923e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1819322556257248,
"step": 2280,
"valid_targets_mean": 3572.2,
"valid_targets_min": 1228
},
{
"epoch": 3.679549114331723,
"grad_norm": 0.512456182600672,
"learning_rate": 2.171644631159366e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21677514910697937,
"step": 2285,
"valid_targets_mean": 4920.6,
"valid_targets_min": 720
},
{
"epoch": 3.687600644122383,
"grad_norm": 3.5749072057598865,
"learning_rate": 2.163642242329633e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1948278695344925,
"step": 2290,
"valid_targets_mean": 4014.2,
"valid_targets_min": 1316
},
{
"epoch": 3.6956521739130435,
"grad_norm": 0.48865940439627575,
"learning_rate": 2.1556372151226097e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21440473198890686,
"step": 2295,
"valid_targets_mean": 4626.4,
"valid_targets_min": 1967
},
{
"epoch": 3.7037037037037037,
"grad_norm": 0.5877525411956264,
"learning_rate": 2.1476296786020502e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.173828125,
"step": 2300,
"valid_targets_mean": 4059.1,
"valid_targets_min": 345
},
{
"epoch": 3.711755233494364,
"grad_norm": 0.532071939990665,
"learning_rate": 2.139619761872163e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20449981093406677,
"step": 2305,
"valid_targets_mean": 3978.1,
"valid_targets_min": 987
},
{
"epoch": 3.7198067632850242,
"grad_norm": 0.5500257667017805,
"learning_rate": 2.1316075940755363e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19600236415863037,
"step": 2310,
"valid_targets_mean": 4358.1,
"valid_targets_min": 2076
},
{
"epoch": 3.7278582930756845,
"grad_norm": 0.4910824420542707,
"learning_rate": 2.1235933043910488e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1749979555606842,
"step": 2315,
"valid_targets_mean": 3997.7,
"valid_targets_min": 1403
},
{
"epoch": 3.7359098228663448,
"grad_norm": 0.49001315022408615,
"learning_rate": 2.1155770220317918e-05,
"loss": 0.2012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1976926326751709,
"step": 2320,
"valid_targets_mean": 4852.8,
"valid_targets_min": 506
},
{
"epoch": 3.7439613526570046,
"grad_norm": 0.6702681948241392,
"learning_rate": 2.107558876242983e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19468314945697784,
"step": 2325,
"valid_targets_mean": 3499.4,
"valid_targets_min": 1520
},
{
"epoch": 3.752012882447665,
"grad_norm": 0.4609480240941858,
"learning_rate": 2.0995389962998845e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19903123378753662,
"step": 2330,
"valid_targets_mean": 4891.3,
"valid_targets_min": 1678
},
{
"epoch": 3.760064412238325,
"grad_norm": 0.48913542025927365,
"learning_rate": 2.091517511505719e-05,
"loss": 0.2002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21223650872707367,
"step": 2335,
"valid_targets_mean": 4559.2,
"valid_targets_min": 2650
},
{
"epoch": 3.7681159420289854,
"grad_norm": 0.46883840985224706,
"learning_rate": 2.0834945511895816e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1941649466753006,
"step": 2340,
"valid_targets_mean": 5603.5,
"valid_targets_min": 2498
},
{
"epoch": 3.7761674718196456,
"grad_norm": 0.4681238690714185,
"learning_rate": 2.0754702447043585e-05,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1943756639957428,
"step": 2345,
"valid_targets_mean": 4566.8,
"valid_targets_min": 677
},
{
"epoch": 3.784219001610306,
"grad_norm": 0.4482811469832385,
"learning_rate": 2.0674447214246394e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1913878321647644,
"step": 2350,
"valid_targets_mean": 5163.6,
"valid_targets_min": 2337
},
{
"epoch": 3.792270531400966,
"grad_norm": 0.47556405809315727,
"learning_rate": 2.059418110744633e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18677163124084473,
"step": 2355,
"valid_targets_mean": 4713.3,
"valid_targets_min": 933
},
{
"epoch": 3.8003220611916264,
"grad_norm": 0.4690759790686193,
"learning_rate": 2.0513905420760798e-05,
"loss": 0.1988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19385367631912231,
"step": 2360,
"valid_targets_mean": 4902.2,
"valid_targets_min": 627
},
{
"epoch": 3.8083735909822867,
"grad_norm": 0.5121675478037654,
"learning_rate": 2.043362144846164e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19691093266010284,
"step": 2365,
"valid_targets_mean": 3866.6,
"valid_targets_min": 689
},
{
"epoch": 3.816425120772947,
"grad_norm": 0.52059333383564,
"learning_rate": 2.035333048495431e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16973920166492462,
"step": 2370,
"valid_targets_mean": 3510.0,
"valid_targets_min": 909
},
{
"epoch": 3.824476650563607,
"grad_norm": 0.5076146647866968,
"learning_rate": 2.0273033824756964e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17860174179077148,
"step": 2375,
"valid_targets_mean": 3703.1,
"valid_targets_min": 506
},
{
"epoch": 3.8325281803542675,
"grad_norm": 0.6011850519404554,
"learning_rate": 2.0192732762479616e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20434610545635223,
"step": 2380,
"valid_targets_mean": 4579.6,
"valid_targets_min": 631
},
{
"epoch": 3.8405797101449277,
"grad_norm": 0.5345131849791486,
"learning_rate": 2.011242859280325e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21205343306064606,
"step": 2385,
"valid_targets_mean": 4124.2,
"valid_targets_min": 823
},
{
"epoch": 3.848631239935588,
"grad_norm": 0.5114321926687082,
"learning_rate": 2.0032122610458947e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17156703770160675,
"step": 2390,
"valid_targets_mean": 4274.9,
"valid_targets_min": 1740
},
{
"epoch": 3.8566827697262482,
"grad_norm": 0.6336174608958026,
"learning_rate": 1.9951816110207004e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1964995563030243,
"step": 2395,
"valid_targets_mean": 4251.1,
"valid_targets_min": 1610
},
{
"epoch": 3.864734299516908,
"grad_norm": 0.49492043165747124,
"learning_rate": 1.9871510386816103e-05,
"loss": 0.1869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17603623867034912,
"step": 2400,
"valid_targets_mean": 4051.9,
"valid_targets_min": 1925
},
{
"epoch": 3.8727858293075683,
"grad_norm": 0.5681035881235681,
"learning_rate": 1.979120673504235e-05,
"loss": 0.2058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20705150067806244,
"step": 2405,
"valid_targets_mean": 5603.1,
"valid_targets_min": 3701
},
{
"epoch": 3.8808373590982286,
"grad_norm": 1.2929630707396456,
"learning_rate": 1.9710906449608498e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19122429192066193,
"step": 2410,
"valid_targets_mean": 4886.8,
"valid_targets_min": 1569
},
{
"epoch": 3.888888888888889,
"grad_norm": 0.47492876907794285,
"learning_rate": 1.9630610825182992e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18603213131427765,
"step": 2415,
"valid_targets_mean": 4944.1,
"valid_targets_min": 1929
},
{
"epoch": 3.896940418679549,
"grad_norm": 0.5030538323026981,
"learning_rate": 1.955032115635915e-05,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22285720705986023,
"step": 2420,
"valid_targets_mean": 4422.1,
"valid_targets_min": 1352
},
{
"epoch": 3.9049919484702094,
"grad_norm": 0.5031818050359901,
"learning_rate": 1.9470038737634257e-05,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19892553985118866,
"step": 2425,
"valid_targets_mean": 4099.8,
"valid_targets_min": 1262
},
{
"epoch": 3.9130434782608696,
"grad_norm": 0.5757670497420159,
"learning_rate": 1.9389764863388706e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19620567560195923,
"step": 2430,
"valid_targets_mean": 3868.5,
"valid_targets_min": 545
},
{
"epoch": 3.92109500805153,
"grad_norm": 0.48359405966706115,
"learning_rate": 1.9309500827865136e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1803748607635498,
"step": 2435,
"valid_targets_mean": 4338.0,
"valid_targets_min": 1348
},
{
"epoch": 3.92914653784219,
"grad_norm": 0.4640923476833218,
"learning_rate": 1.9229247925147553e-05,
"loss": 0.1968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1907849907875061,
"step": 2440,
"valid_targets_mean": 4583.9,
"valid_targets_min": 1771
},
{
"epoch": 3.9371980676328504,
"grad_norm": 0.5117773057032822,
"learning_rate": 1.9149007449140462e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17059685289859772,
"step": 2445,
"valid_targets_mean": 4338.1,
"valid_targets_min": 1784
},
{
"epoch": 3.9452495974235102,
"grad_norm": 0.5915049699700269,
"learning_rate": 1.906878069354804e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21201738715171814,
"step": 2450,
"valid_targets_mean": 3018.6,
"valid_targets_min": 1027
},
{
"epoch": 3.9533011272141705,
"grad_norm": 0.47160593652811594,
"learning_rate": 1.898856895185322e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16955235600471497,
"step": 2455,
"valid_targets_mean": 4181.1,
"valid_targets_min": 1075
},
{
"epoch": 3.9613526570048307,
"grad_norm": 0.49702142957897827,
"learning_rate": 1.8908373517296888e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19719739258289337,
"step": 2460,
"valid_targets_mean": 4295.4,
"valid_targets_min": 249
},
{
"epoch": 3.969404186795491,
"grad_norm": 0.5129921266484054,
"learning_rate": 1.882819568285701e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19295062124729156,
"step": 2465,
"valid_targets_mean": 3921.4,
"valid_targets_min": 966
},
{
"epoch": 3.9774557165861513,
"grad_norm": 0.45382648008126336,
"learning_rate": 1.874803674122778e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1945837438106537,
"step": 2470,
"valid_targets_mean": 5054.1,
"valid_targets_min": 1828
},
{
"epoch": 3.9855072463768115,
"grad_norm": 0.47820396478837407,
"learning_rate": 1.8667897984798804e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21562841534614563,
"step": 2475,
"valid_targets_mean": 4692.4,
"valid_targets_min": 300
},
{
"epoch": 3.993558776167472,
"grad_norm": 0.539195337968872,
"learning_rate": 1.858778070563422e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1887316107749939,
"step": 2480,
"valid_targets_mean": 4306.7,
"valid_targets_min": 590
},
{
"epoch": 4.001610305958132,
"grad_norm": 0.5374780928948082,
"learning_rate": 1.8507686195451918e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25074928998947144,
"step": 2485,
"valid_targets_mean": 4598.8,
"valid_targets_min": 374
},
{
"epoch": 4.009661835748792,
"grad_norm": 0.4944011317477905,
"learning_rate": 1.8427615745602667e-05,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15997666120529175,
"step": 2490,
"valid_targets_mean": 4936.9,
"valid_targets_min": 1591
},
{
"epoch": 4.017713365539453,
"grad_norm": 0.4765635224384645,
"learning_rate": 1.834757064704933e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1592136025428772,
"step": 2495,
"valid_targets_mean": 4652.1,
"valid_targets_min": 1149
},
{
"epoch": 4.025764895330113,
"grad_norm": 0.4956167235108182,
"learning_rate": 1.826755219034603e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19604167342185974,
"step": 2500,
"valid_targets_mean": 4386.4,
"valid_targets_min": 380
},
{
"epoch": 4.033816425120773,
"grad_norm": 0.45476926402320006,
"learning_rate": 1.818756166561733e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1637008637189865,
"step": 2505,
"valid_targets_mean": 4699.8,
"valid_targets_min": 1197
},
{
"epoch": 4.041867954911433,
"grad_norm": 0.43733602489225165,
"learning_rate": 1.8107600362537473e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16251038014888763,
"step": 2510,
"valid_targets_mean": 4847.2,
"valid_targets_min": 1813
},
{
"epoch": 4.049919484702094,
"grad_norm": 0.49193894405362015,
"learning_rate": 1.8027669570309572e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16793620586395264,
"step": 2515,
"valid_targets_mean": 4591.9,
"valid_targets_min": 506
},
{
"epoch": 4.057971014492754,
"grad_norm": 0.5075017593056104,
"learning_rate": 1.7947770577644787e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1729605346918106,
"step": 2520,
"valid_targets_mean": 4395.8,
"valid_targets_min": 656
},
{
"epoch": 4.066022544283414,
"grad_norm": 0.499304090315969,
"learning_rate": 1.786790467274161e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17558912932872772,
"step": 2525,
"valid_targets_mean": 4637.6,
"valid_targets_min": 2011
},
{
"epoch": 4.074074074074074,
"grad_norm": 0.5559504833423238,
"learning_rate": 1.778807314326505e-05,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18689918518066406,
"step": 2530,
"valid_targets_mean": 3930.3,
"valid_targets_min": 548
},
{
"epoch": 4.082125603864735,
"grad_norm": 0.47641769475056645,
"learning_rate": 1.7708277276325886e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1637909710407257,
"step": 2535,
"valid_targets_mean": 5154.6,
"valid_targets_min": 1826
},
{
"epoch": 4.090177133655395,
"grad_norm": 0.5182362997358064,
"learning_rate": 1.762851835845992e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18916486203670502,
"step": 2540,
"valid_targets_mean": 4544.1,
"valid_targets_min": 570
},
{
"epoch": 4.098228663446055,
"grad_norm": 0.4862343355871757,
"learning_rate": 1.754879767560723e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18593139946460724,
"step": 2545,
"valid_targets_mean": 4532.4,
"valid_targets_min": 1521
},
{
"epoch": 4.106280193236715,
"grad_norm": 0.527960071470203,
"learning_rate": 1.746911651309144e-05,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19690777361392975,
"step": 2550,
"valid_targets_mean": 3843.6,
"valid_targets_min": 881
},
{
"epoch": 4.114331723027375,
"grad_norm": 0.5103425212083436,
"learning_rate": 1.7389476155598974e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21908551454544067,
"step": 2555,
"valid_targets_mean": 5082.4,
"valid_targets_min": 784
},
{
"epoch": 4.122383252818035,
"grad_norm": 0.7756087805548777,
"learning_rate": 1.7309877887158388e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1794763058423996,
"step": 2560,
"valid_targets_mean": 2992.2,
"valid_targets_min": 467
},
{
"epoch": 4.130434782608695,
"grad_norm": 0.4567684656881922,
"learning_rate": 1.723032299111964e-05,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15088678896427155,
"step": 2565,
"valid_targets_mean": 4922.8,
"valid_targets_min": 1327
},
{
"epoch": 4.138486312399356,
"grad_norm": 0.5425918961875108,
"learning_rate": 1.7150812750133382e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1673865020275116,
"step": 2570,
"valid_targets_mean": 3965.9,
"valid_targets_min": 1407
},
{
"epoch": 4.146537842190016,
"grad_norm": 0.6838407873867918,
"learning_rate": 1.707134844613032e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15312550961971283,
"step": 2575,
"valid_targets_mean": 4199.9,
"valid_targets_min": 1891
},
{
"epoch": 4.154589371980676,
"grad_norm": 0.5385560587074719,
"learning_rate": 1.699193136030052e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17279349267482758,
"step": 2580,
"valid_targets_mean": 3938.8,
"valid_targets_min": 880
},
{
"epoch": 4.162640901771336,
"grad_norm": 0.5502968325727028,
"learning_rate": 1.6912562773072765e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18601390719413757,
"step": 2585,
"valid_targets_mean": 4653.2,
"valid_targets_min": 2040
},
{
"epoch": 4.170692431561997,
"grad_norm": 0.5862578517681709,
"learning_rate": 1.6833243964093877e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2094813883304596,
"step": 2590,
"valid_targets_mean": 4215.5,
"valid_targets_min": 1508
},
{
"epoch": 4.178743961352657,
"grad_norm": 0.525233464465349,
"learning_rate": 1.6753976212208137e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17922204732894897,
"step": 2595,
"valid_targets_mean": 3851.4,
"valid_targets_min": 667
},
{
"epoch": 4.186795491143317,
"grad_norm": 0.6610861468502892,
"learning_rate": 1.667476079543664e-05,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17614664137363434,
"step": 2600,
"valid_targets_mean": 3052.1,
"valid_targets_min": 691
},
{
"epoch": 4.194847020933977,
"grad_norm": 0.5630100784699484,
"learning_rate": 1.659559899095667e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20966169238090515,
"step": 2605,
"valid_targets_mean": 5309.3,
"valid_targets_min": 1187
},
{
"epoch": 4.202898550724638,
"grad_norm": 0.6807488645292253,
"learning_rate": 1.651649207508114e-05,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19908779859542847,
"step": 2610,
"valid_targets_mean": 4216.5,
"valid_targets_min": 1027
},
{
"epoch": 4.210950080515298,
"grad_norm": 0.49692416499926767,
"learning_rate": 1.643744132323801e-05,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19740644097328186,
"step": 2615,
"valid_targets_mean": 4830.8,
"valid_targets_min": 1913
},
{
"epoch": 4.219001610305958,
"grad_norm": 0.6036326467813666,
"learning_rate": 1.6358448009949714e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22196456789970398,
"step": 2620,
"valid_targets_mean": 5333.3,
"valid_targets_min": 2355
},
{
"epoch": 4.2270531400966185,
"grad_norm": 0.4829391874239536,
"learning_rate": 1.6279513408812603e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1743869185447693,
"step": 2625,
"valid_targets_mean": 5413.8,
"valid_targets_min": 1251
},
{
"epoch": 4.235104669887279,
"grad_norm": 0.5048080599206834,
"learning_rate": 1.620063879247643e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16595719754695892,
"step": 2630,
"valid_targets_mean": 3924.2,
"valid_targets_min": 443
},
{
"epoch": 4.243156199677939,
"grad_norm": 0.46752510731782826,
"learning_rate": 1.6121825432623827e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1762651652097702,
"step": 2635,
"valid_targets_mean": 5055.4,
"valid_targets_min": 1403
},
{
"epoch": 4.251207729468599,
"grad_norm": 0.4797644865040805,
"learning_rate": 1.6043074599949785e-05,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17031241953372955,
"step": 2640,
"valid_targets_mean": 4893.6,
"valid_targets_min": 966
},
{
"epoch": 4.2592592592592595,
"grad_norm": 1.0165849437996184,
"learning_rate": 1.5964387564141192e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19583508372306824,
"step": 2645,
"valid_targets_mean": 4988.9,
"valid_targets_min": 1611
},
{
"epoch": 4.26731078904992,
"grad_norm": 0.6039054133342181,
"learning_rate": 1.588576559385635e-05,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17843933403491974,
"step": 2650,
"valid_targets_mean": 4234.7,
"valid_targets_min": 1211
},
{
"epoch": 4.27536231884058,
"grad_norm": 0.512856167089867,
"learning_rate": 1.5807209956704505e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1996535062789917,
"step": 2655,
"valid_targets_mean": 4500.6,
"valid_targets_min": 1506
},
{
"epoch": 4.28341384863124,
"grad_norm": 0.4991515466828228,
"learning_rate": 1.5728721919225428e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14569713175296783,
"step": 2660,
"valid_targets_mean": 4720.1,
"valid_targets_min": 1211
},
{
"epoch": 4.291465378421901,
"grad_norm": 0.9601831661650259,
"learning_rate": 1.5650302746869004e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1880815625190735,
"step": 2665,
"valid_targets_mean": 4171.6,
"valid_targets_min": 833
},
{
"epoch": 4.29951690821256,
"grad_norm": 0.4412736536027149,
"learning_rate": 1.5571953703974813e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16794951260089874,
"step": 2670,
"valid_targets_mean": 5724.5,
"valid_targets_min": 2565
},
{
"epoch": 4.30756843800322,
"grad_norm": 0.49660094639156666,
"learning_rate": 1.5493676053751747e-05,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17535799741744995,
"step": 2675,
"valid_targets_mean": 4800.3,
"valid_targets_min": 1829
},
{
"epoch": 4.3156199677938805,
"grad_norm": 0.5456531223844872,
"learning_rate": 1.5415471058257638e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17335663735866547,
"step": 2680,
"valid_targets_mean": 4570.4,
"valid_targets_min": 1658
},
{
"epoch": 4.323671497584541,
"grad_norm": 0.45678206025420953,
"learning_rate": 1.533733997837893e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.169780433177948,
"step": 2685,
"valid_targets_mean": 4216.1,
"valid_targets_min": 1449
},
{
"epoch": 4.331723027375201,
"grad_norm": 0.5415606665772222,
"learning_rate": 1.5259284073810333e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16021227836608887,
"step": 2690,
"valid_targets_mean": 3275.1,
"valid_targets_min": 984
},
{
"epoch": 4.339774557165861,
"grad_norm": 0.5136691048212793,
"learning_rate": 1.5181304603034513e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1827298104763031,
"step": 2695,
"valid_targets_mean": 4889.6,
"valid_targets_min": 1238
},
{
"epoch": 4.3478260869565215,
"grad_norm": 1.4914173173538663,
"learning_rate": 1.5103402823301819e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18776141107082367,
"step": 2700,
"valid_targets_mean": 4532.6,
"valid_targets_min": 850
},
{
"epoch": 4.355877616747182,
"grad_norm": 0.5083803805655037,
"learning_rate": 1.5025579990609973e-05,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16755394637584686,
"step": 2705,
"valid_targets_mean": 4128.1,
"valid_targets_min": 379
},
{
"epoch": 4.363929146537842,
"grad_norm": 0.500974762279468,
"learning_rate": 1.4947837359683882e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17978541553020477,
"step": 2710,
"valid_targets_mean": 5342.4,
"valid_targets_min": 2152
},
{
"epoch": 4.371980676328502,
"grad_norm": 0.5603545589277986,
"learning_rate": 1.487017618395534e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.198044091463089,
"step": 2715,
"valid_targets_mean": 4740.4,
"valid_targets_min": 1746
},
{
"epoch": 4.3800322061191626,
"grad_norm": 0.4771112752411543,
"learning_rate": 1.479259771554288e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1699572205543518,
"step": 2720,
"valid_targets_mean": 4872.8,
"valid_targets_min": 448
},
{
"epoch": 4.388083735909823,
"grad_norm": 0.521661536652827,
"learning_rate": 1.4715103205231545e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18613924086093903,
"step": 2725,
"valid_targets_mean": 4061.7,
"valid_targets_min": 995
},
{
"epoch": 4.396135265700483,
"grad_norm": 0.537250383283014,
"learning_rate": 1.463769390245273e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.178946852684021,
"step": 2730,
"valid_targets_mean": 4061.8,
"valid_targets_min": 900
},
{
"epoch": 4.404186795491143,
"grad_norm": 0.5244437127559632,
"learning_rate": 1.4560371055264052e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18043842911720276,
"step": 2735,
"valid_targets_mean": 4802.7,
"valid_targets_min": 1843
},
{
"epoch": 4.412238325281804,
"grad_norm": 0.5146870682156327,
"learning_rate": 1.448313591032922e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17479149997234344,
"step": 2740,
"valid_targets_mean": 5214.2,
"valid_targets_min": 1866
},
{
"epoch": 4.420289855072464,
"grad_norm": 0.4691547439815975,
"learning_rate": 1.4405989712897923e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18224862217903137,
"step": 2745,
"valid_targets_mean": 5050.6,
"valid_targets_min": 1427
},
{
"epoch": 4.428341384863124,
"grad_norm": 0.5424155500541844,
"learning_rate": 1.4328933706785782e-05,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1883089393377304,
"step": 2750,
"valid_targets_mean": 4057.4,
"valid_targets_min": 854
},
{
"epoch": 4.436392914653784,
"grad_norm": 0.5100283152717094,
"learning_rate": 1.4251969134354247e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16344183683395386,
"step": 2755,
"valid_targets_mean": 4199.4,
"valid_targets_min": 1557
},
{
"epoch": 4.444444444444445,
"grad_norm": 0.5071596893081406,
"learning_rate": 1.4175097236490627e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1783141791820526,
"step": 2760,
"valid_targets_mean": 4905.3,
"valid_targets_min": 383
},
{
"epoch": 4.452495974235105,
"grad_norm": 0.4808405938396642,
"learning_rate": 1.409831925258805e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19857333600521088,
"step": 2765,
"valid_targets_mean": 4961.1,
"valid_targets_min": 847
},
{
"epoch": 4.460547504025765,
"grad_norm": 0.48057741594526054,
"learning_rate": 1.4021636420525466e-05,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1644965559244156,
"step": 2770,
"valid_targets_mean": 4509.1,
"valid_targets_min": 1227
},
{
"epoch": 4.468599033816425,
"grad_norm": 0.5128321881887902,
"learning_rate": 1.3945049976647726e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1749866008758545,
"step": 2775,
"valid_targets_mean": 4825.0,
"valid_targets_min": 1201
},
{
"epoch": 4.476650563607086,
"grad_norm": 0.6327024505387485,
"learning_rate": 1.3868561155745628e-05,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19712504744529724,
"step": 2780,
"valid_targets_mean": 4430.3,
"valid_targets_min": 703
},
{
"epoch": 4.484702093397746,
"grad_norm": 0.4913167577071679,
"learning_rate": 1.3792171191036001e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15714874863624573,
"step": 2785,
"valid_targets_mean": 4104.7,
"valid_targets_min": 1663
},
{
"epoch": 4.492753623188406,
"grad_norm": 0.5394186960786538,
"learning_rate": 1.3715881314141835e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19951429963111877,
"step": 2790,
"valid_targets_mean": 4620.1,
"valid_targets_min": 1843
},
{
"epoch": 4.500805152979066,
"grad_norm": 0.5953737763754138,
"learning_rate": 1.3639692755072429e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2141798585653305,
"step": 2795,
"valid_targets_mean": 4660.8,
"valid_targets_min": 1401
},
{
"epoch": 4.508856682769727,
"grad_norm": 0.5453366269316137,
"learning_rate": 1.3563606742203548e-05,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20897048711776733,
"step": 2800,
"valid_targets_mean": 4447.4,
"valid_targets_min": 1113
},
{
"epoch": 4.516908212560386,
"grad_norm": 0.531617180983723,
"learning_rate": 1.3487624502257598e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20468959212303162,
"step": 2805,
"valid_targets_mean": 4891.9,
"valid_targets_min": 2624
},
{
"epoch": 4.524959742351046,
"grad_norm": 1.0175978905323302,
"learning_rate": 1.3411747260283905e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1867702454328537,
"step": 2810,
"valid_targets_mean": 4380.1,
"valid_targets_min": 800
},
{
"epoch": 4.533011272141707,
"grad_norm": 0.5172120222306495,
"learning_rate": 1.333597623963892e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17019790410995483,
"step": 2815,
"valid_targets_mean": 4795.6,
"valid_targets_min": 626
},
{
"epoch": 4.541062801932367,
"grad_norm": 0.6059009807629652,
"learning_rate": 1.3260312661966487e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17550814151763916,
"step": 2820,
"valid_targets_mean": 5061.1,
"valid_targets_min": 1263
},
{
"epoch": 4.549114331723027,
"grad_norm": 0.613180864431363,
"learning_rate": 1.3184757747178187e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19658298790454865,
"step": 2825,
"valid_targets_mean": 5041.3,
"valid_targets_min": 1795
},
{
"epoch": 4.557165861513687,
"grad_norm": 0.5633900947396653,
"learning_rate": 1.3109312713433642e-05,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18244323134422302,
"step": 2830,
"valid_targets_mean": 4282.2,
"valid_targets_min": 543
},
{
"epoch": 4.565217391304348,
"grad_norm": 0.9588780998775635,
"learning_rate": 1.3033978777120861e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1690833568572998,
"step": 2835,
"valid_targets_mean": 3991.0,
"valid_targets_min": 1088
},
{
"epoch": 4.573268921095008,
"grad_norm": 0.5205077973662069,
"learning_rate": 1.2958757152836671e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22376713156700134,
"step": 2840,
"valid_targets_mean": 4458.4,
"valid_targets_min": 2143
},
{
"epoch": 4.581320450885668,
"grad_norm": 0.5253874104264332,
"learning_rate": 1.2883649053367106e-05,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1675848662853241,
"step": 2845,
"valid_targets_mean": 4003.0,
"valid_targets_min": 845
},
{
"epoch": 4.5893719806763285,
"grad_norm": 0.5452379881212879,
"learning_rate": 1.2808655689667846e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1796257197856903,
"step": 2850,
"valid_targets_mean": 4152.3,
"valid_targets_min": 455
},
{
"epoch": 4.597423510466989,
"grad_norm": 0.5239905621350787,
"learning_rate": 1.2733778270844712e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18232783675193787,
"step": 2855,
"valid_targets_mean": 4419.6,
"valid_targets_min": 529
},
{
"epoch": 4.605475040257649,
"grad_norm": 0.5607032815508621,
"learning_rate": 1.265901800413416e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17835384607315063,
"step": 2860,
"valid_targets_mean": 3395.8,
"valid_targets_min": 627
},
{
"epoch": 4.613526570048309,
"grad_norm": 0.9496967272226038,
"learning_rate": 1.2584376094883832e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17716357111930847,
"step": 2865,
"valid_targets_mean": 4483.6,
"valid_targets_min": 710
},
{
"epoch": 4.6215780998389695,
"grad_norm": 0.7842117859067653,
"learning_rate": 1.250985374653311e-05,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17786236107349396,
"step": 2870,
"valid_targets_mean": 4693.0,
"valid_targets_min": 1134
},
{
"epoch": 4.62962962962963,
"grad_norm": 0.5033684151280889,
"learning_rate": 1.2435452160593698e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17148058116436005,
"step": 2875,
"valid_targets_mean": 4303.3,
"valid_targets_min": 1429
},
{
"epoch": 4.63768115942029,
"grad_norm": 0.5032006756891246,
"learning_rate": 1.2361172536630288e-05,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16900071501731873,
"step": 2880,
"valid_targets_mean": 4471.4,
"valid_targets_min": 1507
},
{
"epoch": 4.64573268921095,
"grad_norm": 0.5449401674057853,
"learning_rate": 1.2287016072241195e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19873306155204773,
"step": 2885,
"valid_targets_mean": 4050.9,
"valid_targets_min": 321
},
{
"epoch": 4.6537842190016105,
"grad_norm": 0.5002283792241559,
"learning_rate": 1.221298396303904e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17124618589878082,
"step": 2890,
"valid_targets_mean": 5187.2,
"valid_targets_min": 1399
},
{
"epoch": 4.661835748792271,
"grad_norm": 0.4706451280493202,
"learning_rate": 1.2139077402631495e-05,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14620235562324524,
"step": 2895,
"valid_targets_mean": 4477.4,
"valid_targets_min": 1454
},
{
"epoch": 4.669887278582931,
"grad_norm": 0.5330785987823722,
"learning_rate": 1.2065297582602037e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17816966772079468,
"step": 2900,
"valid_targets_mean": 4355.4,
"valid_targets_min": 2065
},
{
"epoch": 4.677938808373591,
"grad_norm": 0.4942305241126504,
"learning_rate": 1.199164569249071e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18558406829833984,
"step": 2905,
"valid_targets_mean": 4951.6,
"valid_targets_min": 1299
},
{
"epoch": 4.685990338164252,
"grad_norm": 0.537628904978011,
"learning_rate": 1.191812291977497e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19403138756752014,
"step": 2910,
"valid_targets_mean": 4024.0,
"valid_targets_min": 1450
},
{
"epoch": 4.694041867954912,
"grad_norm": 0.5439040484202802,
"learning_rate": 1.1844730449850546e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19234639406204224,
"step": 2915,
"valid_targets_mean": 5036.8,
"valid_targets_min": 1058
},
{
"epoch": 4.702093397745571,
"grad_norm": 0.583242909808935,
"learning_rate": 1.1771469466012309e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20131342113018036,
"step": 2920,
"valid_targets_mean": 4106.1,
"valid_targets_min": 983
},
{
"epoch": 4.710144927536232,
"grad_norm": 0.5038233636197879,
"learning_rate": 1.1698341149435196e-05,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1684148907661438,
"step": 2925,
"valid_targets_mean": 4802.6,
"valid_targets_min": 1952
},
{
"epoch": 4.718196457326892,
"grad_norm": 0.4600414999991662,
"learning_rate": 1.1625346679155179e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15985998511314392,
"step": 2930,
"valid_targets_mean": 4799.9,
"valid_targets_min": 1859
},
{
"epoch": 4.726247987117552,
"grad_norm": 0.4936755991303249,
"learning_rate": 1.1552487232050242e-05,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17861491441726685,
"step": 2935,
"valid_targets_mean": 4306.8,
"valid_targets_min": 1605
},
{
"epoch": 4.734299516908212,
"grad_norm": 0.44442070244437953,
"learning_rate": 1.1479763982821414e-05,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17784011363983154,
"step": 2940,
"valid_targets_mean": 5608.9,
"valid_targets_min": 1956
},
{
"epoch": 4.7423510466988725,
"grad_norm": 0.5637401886713175,
"learning_rate": 1.1407178103973834e-05,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18229396641254425,
"step": 2945,
"valid_targets_mean": 3870.8,
"valid_targets_min": 864
},
{
"epoch": 4.750402576489533,
"grad_norm": 0.45308334583470944,
"learning_rate": 1.1334730765797843e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19959984719753265,
"step": 2950,
"valid_targets_mean": 5085.4,
"valid_targets_min": 1791
},
{
"epoch": 4.758454106280193,
"grad_norm": 0.5571182515606663,
"learning_rate": 1.1262423136350087e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22160165011882782,
"step": 2955,
"valid_targets_mean": 3792.0,
"valid_targets_min": 1099
},
{
"epoch": 4.766505636070853,
"grad_norm": 0.5901554994508056,
"learning_rate": 1.1190256381434738e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17873704433441162,
"step": 2960,
"valid_targets_mean": 3899.3,
"valid_targets_min": 778
},
{
"epoch": 4.774557165861514,
"grad_norm": 0.5158336477050018,
"learning_rate": 1.1118231664584674e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1886855959892273,
"step": 2965,
"valid_targets_mean": 4861.4,
"valid_targets_min": 1898
},
{
"epoch": 4.782608695652174,
"grad_norm": 0.4887213717876692,
"learning_rate": 1.1046350147042681e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20001167058944702,
"step": 2970,
"valid_targets_mean": 4675.2,
"valid_targets_min": 952
},
{
"epoch": 4.790660225442834,
"grad_norm": 0.48768071610571156,
"learning_rate": 1.0974612987742807e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18149898946285248,
"step": 2975,
"valid_targets_mean": 4411.8,
"valid_targets_min": 1129
},
{
"epoch": 4.798711755233494,
"grad_norm": 0.4873268036344298,
"learning_rate": 1.0903021343291613e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20546609163284302,
"step": 2980,
"valid_targets_mean": 4418.5,
"valid_targets_min": 608
},
{
"epoch": 4.806763285024155,
"grad_norm": 0.5054671612514106,
"learning_rate": 1.0831576367949555e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18941310048103333,
"step": 2985,
"valid_targets_mean": 4868.4,
"valid_targets_min": 2311
},
{
"epoch": 4.814814814814815,
"grad_norm": 0.5242076423511247,
"learning_rate": 1.0760279213612362e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16793029010295868,
"step": 2990,
"valid_targets_mean": 5404.2,
"valid_targets_min": 2117
},
{
"epoch": 4.822866344605475,
"grad_norm": 0.6828436818331252,
"learning_rate": 1.068913102979248e-05,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19285649061203003,
"step": 2995,
"valid_targets_mean": 3826.8,
"valid_targets_min": 1070
},
{
"epoch": 4.830917874396135,
"grad_norm": 0.47219942742537285,
"learning_rate": 1.0618132963600507e-05,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18546539545059204,
"step": 3000,
"valid_targets_mean": 5087.4,
"valid_targets_min": 1959
},
{
"epoch": 4.838969404186796,
"grad_norm": 0.4457820811603146,
"learning_rate": 1.0547286159726743e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19360345602035522,
"step": 3005,
"valid_targets_mean": 5867.6,
"valid_targets_min": 1035
},
{
"epoch": 4.847020933977456,
"grad_norm": 0.5847539672595908,
"learning_rate": 1.047659176042268e-05,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16391941905021667,
"step": 3010,
"valid_targets_mean": 3891.6,
"valid_targets_min": 578
},
{
"epoch": 4.855072463768116,
"grad_norm": 0.5080943188478495,
"learning_rate": 1.0406050905482647e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1736719310283661,
"step": 3015,
"valid_targets_mean": 4204.6,
"valid_targets_min": 631
},
{
"epoch": 4.8631239935587764,
"grad_norm": 0.4950021070139557,
"learning_rate": 1.033566473222539e-05,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16896328330039978,
"step": 3020,
"valid_targets_mean": 5143.3,
"valid_targets_min": 2767
},
{
"epoch": 4.871175523349437,
"grad_norm": 0.5149173904980839,
"learning_rate": 1.0265434375475744e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1894487589597702,
"step": 3025,
"valid_targets_mean": 4708.5,
"valid_targets_min": 656
},
{
"epoch": 4.879227053140097,
"grad_norm": 0.5128722203180325,
"learning_rate": 1.0195360967546342e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18005244433879852,
"step": 3030,
"valid_targets_mean": 5025.9,
"valid_targets_min": 1716
},
{
"epoch": 4.887278582930757,
"grad_norm": 0.5010958581493115,
"learning_rate": 1.0125445638219369e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19406850636005402,
"step": 3035,
"valid_targets_mean": 4813.1,
"valid_targets_min": 908
},
{
"epoch": 4.8953301127214175,
"grad_norm": 0.5210294803713594,
"learning_rate": 1.00556895147283e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16892248392105103,
"step": 3040,
"valid_targets_mean": 3893.8,
"valid_targets_min": 1273
},
{
"epoch": 4.903381642512077,
"grad_norm": 0.6293372498483756,
"learning_rate": 9.986093721739793e-06,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1870511919260025,
"step": 3045,
"valid_targets_mean": 3776.4,
"valid_targets_min": 296
},
{
"epoch": 4.911433172302738,
"grad_norm": 0.5480638562689124,
"learning_rate": 9.916659381335524e-06,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15634512901306152,
"step": 3050,
"valid_targets_mean": 4189.9,
"valid_targets_min": 1195
},
{
"epoch": 4.919484702093397,
"grad_norm": 0.5734404649785564,
"learning_rate": 9.847387612994065e-06,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1715972125530243,
"step": 3055,
"valid_targets_mean": 4624.1,
"valid_targets_min": 999
},
{
"epoch": 4.927536231884058,
"grad_norm": 0.4755904568874477,
"learning_rate": 9.778279533572894e-06,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1521787941455841,
"step": 3060,
"valid_targets_mean": 4754.1,
"valid_targets_min": 1047
},
{
"epoch": 4.935587761674718,
"grad_norm": 0.7122666442809198,
"learning_rate": 9.70933625729035e-06,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17114746570587158,
"step": 3065,
"valid_targets_mean": 5142.9,
"valid_targets_min": 1175
},
{
"epoch": 4.943639291465378,
"grad_norm": 0.7359607180808936,
"learning_rate": 9.640558895707681e-06,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18806086480617523,
"step": 3070,
"valid_targets_mean": 4064.7,
"valid_targets_min": 1615
},
{
"epoch": 4.951690821256038,
"grad_norm": 0.5379368590841539,
"learning_rate": 9.571948557711104e-06,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17751240730285645,
"step": 3075,
"valid_targets_mean": 3381.2,
"valid_targets_min": 249
},
{
"epoch": 4.959742351046699,
"grad_norm": 0.4777499224064591,
"learning_rate": 9.503506349493959e-06,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1592390239238739,
"step": 3080,
"valid_targets_mean": 4629.0,
"valid_targets_min": 1254
},
{
"epoch": 4.967793880837359,
"grad_norm": 0.5139616446857665,
"learning_rate": 9.435233374538848e-06,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18165704607963562,
"step": 3085,
"valid_targets_mean": 4665.1,
"valid_targets_min": 1736
},
{
"epoch": 4.975845410628019,
"grad_norm": 0.5162555365137094,
"learning_rate": 9.367130733599863e-06,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19067494571208954,
"step": 3090,
"valid_targets_mean": 4688.7,
"valid_targets_min": 1872
},
{
"epoch": 4.9838969404186795,
"grad_norm": 0.569575182274062,
"learning_rate": 9.299199524684815e-06,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16250163316726685,
"step": 3095,
"valid_targets_mean": 4311.8,
"valid_targets_min": 1994
},
{
"epoch": 4.99194847020934,
"grad_norm": 0.5520222968798817,
"learning_rate": 9.23144084303756e-06,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1921304166316986,
"step": 3100,
"valid_targets_mean": 4493.3,
"valid_targets_min": 2050
},
{
"epoch": 5.0,
"grad_norm": 0.7884221741023202,
"learning_rate": 9.163855781120302e-06,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20062533020973206,
"step": 3105,
"valid_targets_mean": 3796.8,
"valid_targets_min": 374
},
{
"epoch": 5.00805152979066,
"grad_norm": 0.5195634108838502,
"learning_rate": 9.096445428596026e-06,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1869000345468521,
"step": 3110,
"valid_targets_mean": 4366.8,
"valid_targets_min": 1253
},
{
"epoch": 5.0161030595813205,
"grad_norm": 0.5278497870764118,
"learning_rate": 9.029210872310884e-06,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1439373940229416,
"step": 3115,
"valid_targets_mean": 4365.9,
"valid_targets_min": 554
},
{
"epoch": 5.024154589371981,
"grad_norm": 0.5284272892101102,
"learning_rate": 8.962153196276713e-06,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14253228902816772,
"step": 3120,
"valid_targets_mean": 4662.7,
"valid_targets_min": 312
},
{
"epoch": 5.032206119162641,
"grad_norm": 0.5474998021835664,
"learning_rate": 8.895273481653527e-06,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17854666709899902,
"step": 3125,
"valid_targets_mean": 4428.5,
"valid_targets_min": 627
},
{
"epoch": 5.040257648953301,
"grad_norm": 1.2329548853780503,
"learning_rate": 8.828572806732103e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1708088219165802,
"step": 3130,
"valid_targets_mean": 4686.6,
"valid_targets_min": 1916
},
{
"epoch": 5.048309178743962,
"grad_norm": 0.5097310950347612,
"learning_rate": 8.76205224691659e-06,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17174428701400757,
"step": 3135,
"valid_targets_mean": 4785.3,
"valid_targets_min": 1860
},
{
"epoch": 5.056360708534622,
"grad_norm": 0.46008600902359126,
"learning_rate": 8.695712874707169e-06,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16250503063201904,
"step": 3140,
"valid_targets_mean": 4901.8,
"valid_targets_min": 402
},
{
"epoch": 5.064412238325282,
"grad_norm": 0.47656692190311706,
"learning_rate": 8.629555759682756e-06,
"loss": 0.1676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15433499217033386,
"step": 3145,
"valid_targets_mean": 5206.9,
"valid_targets_min": 892
},
{
"epoch": 5.072463768115942,
"grad_norm": 0.46684035634871635,
"learning_rate": 8.563581968483774e-06,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15580695867538452,
"step": 3150,
"valid_targets_mean": 4968.5,
"valid_targets_min": 1514
},
{
"epoch": 5.080515297906603,
"grad_norm": 0.4817709325187039,
"learning_rate": 8.497792564794935e-06,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1596037745475769,
"step": 3155,
"valid_targets_mean": 4873.9,
"valid_targets_min": 656
},
{
"epoch": 5.088566827697263,
"grad_norm": 0.49561234768208556,
"learning_rate": 8.432188609328112e-06,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18620729446411133,
"step": 3160,
"valid_targets_mean": 4277.6,
"valid_targets_min": 429
},
{
"epoch": 5.096618357487923,
"grad_norm": 0.5342689640020111,
"learning_rate": 8.366771159805222e-06,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1623041033744812,
"step": 3165,
"valid_targets_mean": 3849.9,
"valid_targets_min": 1692
},
{
"epoch": 5.1046698872785825,
"grad_norm": 0.5558864483320473,
"learning_rate": 8.301541270941178e-06,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19302302598953247,
"step": 3170,
"valid_targets_mean": 3954.7,
"valid_targets_min": 894
},
{
"epoch": 5.112721417069243,
"grad_norm": 0.5483085784932584,
"learning_rate": 8.236499994426886e-06,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17752034962177277,
"step": 3175,
"valid_targets_mean": 4114.2,
"valid_targets_min": 321
},
{
"epoch": 5.120772946859903,
"grad_norm": 0.5129349338303597,
"learning_rate": 8.171648378912272e-06,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1786811649799347,
"step": 3180,
"valid_targets_mean": 5010.1,
"valid_targets_min": 1693
},
{
"epoch": 5.128824476650563,
"grad_norm": 0.47618052790196236,
"learning_rate": 8.1069874699894e-06,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14539986848831177,
"step": 3185,
"valid_targets_mean": 4915.1,
"valid_targets_min": 1295
},
{
"epoch": 5.1368760064412236,
"grad_norm": 0.5408793562526828,
"learning_rate": 8.042518310175607e-06,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1692083477973938,
"step": 3190,
"valid_targets_mean": 4689.8,
"valid_targets_min": 693
},
{
"epoch": 5.144927536231884,
"grad_norm": 0.427889087391779,
"learning_rate": 7.978241938896679e-06,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13784319162368774,
"step": 3195,
"valid_targets_mean": 4693.8,
"valid_targets_min": 2255
},
{
"epoch": 5.152979066022544,
"grad_norm": 0.5199711838065452,
"learning_rate": 7.914159392470118e-06,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16833321750164032,
"step": 3200,
"valid_targets_mean": 4362.7,
"valid_targets_min": 848
},
{
"epoch": 5.161030595813204,
"grad_norm": 0.47753654786071936,
"learning_rate": 7.850271704088396e-06,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14919407665729523,
"step": 3205,
"valid_targets_mean": 4483.1,
"valid_targets_min": 2048
},
{
"epoch": 5.169082125603865,
"grad_norm": 0.47729884629127567,
"learning_rate": 7.786579903802342e-06,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15295487642288208,
"step": 3210,
"valid_targets_mean": 4766.6,
"valid_targets_min": 1817
},
{
"epoch": 5.177133655394525,
"grad_norm": 0.5186129305793417,
"learning_rate": 7.723085018504512e-06,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1621103286743164,
"step": 3215,
"valid_targets_mean": 4525.6,
"valid_targets_min": 529
},
{
"epoch": 5.185185185185185,
"grad_norm": 0.562831677149766,
"learning_rate": 7.659788071912612e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16404971480369568,
"step": 3220,
"valid_targets_mean": 3796.4,
"valid_targets_min": 1477
},
{
"epoch": 5.193236714975845,
"grad_norm": 0.48044538637214657,
"learning_rate": 7.59669008455304e-06,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16649338603019714,
"step": 3225,
"valid_targets_mean": 5432.8,
"valid_targets_min": 1858
},
{
"epoch": 5.201288244766506,
"grad_norm": 0.5790721887585502,
"learning_rate": 7.533792073744395e-06,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17744669318199158,
"step": 3230,
"valid_targets_mean": 4592.4,
"valid_targets_min": 935
},
{
"epoch": 5.209339774557166,
"grad_norm": 0.5717495383522813,
"learning_rate": 7.471095053581086e-06,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1721886694431305,
"step": 3235,
"valid_targets_mean": 4073.8,
"valid_targets_min": 823
},
{
"epoch": 5.217391304347826,
"grad_norm": 0.5319904040215578,
"learning_rate": 7.4086000349169864e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15195900201797485,
"step": 3240,
"valid_targets_mean": 4558.5,
"valid_targets_min": 296
},
{
"epoch": 5.225442834138486,
"grad_norm": 0.6199276315504786,
"learning_rate": 7.346308025349138e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16166193783283234,
"step": 3245,
"valid_targets_mean": 3986.2,
"valid_targets_min": 848
},
{
"epoch": 5.233494363929147,
"grad_norm": 0.6244366963899998,
"learning_rate": 7.2842200292014805e-06,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17683975398540497,
"step": 3250,
"valid_targets_mean": 3601.2,
"valid_targets_min": 760
},
{
"epoch": 5.241545893719807,
"grad_norm": 0.5241028588187276,
"learning_rate": 7.2223370475086896e-06,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1595272421836853,
"step": 3255,
"valid_targets_mean": 4269.6,
"valid_targets_min": 1279
},
{
"epoch": 5.249597423510467,
"grad_norm": 0.4473386775088612,
"learning_rate": 7.160660078000028e-06,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16722847521305084,
"step": 3260,
"valid_targets_mean": 5286.9,
"valid_targets_min": 2305
},
{
"epoch": 5.2576489533011275,
"grad_norm": 0.5009816722230198,
"learning_rate": 7.099190115083259e-06,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17297816276550293,
"step": 3265,
"valid_targets_mean": 4930.7,
"valid_targets_min": 2434
},
{
"epoch": 5.265700483091788,
"grad_norm": 0.5600085277272723,
"learning_rate": 7.037928149828608e-06,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18866902589797974,
"step": 3270,
"valid_targets_mean": 4635.0,
"valid_targets_min": 1444
},
{
"epoch": 5.273752012882448,
"grad_norm": 0.5153595033812705,
"learning_rate": 6.97687516995279e-06,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15133386850357056,
"step": 3275,
"valid_targets_mean": 4087.8,
"valid_targets_min": 1111
},
{
"epoch": 5.281803542673108,
"grad_norm": 0.5588332326443939,
"learning_rate": 6.916032159803088e-06,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20162728428840637,
"step": 3280,
"valid_targets_mean": 4709.9,
"valid_targets_min": 2151
},
{
"epoch": 5.2898550724637685,
"grad_norm": 0.5640390114972573,
"learning_rate": 6.855400100341458e-06,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17432144284248352,
"step": 3285,
"valid_targets_mean": 3788.3,
"valid_targets_min": 543
},
{
"epoch": 5.297906602254429,
"grad_norm": 0.5376565233222369,
"learning_rate": 6.794979969128755e-06,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16141164302825928,
"step": 3290,
"valid_targets_mean": 4118.3,
"valid_targets_min": 1706
},
{
"epoch": 5.305958132045088,
"grad_norm": 0.5378942356008535,
"learning_rate": 6.7347727403089325e-06,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17127177119255066,
"step": 3295,
"valid_targets_mean": 4600.5,
"valid_targets_min": 1136
},
{
"epoch": 5.314009661835748,
"grad_norm": 0.48776680886655227,
"learning_rate": 6.674779384593373e-06,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13992200791835785,
"step": 3300,
"valid_targets_mean": 4386.2,
"valid_targets_min": 1725
},
{
"epoch": 5.322061191626409,
"grad_norm": 0.5329626208836868,
"learning_rate": 6.61500086924519e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17515888810157776,
"step": 3305,
"valid_targets_mean": 4181.7,
"valid_targets_min": 290
},
{
"epoch": 5.330112721417069,
"grad_norm": 0.46016033498034964,
"learning_rate": 6.555438158063683e-06,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17031973600387573,
"step": 3310,
"valid_targets_mean": 5609.8,
"valid_targets_min": 1475
},
{
"epoch": 5.338164251207729,
"grad_norm": 0.7890593958793812,
"learning_rate": 6.4960922113687695e-06,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17659761011600494,
"step": 3315,
"valid_targets_mean": 3941.4,
"valid_targets_min": 1450
},
{
"epoch": 5.3462157809983895,
"grad_norm": 0.5703421349872555,
"learning_rate": 6.4369639859855115e-06,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17057812213897705,
"step": 3320,
"valid_targets_mean": 4658.4,
"valid_targets_min": 1863
},
{
"epoch": 5.35426731078905,
"grad_norm": 0.564126182226765,
"learning_rate": 6.378054435228671e-06,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18041761219501495,
"step": 3325,
"valid_targets_mean": 4159.0,
"valid_targets_min": 759
},
{
"epoch": 5.36231884057971,
"grad_norm": 0.4973048643598519,
"learning_rate": 6.319364508887371e-06,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1592758297920227,
"step": 3330,
"valid_targets_mean": 4736.2,
"valid_targets_min": 1812
},
{
"epoch": 5.37037037037037,
"grad_norm": 0.569769342446689,
"learning_rate": 6.260895153209763e-06,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18152937293052673,
"step": 3335,
"valid_targets_mean": 4268.9,
"valid_targets_min": 1431
},
{
"epoch": 5.3784219001610305,
"grad_norm": 0.5016879405573162,
"learning_rate": 6.202647310887764e-06,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17833814024925232,
"step": 3340,
"valid_targets_mean": 4741.9,
"valid_targets_min": 1679
},
{
"epoch": 5.386473429951691,
"grad_norm": 0.5247407647892519,
"learning_rate": 6.14462192104188e-06,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20044955611228943,
"step": 3345,
"valid_targets_mean": 4656.0,
"valid_targets_min": 2099
},
{
"epoch": 5.394524959742351,
"grad_norm": 0.47014870620352595,
"learning_rate": 6.086819919206051e-06,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17010408639907837,
"step": 3350,
"valid_targets_mean": 5653.4,
"valid_targets_min": 2097
},
{
"epoch": 5.402576489533011,
"grad_norm": 0.6060057637724512,
"learning_rate": 6.029242237312554e-06,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18121179938316345,
"step": 3355,
"valid_targets_mean": 5222.9,
"valid_targets_min": 532
},
{
"epoch": 5.4106280193236715,
"grad_norm": 0.5270241265183322,
"learning_rate": 5.971889803676996e-06,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16754843294620514,
"step": 3360,
"valid_targets_mean": 4372.1,
"valid_targets_min": 1892
},
{
"epoch": 5.418679549114332,
"grad_norm": 0.5131324243265083,
"learning_rate": 5.914763542983355e-06,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18260961771011353,
"step": 3365,
"valid_targets_mean": 5181.3,
"valid_targets_min": 1175
},
{
"epoch": 5.426731078904992,
"grad_norm": 0.5192149826300284,
"learning_rate": 5.857864376269051e-06,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18823757767677307,
"step": 3370,
"valid_targets_mean": 4809.2,
"valid_targets_min": 1171
},
{
"epoch": 5.434782608695652,
"grad_norm": 0.5980250860155677,
"learning_rate": 5.801193220910108e-06,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16703063249588013,
"step": 3375,
"valid_targets_mean": 4509.7,
"valid_targets_min": 1367
},
{
"epoch": 5.442834138486313,
"grad_norm": 0.551837937511895,
"learning_rate": 5.744750990606356e-06,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15874727070331573,
"step": 3380,
"valid_targets_mean": 3712.6,
"valid_targets_min": 311
},
{
"epoch": 5.450885668276973,
"grad_norm": 0.49161398228706626,
"learning_rate": 5.688538595366706e-06,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.155176043510437,
"step": 3385,
"valid_targets_mean": 4476.1,
"valid_targets_min": 1936
},
{
"epoch": 5.458937198067633,
"grad_norm": 0.5355381631745951,
"learning_rate": 5.632556941494482e-06,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.153697669506073,
"step": 3390,
"valid_targets_mean": 3974.2,
"valid_targets_min": 1569
},
{
"epoch": 5.466988727858293,
"grad_norm": 0.5115948764108772,
"learning_rate": 5.5768069315727895e-06,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1722053587436676,
"step": 3395,
"valid_targets_mean": 4293.4,
"valid_targets_min": 2260
},
{
"epoch": 5.475040257648954,
"grad_norm": 0.4799188086454644,
"learning_rate": 5.521289464449975e-06,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17728543281555176,
"step": 3400,
"valid_targets_mean": 5211.7,
"valid_targets_min": 363
},
{
"epoch": 5.483091787439614,
"grad_norm": 0.5570316610757228,
"learning_rate": 5.46600543522515e-06,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16196802258491516,
"step": 3405,
"valid_targets_mean": 4058.4,
"valid_targets_min": 653
},
{
"epoch": 5.491143317230274,
"grad_norm": 0.6736055907952796,
"learning_rate": 5.410955735233736e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.171076238155365,
"step": 3410,
"valid_targets_mean": 5974.8,
"valid_targets_min": 2681
},
{
"epoch": 5.499194847020934,
"grad_norm": 0.5508461582818147,
"learning_rate": 5.3561412520331025e-06,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14637523889541626,
"step": 3415,
"valid_targets_mean": 4094.3,
"valid_targets_min": 904
},
{
"epoch": 5.507246376811594,
"grad_norm": 0.5142188355081284,
"learning_rate": 5.30156286938826e-06,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1733294427394867,
"step": 3420,
"valid_targets_mean": 4461.4,
"valid_targets_min": 1105
},
{
"epoch": 5.515297906602254,
"grad_norm": 0.5905481814384393,
"learning_rate": 5.24722146725761e-06,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17892040312290192,
"step": 3425,
"valid_targets_mean": 4002.8,
"valid_targets_min": 1672
},
{
"epoch": 5.523349436392914,
"grad_norm": 0.45334104473741593,
"learning_rate": 5.193117921778743e-06,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13965705037117004,
"step": 3430,
"valid_targets_mean": 4802.2,
"valid_targets_min": 1812
},
{
"epoch": 5.531400966183575,
"grad_norm": 0.742354374585886,
"learning_rate": 5.139253105254336e-06,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18780140578746796,
"step": 3435,
"valid_targets_mean": 4082.1,
"valid_targets_min": 1116
},
{
"epoch": 5.539452495974235,
"grad_norm": 0.44385771676975855,
"learning_rate": 5.085627886138078e-06,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14621910452842712,
"step": 3440,
"valid_targets_mean": 5131.4,
"valid_targets_min": 1610
},
{
"epoch": 5.547504025764895,
"grad_norm": 0.47820099076305106,
"learning_rate": 5.032243129020671e-06,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16836556792259216,
"step": 3445,
"valid_targets_mean": 5182.5,
"valid_targets_min": 1770
},
{
"epoch": 5.555555555555555,
"grad_norm": 0.5335135512220336,
"learning_rate": 4.9790996946158695e-06,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18833035230636597,
"step": 3450,
"valid_targets_mean": 4468.0,
"valid_targets_min": 1464
},
{
"epoch": 5.563607085346216,
"grad_norm": 0.5452849565299809,
"learning_rate": 4.926198439746641e-06,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16549217700958252,
"step": 3455,
"valid_targets_mean": 3943.1,
"valid_targets_min": 1663
},
{
"epoch": 5.571658615136876,
"grad_norm": 0.47569229716225025,
"learning_rate": 4.873540217331325e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14578670263290405,
"step": 3460,
"valid_targets_mean": 4942.0,
"valid_targets_min": 1587
},
{
"epoch": 5.579710144927536,
"grad_norm": 0.6257220241925262,
"learning_rate": 4.82112587636989e-06,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14457204937934875,
"step": 3465,
"valid_targets_mean": 4796.1,
"valid_targets_min": 1025
},
{
"epoch": 5.587761674718196,
"grad_norm": 0.5126249751180715,
"learning_rate": 4.768956261930233e-06,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21914073824882507,
"step": 3470,
"valid_targets_mean": 5159.1,
"valid_targets_min": 1672
},
{
"epoch": 5.595813204508857,
"grad_norm": 0.5030438743653675,
"learning_rate": 4.717032215134576e-06,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1816645860671997,
"step": 3475,
"valid_targets_mean": 5501.6,
"valid_targets_min": 1066
},
{
"epoch": 5.603864734299517,
"grad_norm": 0.7789904581155889,
"learning_rate": 4.66535457314589e-06,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1629607379436493,
"step": 3480,
"valid_targets_mean": 5301.9,
"valid_targets_min": 1650
},
{
"epoch": 5.611916264090177,
"grad_norm": 0.5094527470833449,
"learning_rate": 4.613924169154406e-06,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16425767540931702,
"step": 3485,
"valid_targets_mean": 4554.6,
"valid_targets_min": 1654
},
{
"epoch": 5.6199677938808374,
"grad_norm": 0.48660247544704416,
"learning_rate": 4.5627418323641705e-06,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17449656128883362,
"step": 3490,
"valid_targets_mean": 5440.4,
"valid_targets_min": 3305
},
{
"epoch": 5.628019323671498,
"grad_norm": 0.6588365172160204,
"learning_rate": 4.51180838797969e-06,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16700059175491333,
"step": 3495,
"valid_targets_mean": 3524.9,
"valid_targets_min": 431
},
{
"epoch": 5.636070853462158,
"grad_norm": 0.5649424861690088,
"learning_rate": 4.461124657192612e-06,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16424767673015594,
"step": 3500,
"valid_targets_mean": 3976.2,
"valid_targets_min": 327
},
{
"epoch": 5.644122383252818,
"grad_norm": 0.5402856059826509,
"learning_rate": 4.410691457168488e-06,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17043063044548035,
"step": 3505,
"valid_targets_mean": 4236.4,
"valid_targets_min": 1605
},
{
"epoch": 5.6521739130434785,
"grad_norm": 0.6565234736534431,
"learning_rate": 4.3605096010336115e-06,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19410403072834015,
"step": 3510,
"valid_targets_mean": 3966.3,
"valid_targets_min": 374
},
{
"epoch": 5.660225442834139,
"grad_norm": 0.46809524453228724,
"learning_rate": 4.310579897861902e-06,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14890244603157043,
"step": 3515,
"valid_targets_mean": 5078.9,
"valid_targets_min": 1866
},
{
"epoch": 5.668276972624799,
"grad_norm": 0.5402583356363803,
"learning_rate": 4.26090315266185e-06,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18138787150382996,
"step": 3520,
"valid_targets_mean": 4479.4,
"valid_targets_min": 1667
},
{
"epoch": 5.676328502415459,
"grad_norm": 0.5567198301706011,
"learning_rate": 4.2114801663635504e-06,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19387924671173096,
"step": 3525,
"valid_targets_mean": 4855.1,
"valid_targets_min": 1475
},
{
"epoch": 5.6843800322061195,
"grad_norm": 0.5076182712626346,
"learning_rate": 4.1623117358057865e-06,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16965937614440918,
"step": 3530,
"valid_targets_mean": 4802.6,
"valid_targets_min": 2133
},
{
"epoch": 5.692431561996779,
"grad_norm": 0.5638233787105313,
"learning_rate": 4.113398653723168e-06,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1688123494386673,
"step": 3535,
"valid_targets_mean": 4551.8,
"valid_targets_min": 590
},
{
"epoch": 5.70048309178744,
"grad_norm": 0.6026682576927842,
"learning_rate": 4.0647417087333776e-06,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17929375171661377,
"step": 3540,
"valid_targets_mean": 4203.6,
"valid_targets_min": 1303
},
{
"epoch": 5.708534621578099,
"grad_norm": 0.4840327343136473,
"learning_rate": 4.0163416853244385e-06,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15817004442214966,
"step": 3545,
"valid_targets_mean": 4813.0,
"valid_targets_min": 321
},
{
"epoch": 5.71658615136876,
"grad_norm": 0.5122311264991213,
"learning_rate": 3.968199363842056e-06,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15911847352981567,
"step": 3550,
"valid_targets_mean": 4163.8,
"valid_targets_min": 2141
},
{
"epoch": 5.72463768115942,
"grad_norm": 0.5526613981940242,
"learning_rate": 3.920315520477065e-06,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16690890491008759,
"step": 3555,
"valid_targets_mean": 3781.4,
"valid_targets_min": 434
},
{
"epoch": 5.73268921095008,
"grad_norm": 0.5154673260140975,
"learning_rate": 3.872690927252891e-06,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18027852475643158,
"step": 3560,
"valid_targets_mean": 4373.6,
"valid_targets_min": 1594
},
{
"epoch": 5.7407407407407405,
"grad_norm": 0.48703994856912225,
"learning_rate": 3.825326352013119e-06,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16559578478336334,
"step": 3565,
"valid_targets_mean": 4382.0,
"valid_targets_min": 1603
},
{
"epoch": 5.748792270531401,
"grad_norm": 0.5472851978165418,
"learning_rate": 3.7782225584091016e-06,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15613017976284027,
"step": 3570,
"valid_targets_mean": 4052.4,
"valid_targets_min": 339
},
{
"epoch": 5.756843800322061,
"grad_norm": 0.5873806542864478,
"learning_rate": 3.731380305887644e-06,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17352142930030823,
"step": 3575,
"valid_targets_mean": 4468.3,
"valid_targets_min": 860
},
{
"epoch": 5.764895330112721,
"grad_norm": 0.562715584188104,
"learning_rate": 3.684800349678781e-06,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19309145212173462,
"step": 3580,
"valid_targets_mean": 3819.3,
"valid_targets_min": 831
},
{
"epoch": 5.7729468599033815,
"grad_norm": 0.584825018902196,
"learning_rate": 3.638483440783576e-06,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22266249358654022,
"step": 3585,
"valid_targets_mean": 4084.6,
"valid_targets_min": 1924
},
{
"epoch": 5.780998389694042,
"grad_norm": 0.5288099238647191,
"learning_rate": 3.5924303259620307e-06,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15193787217140198,
"step": 3590,
"valid_targets_mean": 4209.9,
"valid_targets_min": 963
},
{
"epoch": 5.789049919484702,
"grad_norm": 0.5275609216950717,
"learning_rate": 3.546641747721036e-06,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16384585201740265,
"step": 3595,
"valid_targets_mean": 4627.3,
"valid_targets_min": 1626
},
{
"epoch": 5.797101449275362,
"grad_norm": 0.725525221737914,
"learning_rate": 3.501118444302394e-06,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18506191670894623,
"step": 3600,
"valid_targets_mean": 3873.7,
"valid_targets_min": 756
},
{
"epoch": 5.805152979066023,
"grad_norm": 0.5082224637456563,
"learning_rate": 3.4558611496709384e-06,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.165011465549469,
"step": 3605,
"valid_targets_mean": 4355.2,
"valid_targets_min": 776
},
{
"epoch": 5.813204508856683,
"grad_norm": 0.8025807922419831,
"learning_rate": 3.4108705935026685e-06,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15931957960128784,
"step": 3610,
"valid_targets_mean": 3695.9,
"valid_targets_min": 1119
},
{
"epoch": 5.821256038647343,
"grad_norm": 0.5168844656413334,
"learning_rate": 3.3661475011730206e-06,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15300890803337097,
"step": 3615,
"valid_targets_mean": 4747.3,
"valid_targets_min": 1185
},
{
"epoch": 5.829307568438003,
"grad_norm": 0.5249631418738182,
"learning_rate": 3.321692593745147e-06,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15493711829185486,
"step": 3620,
"valid_targets_mean": 3726.0,
"valid_targets_min": 1610
},
{
"epoch": 5.837359098228664,
"grad_norm": 0.5331107342319671,
"learning_rate": 3.2775065879582948e-06,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17267771065235138,
"step": 3625,
"valid_targets_mean": 5503.0,
"valid_targets_min": 1978
},
{
"epoch": 5.845410628019324,
"grad_norm": 0.5222892591386691,
"learning_rate": 3.233590196216263e-06,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1816999316215515,
"step": 3630,
"valid_targets_mean": 4842.2,
"valid_targets_min": 545
},
{
"epoch": 5.853462157809984,
"grad_norm": 0.5132154525081916,
"learning_rate": 3.1899441265759036e-06,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19336271286010742,
"step": 3635,
"valid_targets_mean": 5282.2,
"valid_targets_min": 1948
},
{
"epoch": 5.861513687600644,
"grad_norm": 0.5087976961623909,
"learning_rate": 3.1465690827356955e-06,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17752087116241455,
"step": 3640,
"valid_targets_mean": 4912.0,
"valid_targets_min": 1166
},
{
"epoch": 5.869565217391305,
"grad_norm": 0.5723530802904422,
"learning_rate": 3.103465764024438e-06,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1567440927028656,
"step": 3645,
"valid_targets_mean": 3882.6,
"valid_targets_min": 627
},
{
"epoch": 5.877616747181965,
"grad_norm": 0.6212444706400745,
"learning_rate": 3.0606348653899288e-06,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16555482149124146,
"step": 3650,
"valid_targets_mean": 4280.1,
"valid_targets_min": 1429
},
{
"epoch": 5.885668276972625,
"grad_norm": 0.6037643784134114,
"learning_rate": 3.0180770773877866e-06,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1539427787065506,
"step": 3655,
"valid_targets_mean": 3446.1,
"valid_targets_min": 864
},
{
"epoch": 5.8937198067632846,
"grad_norm": 0.5417204859207484,
"learning_rate": 2.9757930861703223e-06,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1333686113357544,
"step": 3660,
"valid_targets_mean": 4272.0,
"valid_targets_min": 993
},
{
"epoch": 5.901771336553946,
"grad_norm": 0.545060770024728,
"learning_rate": 2.9337835734754504e-06,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16815856099128723,
"step": 3665,
"valid_targets_mean": 4364.4,
"valid_targets_min": 1968
},
{
"epoch": 5.909822866344605,
"grad_norm": 0.4807913485701676,
"learning_rate": 2.892049216615724e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16856727004051208,
"step": 3670,
"valid_targets_mean": 4645.9,
"valid_targets_min": 1236
},
{
"epoch": 5.917874396135265,
"grad_norm": 0.5872896027676431,
"learning_rate": 2.850590688467405e-06,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17276933789253235,
"step": 3675,
"valid_targets_mean": 4079.1,
"valid_targets_min": 758
},
{
"epoch": 5.925925925925926,
"grad_norm": 0.5081772741434722,
"learning_rate": 2.8094086574595934e-06,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17815062403678894,
"step": 3680,
"valid_targets_mean": 4622.2,
"valid_targets_min": 506
},
{
"epoch": 5.933977455716586,
"grad_norm": 0.5314566948595292,
"learning_rate": 2.768503787563497e-06,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15440833568572998,
"step": 3685,
"valid_targets_mean": 4177.4,
"valid_targets_min": 1764
},
{
"epoch": 5.942028985507246,
"grad_norm": 0.5944657537451915,
"learning_rate": 2.7278767382816828e-06,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15870711207389832,
"step": 3690,
"valid_targets_mean": 4034.2,
"valid_targets_min": 346
},
{
"epoch": 5.950080515297906,
"grad_norm": 0.5150609346752764,
"learning_rate": 2.687528164637474e-06,
"loss": 0.1682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16893523931503296,
"step": 3695,
"valid_targets_mean": 4341.7,
"valid_targets_min": 544
},
{
"epoch": 5.958132045088567,
"grad_norm": 0.622800014898735,
"learning_rate": 2.647458717164357e-06,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1420368254184723,
"step": 3700,
"valid_targets_mean": 4181.0,
"valid_targets_min": 930
},
{
"epoch": 5.966183574879227,
"grad_norm": 0.5118850984097806,
"learning_rate": 2.607669041895535e-06,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17651256918907166,
"step": 3705,
"valid_targets_mean": 5766.2,
"valid_targets_min": 2526
},
{
"epoch": 5.974235104669887,
"grad_norm": 0.5922490816235029,
"learning_rate": 2.568159780353476e-06,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15372015535831451,
"step": 3710,
"valid_targets_mean": 3693.7,
"valid_targets_min": 614
},
{
"epoch": 5.982286634460547,
"grad_norm": 0.5223810749820793,
"learning_rate": 2.5289315695395834e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17238521575927734,
"step": 3715,
"valid_targets_mean": 3895.1,
"valid_targets_min": 703
},
{
"epoch": 5.990338164251208,
"grad_norm": 0.6140059891446761,
"learning_rate": 2.489985041923928e-06,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18047456443309784,
"step": 3720,
"valid_targets_mean": 4203.8,
"valid_targets_min": 989
},
{
"epoch": 5.998389694041868,
"grad_norm": 0.5110659722384324,
"learning_rate": 2.4513208254350486e-06,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1803944855928421,
"step": 3725,
"valid_targets_mean": 4611.9,
"valid_targets_min": 1053
},
{
"epoch": 6.006441223832528,
"grad_norm": 0.46649632563361154,
"learning_rate": 2.412939543449828e-06,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1679632067680359,
"step": 3730,
"valid_targets_mean": 4868.8,
"valid_targets_min": 1373
},
{
"epoch": 6.0144927536231885,
"grad_norm": 0.5752464912619374,
"learning_rate": 2.3748418147834394e-06,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14780664443969727,
"step": 3735,
"valid_targets_mean": 3625.4,
"valid_targets_min": 705
},
{
"epoch": 6.022544283413849,
"grad_norm": 0.4873295942554316,
"learning_rate": 2.337028253679381e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14143216609954834,
"step": 3740,
"valid_targets_mean": 4609.2,
"valid_targets_min": 1716
},
{
"epoch": 6.030595813204509,
"grad_norm": 0.4572827913243831,
"learning_rate": 2.299499469799542e-06,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1580767184495926,
"step": 3745,
"valid_targets_mean": 5816.4,
"valid_targets_min": 1119
},
{
"epoch": 6.038647342995169,
"grad_norm": 0.5186439466567816,
"learning_rate": 2.262256068214421e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17476163804531097,
"step": 3750,
"valid_targets_mean": 4437.0,
"valid_targets_min": 757
},
{
"epoch": 6.0466988727858295,
"grad_norm": 0.5118711095108422,
"learning_rate": 2.2252986493933237e-06,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16541600227355957,
"step": 3755,
"valid_targets_mean": 4525.7,
"valid_targets_min": 2162
},
{
"epoch": 6.05475040257649,
"grad_norm": 0.5109434582294012,
"learning_rate": 2.18862780919471e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15595577657222748,
"step": 3760,
"valid_targets_mean": 4511.2,
"valid_targets_min": 1010
},
{
"epoch": 6.06280193236715,
"grad_norm": 0.5324485507591655,
"learning_rate": 2.152244138856585e-06,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1731036901473999,
"step": 3765,
"valid_targets_mean": 4594.2,
"valid_targets_min": 1788
},
{
"epoch": 6.07085346215781,
"grad_norm": 0.4936303320259845,
"learning_rate": 2.1161482249869513e-06,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14089539647102356,
"step": 3770,
"valid_targets_mean": 5116.8,
"valid_targets_min": 422
},
{
"epoch": 6.078904991948471,
"grad_norm": 0.5698965758566077,
"learning_rate": 2.080340649554369e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16755038499832153,
"step": 3775,
"valid_targets_mean": 4225.4,
"valid_targets_min": 536
},
{
"epoch": 6.086956521739131,
"grad_norm": 0.5229210197667631,
"learning_rate": 2.044821989878558e-06,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16623234748840332,
"step": 3780,
"valid_targets_mean": 4262.9,
"valid_targets_min": 1577
},
{
"epoch": 6.095008051529791,
"grad_norm": 0.5459701049906057,
"learning_rate": 2.0095928186210956e-06,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.147607684135437,
"step": 3785,
"valid_targets_mean": 4724.4,
"valid_targets_min": 1787
},
{
"epoch": 6.1030595813204505,
"grad_norm": 0.5581543823448861,
"learning_rate": 1.974653703776188e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18220457434654236,
"step": 3790,
"valid_targets_mean": 5031.3,
"valid_targets_min": 392
},
{
"epoch": 6.111111111111111,
"grad_norm": 0.5197842393741545,
"learning_rate": 1.9400052086615153e-06,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1598493456840515,
"step": 3795,
"valid_targets_mean": 4375.8,
"valid_targets_min": 1759
},
{
"epoch": 6.119162640901771,
"grad_norm": 0.5494186611639191,
"learning_rate": 1.9056478919091236e-06,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19067052006721497,
"step": 3800,
"valid_targets_mean": 4341.0,
"valid_targets_min": 692
},
{
"epoch": 6.127214170692431,
"grad_norm": 0.5103976820611801,
"learning_rate": 1.8715823074564587e-06,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15958425402641296,
"step": 3805,
"valid_targets_mean": 4729.6,
"valid_targets_min": 362
},
{
"epoch": 6.1352657004830915,
"grad_norm": 0.5752435508668234,
"learning_rate": 1.837809004537401e-06,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1595839112997055,
"step": 3810,
"valid_targets_mean": 4986.8,
"valid_targets_min": 897
},
{
"epoch": 6.143317230273752,
"grad_norm": 0.6232969103900382,
"learning_rate": 1.8043285276734334e-06,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17083576321601868,
"step": 3815,
"valid_targets_mean": 3214.8,
"valid_targets_min": 547
},
{
"epoch": 6.151368760064412,
"grad_norm": 0.5085611865605083,
"learning_rate": 1.7711414166648365e-06,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15489043295383453,
"step": 3820,
"valid_targets_mean": 4428.2,
"valid_targets_min": 1416
},
{
"epoch": 6.159420289855072,
"grad_norm": 0.5686690339243041,
"learning_rate": 1.7382482065820138e-06,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16790664196014404,
"step": 3825,
"valid_targets_mean": 4888.5,
"valid_targets_min": 1755
},
{
"epoch": 6.1674718196457325,
"grad_norm": 0.6929429650574811,
"learning_rate": 1.7056494277568503e-06,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1905716359615326,
"step": 3830,
"valid_targets_mean": 3701.2,
"valid_targets_min": 1170
},
{
"epoch": 6.175523349436393,
"grad_norm": 0.6367228356359814,
"learning_rate": 1.6733456057741592e-06,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1782214492559433,
"step": 3835,
"valid_targets_mean": 3788.4,
"valid_targets_min": 1742
},
{
"epoch": 6.183574879227053,
"grad_norm": 0.532748190271915,
"learning_rate": 1.641337261463216e-06,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18782779574394226,
"step": 3840,
"valid_targets_mean": 4424.2,
"valid_targets_min": 745
},
{
"epoch": 6.191626409017713,
"grad_norm": 0.5944352055775861,
"learning_rate": 1.6096249108893602e-06,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14986079931259155,
"step": 3845,
"valid_targets_mean": 4633.4,
"valid_targets_min": 817
},
{
"epoch": 6.199677938808374,
"grad_norm": 0.4718113061336701,
"learning_rate": 1.5782090653456616e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15445095300674438,
"step": 3850,
"valid_targets_mean": 5366.3,
"valid_targets_min": 2465
},
{
"epoch": 6.207729468599034,
"grad_norm": 0.5299032276018538,
"learning_rate": 1.547090231344699e-06,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1652597188949585,
"step": 3855,
"valid_targets_mean": 4490.8,
"valid_targets_min": 2050
},
{
"epoch": 6.215780998389694,
"grad_norm": 0.4937926792080132,
"learning_rate": 1.5162689106103746e-06,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16262544691562653,
"step": 3860,
"valid_targets_mean": 5297.2,
"valid_targets_min": 758
},
{
"epoch": 6.223832528180354,
"grad_norm": 0.5983118290721653,
"learning_rate": 1.4857456000698366e-06,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21267688274383545,
"step": 3865,
"valid_targets_mean": 5259.9,
"valid_targets_min": 1772
},
{
"epoch": 6.231884057971015,
"grad_norm": 0.5186630493468379,
"learning_rate": 1.4555207918454662e-06,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20158061385154724,
"step": 3870,
"valid_targets_mean": 5251.4,
"valid_targets_min": 570
},
{
"epoch": 6.239935587761675,
"grad_norm": 0.5732567692410732,
"learning_rate": 1.4255949732469309e-06,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15088540315628052,
"step": 3875,
"valid_targets_mean": 3437.3,
"valid_targets_min": 1053
},
{
"epoch": 6.247987117552335,
"grad_norm": 0.5122360577374575,
"learning_rate": 1.3959686267633488e-06,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1651184856891632,
"step": 3880,
"valid_targets_mean": 5088.6,
"valid_targets_min": 1995
},
{
"epoch": 6.256038647342995,
"grad_norm": 0.48110861215986517,
"learning_rate": 1.3666422300554905e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16647136211395264,
"step": 3885,
"valid_targets_mean": 5231.4,
"valid_targets_min": 2355
},
{
"epoch": 6.264090177133656,
"grad_norm": 0.582851491108072,
"learning_rate": 1.3376162559480822e-06,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18534335494041443,
"step": 3890,
"valid_targets_mean": 4512.3,
"valid_targets_min": 2039
},
{
"epoch": 6.272141706924316,
"grad_norm": 0.5404662794082068,
"learning_rate": 1.308891172422193e-06,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1919654756784439,
"step": 3895,
"valid_targets_mean": 4829.6,
"valid_targets_min": 972
},
{
"epoch": 6.280193236714976,
"grad_norm": 0.628437639331324,
"learning_rate": 1.2804674426076757e-06,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21055009961128235,
"step": 3900,
"valid_targets_mean": 4256.2,
"valid_targets_min": 846
},
{
"epoch": 6.2882447665056365,
"grad_norm": 0.4797286979992782,
"learning_rate": 1.2523455247757088e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14173908531665802,
"step": 3905,
"valid_targets_mean": 5012.4,
"valid_targets_min": 1956
},
{
"epoch": 6.296296296296296,
"grad_norm": 0.5914383870555415,
"learning_rate": 1.224525872331408e-06,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17256557941436768,
"step": 3910,
"valid_targets_mean": 3722.4,
"valid_targets_min": 1185
},
{
"epoch": 6.304347826086957,
"grad_norm": 0.5475160234396864,
"learning_rate": 1.1970089338065071e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16874639689922333,
"step": 3915,
"valid_targets_mean": 4964.1,
"valid_targets_min": 1411
},
{
"epoch": 6.312399355877616,
"grad_norm": 0.6352630163683538,
"learning_rate": 1.1697951528521422e-06,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16274841129779816,
"step": 3920,
"valid_targets_mean": 3514.2,
"valid_targets_min": 1903
},
{
"epoch": 6.320450885668277,
"grad_norm": 0.5450852465931986,
"learning_rate": 1.1428849682316766e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16449615359306335,
"step": 3925,
"valid_targets_mean": 4061.4,
"valid_targets_min": 1262
},
{
"epoch": 6.328502415458937,
"grad_norm": 0.48987328370522754,
"learning_rate": 1.116278813813647e-06,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13572901487350464,
"step": 3930,
"valid_targets_mean": 4505.6,
"valid_targets_min": 1616
},
{
"epoch": 6.336553945249597,
"grad_norm": 0.503141267860805,
"learning_rate": 1.08997711856476e-06,
"loss": 0.1612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16356249153614044,
"step": 3935,
"valid_targets_mean": 4598.4,
"valid_targets_min": 1028
},
{
"epoch": 6.344605475040257,
"grad_norm": 0.7893130983095663,
"learning_rate": 1.0639803065429755e-06,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20338299870491028,
"step": 3940,
"valid_targets_mean": 5540.6,
"valid_targets_min": 2279
},
{
"epoch": 6.352657004830918,
"grad_norm": 0.5464519825128046,
"learning_rate": 1.0382887968906718e-06,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1746448576450348,
"step": 3945,
"valid_targets_mean": 3995.6,
"valid_targets_min": 1677
},
{
"epoch": 6.360708534621578,
"grad_norm": 0.5620117079550653,
"learning_rate": 1.012903003827883e-06,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1740240752696991,
"step": 3950,
"valid_targets_mean": 3910.2,
"valid_targets_min": 1147
},
{
"epoch": 6.368760064412238,
"grad_norm": 0.5014202584177402,
"learning_rate": 9.87823336645628e-07,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15709742903709412,
"step": 3955,
"valid_targets_mean": 4344.8,
"valid_targets_min": 2201
},
{
"epoch": 6.3768115942028984,
"grad_norm": 0.5362938011516779,
"learning_rate": 9.630501996993091e-07,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17129208147525787,
"step": 3960,
"valid_targets_mean": 4717.5,
"valid_targets_min": 1989
},
{
"epoch": 6.384863123993559,
"grad_norm": 0.44355010700619574,
"learning_rate": 9.385839924021844e-07,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14925384521484375,
"step": 3965,
"valid_targets_mean": 5392.1,
"valid_targets_min": 2034
},
{
"epoch": 6.392914653784219,
"grad_norm": 0.5637410567366077,
"learning_rate": 9.144251092189416e-07,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2033105343580246,
"step": 3970,
"valid_targets_mean": 4397.6,
"valid_targets_min": 529
},
{
"epoch": 6.400966183574879,
"grad_norm": 0.5246003448080508,
"learning_rate": 8.905739396593316e-07,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16925036907196045,
"step": 3975,
"valid_targets_mean": 4739.1,
"valid_targets_min": 720
},
{
"epoch": 6.4090177133655395,
"grad_norm": 0.5406121384840578,
"learning_rate": 8.670308682718853e-07,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1594831645488739,
"step": 3980,
"valid_targets_mean": 4337.4,
"valid_targets_min": 800
},
{
"epoch": 6.4170692431562,
"grad_norm": 0.4785613416301052,
"learning_rate": 8.437962746377204e-07,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1622602641582489,
"step": 3985,
"valid_targets_mean": 5365.6,
"valid_targets_min": 1316
},
{
"epoch": 6.42512077294686,
"grad_norm": 0.4972685992182721,
"learning_rate": 8.208705333644129e-07,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1673496663570404,
"step": 3990,
"valid_targets_mean": 4327.2,
"valid_targets_min": 873
},
{
"epoch": 6.43317230273752,
"grad_norm": 0.51768549782515,
"learning_rate": 7.982540140799688e-07,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.161638081073761,
"step": 3995,
"valid_targets_mean": 4245.7,
"valid_targets_min": 1725
},
{
"epoch": 6.4412238325281805,
"grad_norm": 0.6255107806087558,
"learning_rate": 7.759470814268489e-07,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16319170594215393,
"step": 4000,
"valid_targets_mean": 3573.4,
"valid_targets_min": 216
},
{
"epoch": 6.449275362318841,
"grad_norm": 0.5117136147623905,
"learning_rate": 7.539500950561063e-07,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18081682920455933,
"step": 4005,
"valid_targets_mean": 5030.6,
"valid_targets_min": 941
},
{
"epoch": 6.457326892109501,
"grad_norm": 0.5410913172933577,
"learning_rate": 7.322634096215831e-07,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15669681131839752,
"step": 4010,
"valid_targets_mean": 4348.8,
"valid_targets_min": 713
},
{
"epoch": 6.465378421900161,
"grad_norm": 0.4986868222815654,
"learning_rate": 7.108873747741807e-07,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14274120330810547,
"step": 4015,
"valid_targets_mean": 4543.1,
"valid_targets_min": 1717
},
{
"epoch": 6.473429951690822,
"grad_norm": 0.469433549650835,
"learning_rate": 6.898223351562405e-07,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15934091806411743,
"step": 4020,
"valid_targets_mean": 5432.7,
"valid_targets_min": 2526
},
{
"epoch": 6.481481481481482,
"grad_norm": 0.622115989263229,
"learning_rate": 6.690686303959748e-07,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18453718721866608,
"step": 4025,
"valid_targets_mean": 3467.2,
"valid_targets_min": 545
},
{
"epoch": 6.489533011272142,
"grad_norm": 0.5270621108254152,
"learning_rate": 6.48626595101991e-07,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19507281482219696,
"step": 4030,
"valid_targets_mean": 5011.7,
"valid_targets_min": 2115
},
{
"epoch": 6.4975845410628015,
"grad_norm": 0.5614424641002262,
"learning_rate": 6.284965588579028e-07,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1735997200012207,
"step": 4035,
"valid_targets_mean": 4858.7,
"valid_targets_min": 1516
},
{
"epoch": 6.505636070853463,
"grad_norm": 0.6277678468034912,
"learning_rate": 6.08678846217019e-07,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.173121377825737,
"step": 4040,
"valid_targets_mean": 4697.3,
"valid_targets_min": 434
},
{
"epoch": 6.513687600644122,
"grad_norm": 0.557886874518275,
"learning_rate": 5.891737766970984e-07,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16518916189670563,
"step": 4045,
"valid_targets_mean": 4401.9,
"valid_targets_min": 596
},
{
"epoch": 6.521739130434782,
"grad_norm": 0.5026467498773549,
"learning_rate": 5.699816647752077e-07,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16781866550445557,
"step": 4050,
"valid_targets_mean": 4928.8,
"valid_targets_min": 2215
},
{
"epoch": 6.5297906602254425,
"grad_norm": 0.5451182471548547,
"learning_rate": 5.511028198826496e-07,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17092815041542053,
"step": 4055,
"valid_targets_mean": 4106.2,
"valid_targets_min": 451
},
{
"epoch": 6.537842190016103,
"grad_norm": 0.5743885198199623,
"learning_rate": 5.32537546399976e-07,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16788442432880402,
"step": 4060,
"valid_targets_mean": 4289.1,
"valid_targets_min": 1684
},
{
"epoch": 6.545893719806763,
"grad_norm": 0.6037224090967725,
"learning_rate": 5.142861436520763e-07,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20297744870185852,
"step": 4065,
"valid_targets_mean": 3997.9,
"valid_targets_min": 383
},
{
"epoch": 6.553945249597423,
"grad_norm": 0.8388825418667704,
"learning_rate": 4.963489059033477e-07,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16553989052772522,
"step": 4070,
"valid_targets_mean": 4784.5,
"valid_targets_min": 2033
},
{
"epoch": 6.561996779388084,
"grad_norm": 0.5970930999537574,
"learning_rate": 4.787261223529616e-07,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17344771325588226,
"step": 4075,
"valid_targets_mean": 3786.6,
"valid_targets_min": 898
},
{
"epoch": 6.570048309178744,
"grad_norm": 0.471204909767901,
"learning_rate": 4.6141807713019793e-07,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13417160511016846,
"step": 4080,
"valid_targets_mean": 5032.4,
"valid_targets_min": 1912
},
{
"epoch": 6.578099838969404,
"grad_norm": 0.4884625900862524,
"learning_rate": 4.444250492898539e-07,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16039326786994934,
"step": 4085,
"valid_targets_mean": 5670.8,
"valid_targets_min": 1963
},
{
"epoch": 6.586151368760064,
"grad_norm": 1.3562926760409872,
"learning_rate": 4.277473128077625e-07,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15605992078781128,
"step": 4090,
"valid_targets_mean": 5004.9,
"valid_targets_min": 390
},
{
"epoch": 6.594202898550725,
"grad_norm": 0.5293266001333903,
"learning_rate": 4.113851365763544e-07,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1735745668411255,
"step": 4095,
"valid_targets_mean": 5240.4,
"valid_targets_min": 1701
},
{
"epoch": 6.602254428341385,
"grad_norm": 0.5578624317503144,
"learning_rate": 3.953387844003431e-07,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1669292151927948,
"step": 4100,
"valid_targets_mean": 4350.2,
"valid_targets_min": 2309
},
{
"epoch": 6.610305958132045,
"grad_norm": 0.604399390427962,
"learning_rate": 3.7960851499245554e-07,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14910921454429626,
"step": 4105,
"valid_targets_mean": 3900.4,
"valid_targets_min": 823
},
{
"epoch": 6.618357487922705,
"grad_norm": 0.5270613962718504,
"learning_rate": 3.6419458196926825e-07,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1642162799835205,
"step": 4110,
"valid_targets_mean": 4613.5,
"valid_targets_min": 1191
},
{
"epoch": 6.626409017713366,
"grad_norm": 0.4768249623670376,
"learning_rate": 3.4909723384712436e-07,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15536585450172424,
"step": 4115,
"valid_targets_mean": 4920.4,
"valid_targets_min": 1743
},
{
"epoch": 6.634460547504026,
"grad_norm": 0.7880877824521434,
"learning_rate": 3.3431671403811207e-07,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14975430071353912,
"step": 4120,
"valid_targets_mean": 4408.2,
"valid_targets_min": 431
},
{
"epoch": 6.642512077294686,
"grad_norm": 0.5055031311515263,
"learning_rate": 3.198532608461524e-07,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18191225826740265,
"step": 4125,
"valid_targets_mean": 5325.4,
"valid_targets_min": 881
},
{
"epoch": 6.650563607085346,
"grad_norm": 0.7377711817281254,
"learning_rate": 3.0570710746314903e-07,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1757345199584961,
"step": 4130,
"valid_targets_mean": 4204.0,
"valid_targets_min": 851
},
{
"epoch": 6.658615136876007,
"grad_norm": 0.49184719888721345,
"learning_rate": 2.9187848196524205e-07,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1542222797870636,
"step": 4135,
"valid_targets_mean": 4731.2,
"valid_targets_min": 429
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.6105305368391408,
"learning_rate": 2.7836760730910464e-07,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17159178853034973,
"step": 4140,
"valid_targets_mean": 3496.8,
"valid_targets_min": 397
},
{
"epoch": 6.674718196457327,
"grad_norm": 0.5519746733795567,
"learning_rate": 2.6517470132838117e-07,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1730884313583374,
"step": 4145,
"valid_targets_mean": 4672.2,
"valid_targets_min": 1995
},
{
"epoch": 6.6827697262479875,
"grad_norm": 0.5635266522753974,
"learning_rate": 2.522999767301482e-07,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15275679528713226,
"step": 4150,
"valid_targets_mean": 3927.0,
"valid_targets_min": 300
},
{
"epoch": 6.690821256038648,
"grad_norm": 0.5061168238375812,
"learning_rate": 2.3974364109149886e-07,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14958354830741882,
"step": 4155,
"valid_targets_mean": 3901.1,
"valid_targets_min": 1810
},
{
"epoch": 6.698872785829307,
"grad_norm": 0.5040398527635441,
"learning_rate": 2.2750589685619495e-07,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17061063647270203,
"step": 4160,
"valid_targets_mean": 4585.4,
"valid_targets_min": 1591
},
{
"epoch": 6.706924315619968,
"grad_norm": 0.5035025471661269,
"learning_rate": 2.1558694133139823e-07,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16706478595733643,
"step": 4165,
"valid_targets_mean": 4401.9,
"valid_targets_min": 310
},
{
"epoch": 6.714975845410628,
"grad_norm": 0.5623618030459923,
"learning_rate": 2.039869666844929e-07,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1561906784772873,
"step": 4170,
"valid_targets_mean": 3450.5,
"valid_targets_min": 1034
},
{
"epoch": 6.723027375201288,
"grad_norm": 0.5216795359225037,
"learning_rate": 1.9270615993998375e-07,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1636110544204712,
"step": 4175,
"valid_targets_mean": 4135.8,
"valid_targets_min": 1656
},
{
"epoch": 6.731078904991948,
"grad_norm": 0.5368469010480501,
"learning_rate": 1.817447029764874e-07,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16674436628818512,
"step": 4180,
"valid_targets_mean": 4527.6,
"valid_targets_min": 1381
},
{
"epoch": 6.739130434782608,
"grad_norm": 0.6438973279011997,
"learning_rate": 1.7110277252379238e-07,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15082503855228424,
"step": 4185,
"valid_targets_mean": 4736.3,
"valid_targets_min": 1379
},
{
"epoch": 6.747181964573269,
"grad_norm": 0.4998287056476511,
"learning_rate": 1.607805401600149e-07,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17229287326335907,
"step": 4190,
"valid_targets_mean": 4969.6,
"valid_targets_min": 1283
},
{
"epoch": 6.755233494363929,
"grad_norm": 0.599169633423643,
"learning_rate": 1.5077817230883419e-07,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15904340147972107,
"step": 4195,
"valid_targets_mean": 4552.9,
"valid_targets_min": 1866
},
{
"epoch": 6.763285024154589,
"grad_norm": 0.570759522637566,
"learning_rate": 1.4109583023679706e-07,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15024811029434204,
"step": 4200,
"valid_targets_mean": 5746.9,
"valid_targets_min": 1892
},
{
"epoch": 6.7713365539452495,
"grad_norm": 0.5403647002807387,
"learning_rate": 1.3173367005073545e-07,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17785856127738953,
"step": 4205,
"valid_targets_mean": 4047.6,
"valid_targets_min": 2002
},
{
"epoch": 6.77938808373591,
"grad_norm": 0.5226238218670288,
"learning_rate": 1.2269184269523282e-07,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16204693913459778,
"step": 4210,
"valid_targets_mean": 4730.7,
"valid_targets_min": 1508
},
{
"epoch": 6.78743961352657,
"grad_norm": 0.5555947999177602,
"learning_rate": 1.1397049395020842e-07,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16874821484088898,
"step": 4215,
"valid_targets_mean": 4100.5,
"valid_targets_min": 1171
},
{
"epoch": 6.79549114331723,
"grad_norm": 0.5473832146836152,
"learning_rate": 1.0556976442854805e-07,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18583595752716064,
"step": 4220,
"valid_targets_mean": 4135.4,
"valid_targets_min": 344
},
{
"epoch": 6.8035426731078905,
"grad_norm": 0.5690884856327217,
"learning_rate": 9.748978957385025e-08,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1753610521554947,
"step": 4225,
"valid_targets_mean": 4328.1,
"valid_targets_min": 669
},
{
"epoch": 6.811594202898551,
"grad_norm": 0.5625787536362429,
"learning_rate": 8.9730699658237e-08,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15724310278892517,
"step": 4230,
"valid_targets_mean": 4711.9,
"valid_targets_min": 2299
},
{
"epoch": 6.819645732689211,
"grad_norm": 0.5162132722455169,
"learning_rate": 8.229261978025316e-08,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17424245178699493,
"step": 4235,
"valid_targets_mean": 4760.0,
"valid_targets_min": 2276
},
{
"epoch": 6.827697262479871,
"grad_norm": 0.6156039773080834,
"learning_rate": 7.517566986285474e-08,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1574200689792633,
"step": 4240,
"valid_targets_mean": 3681.5,
"valid_targets_min": 751
},
{
"epoch": 6.835748792270532,
"grad_norm": 0.5832771610140742,
"learning_rate": 6.837996465146823e-08,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17290878295898438,
"step": 4245,
"valid_targets_mean": 3748.6,
"valid_targets_min": 284
},
{
"epoch": 6.843800322061192,
"grad_norm": 0.5576720036336581,
"learning_rate": 6.190561371214321e-08,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16148659586906433,
"step": 4250,
"valid_targets_mean": 4166.0,
"valid_targets_min": 930
},
{
"epoch": 6.851851851851852,
"grad_norm": 0.5878319666889452,
"learning_rate": 5.575272142978927e-08,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.172722727060318,
"step": 4255,
"valid_targets_mean": 4018.2,
"valid_targets_min": 754
},
{
"epoch": 6.859903381642512,
"grad_norm": 0.479443149906381,
"learning_rate": 4.992138700649074e-08,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13948974013328552,
"step": 4260,
"valid_targets_mean": 4858.1,
"valid_targets_min": 1813
},
{
"epoch": 6.867954911433173,
"grad_norm": 0.5541385500661399,
"learning_rate": 4.4411704459903506e-08,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1660829335451126,
"step": 4265,
"valid_targets_mean": 4232.4,
"valid_targets_min": 1054
},
{
"epoch": 6.876006441223833,
"grad_norm": 0.6179225703483298,
"learning_rate": 3.92237626217451e-08,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16906727850437164,
"step": 4270,
"valid_targets_mean": 4460.8,
"valid_targets_min": 1530
},
{
"epoch": 6.884057971014493,
"grad_norm": 0.5783966854225258,
"learning_rate": 3.435764513635809e-08,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17848993837833405,
"step": 4275,
"valid_targets_mean": 4309.5,
"valid_targets_min": 1717
},
{
"epoch": 6.892109500805153,
"grad_norm": 0.5351867682144865,
"learning_rate": 2.9813430459364465e-08,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17882059514522552,
"step": 4280,
"valid_targets_mean": 4416.9,
"valid_targets_min": 1611
},
{
"epoch": 6.900161030595813,
"grad_norm": 0.573670983161385,
"learning_rate": 2.5591191856397802e-08,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15430384874343872,
"step": 4285,
"valid_targets_mean": 4570.9,
"valid_targets_min": 1407
},
{
"epoch": 6.908212560386474,
"grad_norm": 0.5344897585917823,
"learning_rate": 2.1690997401928593e-08,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16887977719306946,
"step": 4290,
"valid_targets_mean": 4439.5,
"valid_targets_min": 2172
},
{
"epoch": 6.916264090177133,
"grad_norm": 0.551697601245166,
"learning_rate": 1.811290997815851e-08,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17137417197227478,
"step": 4295,
"valid_targets_mean": 4672.2,
"valid_targets_min": 590
},
{
"epoch": 6.9243156199677935,
"grad_norm": 0.5535638309128108,
"learning_rate": 1.485698727400564e-08,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14466409385204315,
"step": 4300,
"valid_targets_mean": 3469.3,
"valid_targets_min": 1197
},
{
"epoch": 6.932367149758454,
"grad_norm": 0.5119337022576111,
"learning_rate": 1.1923281784185226e-08,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16587556898593903,
"step": 4305,
"valid_targets_mean": 4396.5,
"valid_targets_min": 1299
},
{
"epoch": 6.940418679549114,
"grad_norm": 0.5923102041383612,
"learning_rate": 9.311840808357009e-09,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1823520064353943,
"step": 4310,
"valid_targets_mean": 4216.1,
"valid_targets_min": 1303
},
{
"epoch": 6.948470209339774,
"grad_norm": 0.5103445914494756,
"learning_rate": 7.022706450354744e-09,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15162253379821777,
"step": 4315,
"valid_targets_mean": 5503.6,
"valid_targets_min": 2231
},
{
"epoch": 6.956521739130435,
"grad_norm": 0.533406608295802,
"learning_rate": 5.055915617522278e-09,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14400282502174377,
"step": 4320,
"valid_targets_mean": 4314.7,
"valid_targets_min": 1448
},
{
"epoch": 6.964573268921095,
"grad_norm": 0.6879701190779768,
"learning_rate": 3.411500020109593e-09,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1823330670595169,
"step": 4325,
"valid_targets_mean": 3070.6,
"valid_targets_min": 467
},
{
"epoch": 6.972624798711755,
"grad_norm": 0.6418600229930465,
"learning_rate": 2.08948617075988e-09,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15779449045658112,
"step": 4330,
"valid_targets_mean": 3922.4,
"valid_targets_min": 1291
},
{
"epoch": 6.980676328502415,
"grad_norm": 0.5848882869027459,
"learning_rate": 1.0898953840898786e-09,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18286889791488647,
"step": 4335,
"valid_targets_mean": 4633.8,
"valid_targets_min": 695
},
{
"epoch": 6.988727858293076,
"grad_norm": 0.45093430680878505,
"learning_rate": 4.127437763390418e-10,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15890920162200928,
"step": 4340,
"valid_targets_mean": 5343.4,
"valid_targets_min": 2478
},
{
"epoch": 6.996779388083736,
"grad_norm": 0.5378585489037748,
"learning_rate": 5.804226511196831e-11,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15117883682250977,
"step": 4345,
"valid_targets_mean": 3975.8,
"valid_targets_min": 2081
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17696434259414673,
"step": 4347,
"total_flos": 1518375161495552.0,
"train_loss": 0.21155054198480733,
"train_runtime": 25607.106,
"train_samples_per_second": 2.714,
"train_steps_per_second": 0.17,
"valid_targets_mean": 4512.6,
"valid_targets_min": 535
}
],
"logging_steps": 5,
"max_steps": 4347,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1518375161495552.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}