nl2bash-stack-over5050 / trainer_state.json
hf-reset
Reset repository without checkpoints directories
5b8b6f4
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 7161,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.004887585532746823,
"grad_norm": 12.44376256794233,
"learning_rate": 2.2315202231520225e-07,
"loss": 0.775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7660703063011169,
"step": 5,
"valid_targets_mean": 2759.7,
"valid_targets_min": 789
},
{
"epoch": 0.009775171065493646,
"grad_norm": 13.083127751453706,
"learning_rate": 5.020920502092051e-07,
"loss": 0.7585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7838925123214722,
"step": 10,
"valid_targets_mean": 2175.1,
"valid_targets_min": 647
},
{
"epoch": 0.01466275659824047,
"grad_norm": 10.557856263973706,
"learning_rate": 7.810320781032078e-07,
"loss": 0.7713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7736507654190063,
"step": 15,
"valid_targets_mean": 2148.8,
"valid_targets_min": 803
},
{
"epoch": 0.019550342130987292,
"grad_norm": 9.4146088353884,
"learning_rate": 1.0599721059972108e-06,
"loss": 0.7562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7820156812667847,
"step": 20,
"valid_targets_mean": 2958.0,
"valid_targets_min": 945
},
{
"epoch": 0.024437927663734114,
"grad_norm": 8.510426871763977,
"learning_rate": 1.3389121338912134e-06,
"loss": 0.7276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7074830532073975,
"step": 25,
"valid_targets_mean": 2418.9,
"valid_targets_min": 734
},
{
"epoch": 0.02932551319648094,
"grad_norm": 5.967061937258563,
"learning_rate": 1.6178521617852163e-06,
"loss": 0.6946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7003393769264221,
"step": 30,
"valid_targets_mean": 2274.1,
"valid_targets_min": 724
},
{
"epoch": 0.03421309872922776,
"grad_norm": 5.128418930959132,
"learning_rate": 1.8967921896792191e-06,
"loss": 0.6951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6412136554718018,
"step": 35,
"valid_targets_mean": 2286.8,
"valid_targets_min": 1077
},
{
"epoch": 0.039100684261974585,
"grad_norm": 3.685105984706391,
"learning_rate": 2.175732217573222e-06,
"loss": 0.622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6155872344970703,
"step": 40,
"valid_targets_mean": 2433.9,
"valid_targets_min": 635
},
{
"epoch": 0.04398826979472141,
"grad_norm": 3.552082634936528,
"learning_rate": 2.4546722454672246e-06,
"loss": 0.6131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.622800350189209,
"step": 45,
"valid_targets_mean": 2232.9,
"valid_targets_min": 914
},
{
"epoch": 0.04887585532746823,
"grad_norm": 2.6301835879043747,
"learning_rate": 2.7336122733612273e-06,
"loss": 0.5903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.57831209897995,
"step": 50,
"valid_targets_mean": 2736.5,
"valid_targets_min": 1194
},
{
"epoch": 0.053763440860215055,
"grad_norm": 1.939146654771752,
"learning_rate": 3.0125523012552303e-06,
"loss": 0.566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5587443113327026,
"step": 55,
"valid_targets_mean": 2471.7,
"valid_targets_min": 753
},
{
"epoch": 0.05865102639296188,
"grad_norm": 1.3923623066674402,
"learning_rate": 3.2914923291492334e-06,
"loss": 0.5091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5293725728988647,
"step": 60,
"valid_targets_mean": 3486.3,
"valid_targets_min": 1205
},
{
"epoch": 0.0635386119257087,
"grad_norm": 1.2847016539983112,
"learning_rate": 3.570432357043236e-06,
"loss": 0.5174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48333871364593506,
"step": 65,
"valid_targets_mean": 2133.9,
"valid_targets_min": 639
},
{
"epoch": 0.06842619745845552,
"grad_norm": 1.1703945643061187,
"learning_rate": 3.849372384937239e-06,
"loss": 0.4767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47202277183532715,
"step": 70,
"valid_targets_mean": 2432.9,
"valid_targets_min": 820
},
{
"epoch": 0.07331378299120235,
"grad_norm": 1.1061255401631531,
"learning_rate": 4.128312412831242e-06,
"loss": 0.5054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5339841842651367,
"step": 75,
"valid_targets_mean": 2277.9,
"valid_targets_min": 741
},
{
"epoch": 0.07820136852394917,
"grad_norm": 1.1039585723531486,
"learning_rate": 4.407252440725244e-06,
"loss": 0.4741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49983298778533936,
"step": 80,
"valid_targets_mean": 2021.4,
"valid_targets_min": 855
},
{
"epoch": 0.08308895405669599,
"grad_norm": 0.9865369304789178,
"learning_rate": 4.6861924686192475e-06,
"loss": 0.4612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42603811621665955,
"step": 85,
"valid_targets_mean": 2219.6,
"valid_targets_min": 734
},
{
"epoch": 0.08797653958944282,
"grad_norm": 1.071853710354841,
"learning_rate": 4.9651324965132506e-06,
"loss": 0.4694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45195892453193665,
"step": 90,
"valid_targets_mean": 2383.9,
"valid_targets_min": 1015
},
{
"epoch": 0.09286412512218964,
"grad_norm": 0.9176728913117824,
"learning_rate": 5.244072524407254e-06,
"loss": 0.4449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42296427488327026,
"step": 95,
"valid_targets_mean": 2121.6,
"valid_targets_min": 967
},
{
"epoch": 0.09775171065493646,
"grad_norm": 0.9296613279197797,
"learning_rate": 5.523012552301256e-06,
"loss": 0.4326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4197250008583069,
"step": 100,
"valid_targets_mean": 2173.2,
"valid_targets_min": 895
},
{
"epoch": 0.10263929618768329,
"grad_norm": 0.9405388278402095,
"learning_rate": 5.801952580195258e-06,
"loss": 0.4436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4366050362586975,
"step": 105,
"valid_targets_mean": 2097.8,
"valid_targets_min": 816
},
{
"epoch": 0.10752688172043011,
"grad_norm": 0.7924545346293838,
"learning_rate": 6.080892608089262e-06,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4147997796535492,
"step": 110,
"valid_targets_mean": 2730.9,
"valid_targets_min": 955
},
{
"epoch": 0.11241446725317693,
"grad_norm": 0.789932617535872,
"learning_rate": 6.359832635983264e-06,
"loss": 0.4256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4059978723526001,
"step": 115,
"valid_targets_mean": 2887.8,
"valid_targets_min": 1001
},
{
"epoch": 0.11730205278592376,
"grad_norm": 0.8095583193686153,
"learning_rate": 6.6387726638772664e-06,
"loss": 0.4145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4052962064743042,
"step": 120,
"valid_targets_mean": 2514.8,
"valid_targets_min": 847
},
{
"epoch": 0.12218963831867058,
"grad_norm": 0.7949836362164371,
"learning_rate": 6.91771269177127e-06,
"loss": 0.4196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4143103063106537,
"step": 125,
"valid_targets_mean": 2648.2,
"valid_targets_min": 826
},
{
"epoch": 0.1270772238514174,
"grad_norm": 0.799726720099262,
"learning_rate": 7.1966527196652726e-06,
"loss": 0.4221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4228057265281677,
"step": 130,
"valid_targets_mean": 2594.8,
"valid_targets_min": 698
},
{
"epoch": 0.13196480938416422,
"grad_norm": 0.9617534138420096,
"learning_rate": 7.475592747559275e-06,
"loss": 0.4009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42820626497268677,
"step": 135,
"valid_targets_mean": 2055.6,
"valid_targets_min": 632
},
{
"epoch": 0.13685239491691104,
"grad_norm": 0.8348186060833679,
"learning_rate": 7.754532775453279e-06,
"loss": 0.4162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4349338114261627,
"step": 140,
"valid_targets_mean": 2389.0,
"valid_targets_min": 1020
},
{
"epoch": 0.14173998044965788,
"grad_norm": 0.8157340380976558,
"learning_rate": 8.033472803347281e-06,
"loss": 0.4207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42874521017074585,
"step": 145,
"valid_targets_mean": 2644.0,
"valid_targets_min": 684
},
{
"epoch": 0.1466275659824047,
"grad_norm": 0.8180117684614197,
"learning_rate": 8.312412831241283e-06,
"loss": 0.3971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4317898452281952,
"step": 150,
"valid_targets_mean": 2665.6,
"valid_targets_min": 869
},
{
"epoch": 0.15151515151515152,
"grad_norm": 0.8885682855346618,
"learning_rate": 8.591352859135287e-06,
"loss": 0.3854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4081709384918213,
"step": 155,
"valid_targets_mean": 2359.7,
"valid_targets_min": 872
},
{
"epoch": 0.15640273704789834,
"grad_norm": 0.8080583509361516,
"learning_rate": 8.87029288702929e-06,
"loss": 0.3982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.410560667514801,
"step": 160,
"valid_targets_mean": 2443.3,
"valid_targets_min": 650
},
{
"epoch": 0.16129032258064516,
"grad_norm": 1.0075730249123667,
"learning_rate": 9.149232914923292e-06,
"loss": 0.3827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3756175637245178,
"step": 165,
"valid_targets_mean": 2445.9,
"valid_targets_min": 729
},
{
"epoch": 0.16617790811339198,
"grad_norm": 0.7988923971464764,
"learning_rate": 9.428172942817295e-06,
"loss": 0.3902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3763277530670166,
"step": 170,
"valid_targets_mean": 2335.2,
"valid_targets_min": 754
},
{
"epoch": 0.1710654936461388,
"grad_norm": 0.8801234974461333,
"learning_rate": 9.707112970711298e-06,
"loss": 0.4039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4362441897392273,
"step": 175,
"valid_targets_mean": 2604.2,
"valid_targets_min": 722
},
{
"epoch": 0.17595307917888564,
"grad_norm": 1.0573428481191474,
"learning_rate": 9.986052998605302e-06,
"loss": 0.3815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3826301395893097,
"step": 180,
"valid_targets_mean": 1948.0,
"valid_targets_min": 718
},
{
"epoch": 0.18084066471163246,
"grad_norm": 0.8244047729823328,
"learning_rate": 1.0264993026499304e-05,
"loss": 0.3677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3717021346092224,
"step": 185,
"valid_targets_mean": 2318.2,
"valid_targets_min": 868
},
{
"epoch": 0.18572825024437928,
"grad_norm": 0.8733754607654697,
"learning_rate": 1.0543933054393308e-05,
"loss": 0.3875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41147416830062866,
"step": 190,
"valid_targets_mean": 2373.2,
"valid_targets_min": 855
},
{
"epoch": 0.1906158357771261,
"grad_norm": 0.8971397713788575,
"learning_rate": 1.0822873082287308e-05,
"loss": 0.399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4053829312324524,
"step": 195,
"valid_targets_mean": 2233.9,
"valid_targets_min": 731
},
{
"epoch": 0.19550342130987292,
"grad_norm": 1.0257634454527333,
"learning_rate": 1.1101813110181312e-05,
"loss": 0.3825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34646230936050415,
"step": 200,
"valid_targets_mean": 1661.8,
"valid_targets_min": 652
},
{
"epoch": 0.20039100684261973,
"grad_norm": 0.8750695251551033,
"learning_rate": 1.1380753138075316e-05,
"loss": 0.3884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39979293942451477,
"step": 205,
"valid_targets_mean": 2502.0,
"valid_targets_min": 749
},
{
"epoch": 0.20527859237536658,
"grad_norm": 0.8985663536980157,
"learning_rate": 1.1659693165969317e-05,
"loss": 0.3715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3521466553211212,
"step": 210,
"valid_targets_mean": 2193.1,
"valid_targets_min": 1185
},
{
"epoch": 0.2101661779081134,
"grad_norm": 0.8690020156723633,
"learning_rate": 1.193863319386332e-05,
"loss": 0.3906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39606279134750366,
"step": 215,
"valid_targets_mean": 2162.5,
"valid_targets_min": 791
},
{
"epoch": 0.21505376344086022,
"grad_norm": 0.7851411691827029,
"learning_rate": 1.2217573221757324e-05,
"loss": 0.3534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3474773168563843,
"step": 220,
"valid_targets_mean": 2564.4,
"valid_targets_min": 754
},
{
"epoch": 0.21994134897360704,
"grad_norm": 0.8708152091406828,
"learning_rate": 1.2496513249651325e-05,
"loss": 0.3652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3648437261581421,
"step": 225,
"valid_targets_mean": 2014.6,
"valid_targets_min": 544
},
{
"epoch": 0.22482893450635386,
"grad_norm": 0.8997257441861602,
"learning_rate": 1.2775453277545329e-05,
"loss": 0.3817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3548926115036011,
"step": 230,
"valid_targets_mean": 1954.0,
"valid_targets_min": 627
},
{
"epoch": 0.22971652003910067,
"grad_norm": 0.7622734239422039,
"learning_rate": 1.3054393305439333e-05,
"loss": 0.3576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3857002854347229,
"step": 235,
"valid_targets_mean": 2903.6,
"valid_targets_min": 964
},
{
"epoch": 0.23460410557184752,
"grad_norm": 0.8137819570309708,
"learning_rate": 1.3333333333333333e-05,
"loss": 0.367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3650803864002228,
"step": 240,
"valid_targets_mean": 2334.2,
"valid_targets_min": 746
},
{
"epoch": 0.23949169110459434,
"grad_norm": 0.9062648393789453,
"learning_rate": 1.3612273361227337e-05,
"loss": 0.3859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38647863268852234,
"step": 245,
"valid_targets_mean": 2119.2,
"valid_targets_min": 933
},
{
"epoch": 0.24437927663734116,
"grad_norm": 0.8593102670864973,
"learning_rate": 1.3891213389121341e-05,
"loss": 0.3547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32468748092651367,
"step": 250,
"valid_targets_mean": 2219.7,
"valid_targets_min": 807
},
{
"epoch": 0.24926686217008798,
"grad_norm": 1.6459054094057368,
"learning_rate": 1.4170153417015342e-05,
"loss": 0.3763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3920065760612488,
"step": 255,
"valid_targets_mean": 3263.6,
"valid_targets_min": 886
},
{
"epoch": 0.2541544477028348,
"grad_norm": 0.8244627390914492,
"learning_rate": 1.4449093444909346e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3641440272331238,
"step": 260,
"valid_targets_mean": 2413.2,
"valid_targets_min": 819
},
{
"epoch": 0.2590420332355816,
"grad_norm": 0.947648955580425,
"learning_rate": 1.472803347280335e-05,
"loss": 0.3644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3710935413837433,
"step": 265,
"valid_targets_mean": 1834.6,
"valid_targets_min": 668
},
{
"epoch": 0.26392961876832843,
"grad_norm": 0.7479773006623937,
"learning_rate": 1.500697350069735e-05,
"loss": 0.3868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3943009376525879,
"step": 270,
"valid_targets_mean": 2967.0,
"valid_targets_min": 712
},
{
"epoch": 0.26881720430107525,
"grad_norm": 0.6850159478077383,
"learning_rate": 1.5285913528591356e-05,
"loss": 0.357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33576327562332153,
"step": 275,
"valid_targets_mean": 3043.9,
"valid_targets_min": 648
},
{
"epoch": 0.27370478983382207,
"grad_norm": 0.8054999780008923,
"learning_rate": 1.5564853556485358e-05,
"loss": 0.3544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36960098147392273,
"step": 280,
"valid_targets_mean": 2678.3,
"valid_targets_min": 1027
},
{
"epoch": 0.2785923753665689,
"grad_norm": 0.9675054347484953,
"learning_rate": 1.584379358437936e-05,
"loss": 0.378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3982788324356079,
"step": 285,
"valid_targets_mean": 1821.8,
"valid_targets_min": 701
},
{
"epoch": 0.28347996089931576,
"grad_norm": 0.9860609488043531,
"learning_rate": 1.6122733612273362e-05,
"loss": 0.3773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3843904137611389,
"step": 290,
"valid_targets_mean": 2513.7,
"valid_targets_min": 881
},
{
"epoch": 0.2883675464320626,
"grad_norm": 0.991847663374839,
"learning_rate": 1.6401673640167365e-05,
"loss": 0.379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4282916784286499,
"step": 295,
"valid_targets_mean": 2874.1,
"valid_targets_min": 1072
},
{
"epoch": 0.2932551319648094,
"grad_norm": 0.8307727140975414,
"learning_rate": 1.6680613668061367e-05,
"loss": 0.3548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34740254282951355,
"step": 300,
"valid_targets_mean": 2016.8,
"valid_targets_min": 681
},
{
"epoch": 0.2981427174975562,
"grad_norm": 0.7143528489591171,
"learning_rate": 1.6959553695955372e-05,
"loss": 0.3636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.359591007232666,
"step": 305,
"valid_targets_mean": 3070.4,
"valid_targets_min": 774
},
{
"epoch": 0.30303030303030304,
"grad_norm": 0.9089966300203021,
"learning_rate": 1.7238493723849375e-05,
"loss": 0.3498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33375781774520874,
"step": 310,
"valid_targets_mean": 1869.1,
"valid_targets_min": 780
},
{
"epoch": 0.30791788856304986,
"grad_norm": 0.8634809970221224,
"learning_rate": 1.7517433751743377e-05,
"loss": 0.3555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37010622024536133,
"step": 315,
"valid_targets_mean": 2224.5,
"valid_targets_min": 754
},
{
"epoch": 0.3128054740957967,
"grad_norm": 0.8540663264632482,
"learning_rate": 1.779637377963738e-05,
"loss": 0.3515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3211752772331238,
"step": 320,
"valid_targets_mean": 2225.6,
"valid_targets_min": 777
},
{
"epoch": 0.3176930596285435,
"grad_norm": 0.8804814214418613,
"learning_rate": 1.807531380753138e-05,
"loss": 0.3376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35791587829589844,
"step": 325,
"valid_targets_mean": 2065.7,
"valid_targets_min": 548
},
{
"epoch": 0.3225806451612903,
"grad_norm": 0.7640563487552252,
"learning_rate": 1.8354253835425383e-05,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3520016074180603,
"step": 330,
"valid_targets_mean": 2701.5,
"valid_targets_min": 944
},
{
"epoch": 0.32746823069403713,
"grad_norm": 0.7296882324617866,
"learning_rate": 1.863319386331939e-05,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31554561853408813,
"step": 335,
"valid_targets_mean": 3010.9,
"valid_targets_min": 1211
},
{
"epoch": 0.33235581622678395,
"grad_norm": 0.7271443111223936,
"learning_rate": 1.891213389121339e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3308175802230835,
"step": 340,
"valid_targets_mean": 2877.0,
"valid_targets_min": 1375
},
{
"epoch": 0.33724340175953077,
"grad_norm": 0.8360036681979609,
"learning_rate": 1.9191073919107393e-05,
"loss": 0.3671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34241533279418945,
"step": 345,
"valid_targets_mean": 2568.8,
"valid_targets_min": 656
},
{
"epoch": 0.3421309872922776,
"grad_norm": 0.8550409656130434,
"learning_rate": 1.9470013947001396e-05,
"loss": 0.352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3601570427417755,
"step": 350,
"valid_targets_mean": 2331.7,
"valid_targets_min": 679
},
{
"epoch": 0.34701857282502446,
"grad_norm": 0.9155877630691556,
"learning_rate": 1.9748953974895398e-05,
"loss": 0.3635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38951539993286133,
"step": 355,
"valid_targets_mean": 2071.4,
"valid_targets_min": 760
},
{
"epoch": 0.3519061583577713,
"grad_norm": 0.883435595055635,
"learning_rate": 2.0027894002789404e-05,
"loss": 0.36,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3670802414417267,
"step": 360,
"valid_targets_mean": 1985.2,
"valid_targets_min": 592
},
{
"epoch": 0.3567937438905181,
"grad_norm": 0.9206852695774652,
"learning_rate": 2.0306834030683406e-05,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3370826840400696,
"step": 365,
"valid_targets_mean": 2055.2,
"valid_targets_min": 799
},
{
"epoch": 0.3616813294232649,
"grad_norm": 0.7244221713153408,
"learning_rate": 2.0585774058577405e-05,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36608511209487915,
"step": 370,
"valid_targets_mean": 3176.6,
"valid_targets_min": 1237
},
{
"epoch": 0.36656891495601174,
"grad_norm": 0.8515795547939923,
"learning_rate": 2.086471408647141e-05,
"loss": 0.3533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3597974181175232,
"step": 375,
"valid_targets_mean": 2919.8,
"valid_targets_min": 1215
},
{
"epoch": 0.37145650048875856,
"grad_norm": 0.8264921304378712,
"learning_rate": 2.1143654114365412e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.364242821931839,
"step": 380,
"valid_targets_mean": 2541.9,
"valid_targets_min": 763
},
{
"epoch": 0.3763440860215054,
"grad_norm": 0.907898110015603,
"learning_rate": 2.1422594142259415e-05,
"loss": 0.341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32725921273231506,
"step": 385,
"valid_targets_mean": 1902.6,
"valid_targets_min": 464
},
{
"epoch": 0.3812316715542522,
"grad_norm": 0.938573710378532,
"learning_rate": 2.170153417015342e-05,
"loss": 0.3244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34030425548553467,
"step": 390,
"valid_targets_mean": 2139.0,
"valid_targets_min": 627
},
{
"epoch": 0.386119257086999,
"grad_norm": 0.9348906560243034,
"learning_rate": 2.1980474198047422e-05,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3462354838848114,
"step": 395,
"valid_targets_mean": 2194.8,
"valid_targets_min": 738
},
{
"epoch": 0.39100684261974583,
"grad_norm": 0.6752427727321951,
"learning_rate": 2.225941422594142e-05,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33034390211105347,
"step": 400,
"valid_targets_mean": 3065.8,
"valid_targets_min": 796
},
{
"epoch": 0.39589442815249265,
"grad_norm": 0.8105931491656845,
"learning_rate": 2.2538354253835427e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3310199975967407,
"step": 405,
"valid_targets_mean": 2525.2,
"valid_targets_min": 900
},
{
"epoch": 0.40078201368523947,
"grad_norm": 0.8829736004010716,
"learning_rate": 2.281729428172943e-05,
"loss": 0.3529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3105641305446625,
"step": 410,
"valid_targets_mean": 2156.9,
"valid_targets_min": 805
},
{
"epoch": 0.4056695992179863,
"grad_norm": 1.053696655919182,
"learning_rate": 2.309623430962343e-05,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3739250898361206,
"step": 415,
"valid_targets_mean": 2282.6,
"valid_targets_min": 1170
},
{
"epoch": 0.41055718475073316,
"grad_norm": 0.809739823282899,
"learning_rate": 2.3375174337517437e-05,
"loss": 0.3311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35403841733932495,
"step": 420,
"valid_targets_mean": 2249.1,
"valid_targets_min": 698
},
{
"epoch": 0.41544477028348,
"grad_norm": 0.8114625727115713,
"learning_rate": 2.365411436541144e-05,
"loss": 0.3432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3622049391269684,
"step": 425,
"valid_targets_mean": 2313.3,
"valid_targets_min": 766
},
{
"epoch": 0.4203323558162268,
"grad_norm": 0.7569678066302454,
"learning_rate": 2.3933054393305438e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33777353167533875,
"step": 430,
"valid_targets_mean": 2816.7,
"valid_targets_min": 859
},
{
"epoch": 0.4252199413489736,
"grad_norm": 0.7327933630295097,
"learning_rate": 2.4211994421199444e-05,
"loss": 0.3466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3273935317993164,
"step": 435,
"valid_targets_mean": 2645.7,
"valid_targets_min": 1098
},
{
"epoch": 0.43010752688172044,
"grad_norm": 0.8665670559962085,
"learning_rate": 2.4490934449093446e-05,
"loss": 0.3425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3423697054386139,
"step": 440,
"valid_targets_mean": 2181.8,
"valid_targets_min": 604
},
{
"epoch": 0.43499511241446726,
"grad_norm": 0.8580346981985594,
"learning_rate": 2.4769874476987448e-05,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34883952140808105,
"step": 445,
"valid_targets_mean": 2146.7,
"valid_targets_min": 638
},
{
"epoch": 0.4398826979472141,
"grad_norm": 0.8238090290163292,
"learning_rate": 2.5048814504881454e-05,
"loss": 0.3507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31056028604507446,
"step": 450,
"valid_targets_mean": 2293.9,
"valid_targets_min": 943
},
{
"epoch": 0.4447702834799609,
"grad_norm": 0.6463651486346894,
"learning_rate": 2.5327754532775456e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2803493142127991,
"step": 455,
"valid_targets_mean": 2967.7,
"valid_targets_min": 865
},
{
"epoch": 0.4496578690127077,
"grad_norm": 0.941311131272596,
"learning_rate": 2.5606694560669455e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3155880570411682,
"step": 460,
"valid_targets_mean": 1743.8,
"valid_targets_min": 764
},
{
"epoch": 0.45454545454545453,
"grad_norm": 0.736803043029875,
"learning_rate": 2.588563458856346e-05,
"loss": 0.3442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36394965648651123,
"step": 465,
"valid_targets_mean": 2932.3,
"valid_targets_min": 763
},
{
"epoch": 0.45943304007820135,
"grad_norm": 0.7921374525507471,
"learning_rate": 2.6164574616457463e-05,
"loss": 0.328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3570030927658081,
"step": 470,
"valid_targets_mean": 3040.9,
"valid_targets_min": 796
},
{
"epoch": 0.46432062561094817,
"grad_norm": 0.7900857884761241,
"learning_rate": 2.6443514644351465e-05,
"loss": 0.342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37542372941970825,
"step": 475,
"valid_targets_mean": 3116.3,
"valid_targets_min": 926
},
{
"epoch": 0.46920821114369504,
"grad_norm": 1.159582734344674,
"learning_rate": 2.672245467224547e-05,
"loss": 0.3439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36254942417144775,
"step": 480,
"valid_targets_mean": 2185.8,
"valid_targets_min": 713
},
{
"epoch": 0.47409579667644186,
"grad_norm": 0.7897072764788433,
"learning_rate": 2.7001394700139473e-05,
"loss": 0.3372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33607053756713867,
"step": 485,
"valid_targets_mean": 2364.0,
"valid_targets_min": 1086
},
{
"epoch": 0.4789833822091887,
"grad_norm": 0.8400859552438328,
"learning_rate": 2.728033472803347e-05,
"loss": 0.3359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3387121856212616,
"step": 490,
"valid_targets_mean": 2131.7,
"valid_targets_min": 640
},
{
"epoch": 0.4838709677419355,
"grad_norm": 0.7446625512121486,
"learning_rate": 2.7559274755927477e-05,
"loss": 0.334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3753664493560791,
"step": 495,
"valid_targets_mean": 2741.8,
"valid_targets_min": 548
},
{
"epoch": 0.4887585532746823,
"grad_norm": 0.7424189633962999,
"learning_rate": 2.783821478382148e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35922667384147644,
"step": 500,
"valid_targets_mean": 3106.8,
"valid_targets_min": 668
},
{
"epoch": 0.49364613880742914,
"grad_norm": 0.8398560921552762,
"learning_rate": 2.811715481171548e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27231159806251526,
"step": 505,
"valid_targets_mean": 2408.9,
"valid_targets_min": 742
},
{
"epoch": 0.49853372434017595,
"grad_norm": 0.8650127139587513,
"learning_rate": 2.8396094839609487e-05,
"loss": 0.3244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31993523240089417,
"step": 510,
"valid_targets_mean": 2272.2,
"valid_targets_min": 672
},
{
"epoch": 0.5034213098729228,
"grad_norm": 0.8145474264636156,
"learning_rate": 2.867503486750349e-05,
"loss": 0.3321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3184545040130615,
"step": 515,
"valid_targets_mean": 2181.7,
"valid_targets_min": 676
},
{
"epoch": 0.5083088954056696,
"grad_norm": 0.8995961884293948,
"learning_rate": 2.8953974895397488e-05,
"loss": 0.3233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34413954615592957,
"step": 520,
"valid_targets_mean": 2101.1,
"valid_targets_min": 1055
},
{
"epoch": 0.5131964809384164,
"grad_norm": 0.7980166217846976,
"learning_rate": 2.9232914923291494e-05,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3372722864151001,
"step": 525,
"valid_targets_mean": 2395.6,
"valid_targets_min": 1282
},
{
"epoch": 0.5180840664711632,
"grad_norm": 1.1201293160921861,
"learning_rate": 2.9511854951185496e-05,
"loss": 0.323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31446385383605957,
"step": 530,
"valid_targets_mean": 2134.9,
"valid_targets_min": 922
},
{
"epoch": 0.52297165200391,
"grad_norm": 0.7342360486498539,
"learning_rate": 2.9790794979079498e-05,
"loss": 0.3321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30906954407691956,
"step": 535,
"valid_targets_mean": 2658.1,
"valid_targets_min": 1076
},
{
"epoch": 0.5278592375366569,
"grad_norm": 0.7267057803106786,
"learning_rate": 3.0069735006973504e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3381599187850952,
"step": 540,
"valid_targets_mean": 2644.8,
"valid_targets_min": 814
},
{
"epoch": 0.5327468230694037,
"grad_norm": 0.8500045196292703,
"learning_rate": 3.0348675034867506e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29569292068481445,
"step": 545,
"valid_targets_mean": 1866.9,
"valid_targets_min": 530
},
{
"epoch": 0.5376344086021505,
"grad_norm": 0.7412443952817233,
"learning_rate": 3.062761506276151e-05,
"loss": 0.3355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.345531165599823,
"step": 550,
"valid_targets_mean": 2880.6,
"valid_targets_min": 905
},
{
"epoch": 0.5425219941348973,
"grad_norm": 0.6993041939598253,
"learning_rate": 3.0906555090655514e-05,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3102779984474182,
"step": 555,
"valid_targets_mean": 2846.2,
"valid_targets_min": 790
},
{
"epoch": 0.5474095796676441,
"grad_norm": 0.7359314473756243,
"learning_rate": 3.118549511854951e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32391446828842163,
"step": 560,
"valid_targets_mean": 2719.4,
"valid_targets_min": 816
},
{
"epoch": 0.552297165200391,
"grad_norm": 0.8113820976460382,
"learning_rate": 3.146443514644352e-05,
"loss": 0.3409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30669841170310974,
"step": 565,
"valid_targets_mean": 2390.4,
"valid_targets_min": 669
},
{
"epoch": 0.5571847507331378,
"grad_norm": 0.8096140445105596,
"learning_rate": 3.1743375174337524e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3120150566101074,
"step": 570,
"valid_targets_mean": 2190.9,
"valid_targets_min": 739
},
{
"epoch": 0.5620723362658846,
"grad_norm": 0.9110568245840788,
"learning_rate": 3.202231520223152e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3165706992149353,
"step": 575,
"valid_targets_mean": 1853.4,
"valid_targets_min": 722
},
{
"epoch": 0.5669599217986315,
"grad_norm": 0.7684538091148991,
"learning_rate": 3.230125523012553e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2956627607345581,
"step": 580,
"valid_targets_mean": 2559.9,
"valid_targets_min": 987
},
{
"epoch": 0.5718475073313783,
"grad_norm": 0.7441624896883247,
"learning_rate": 3.258019525801953e-05,
"loss": 0.3292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3297075033187866,
"step": 585,
"valid_targets_mean": 2662.0,
"valid_targets_min": 711
},
{
"epoch": 0.5767350928641252,
"grad_norm": 0.8719735596323135,
"learning_rate": 3.285913528591353e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3282514214515686,
"step": 590,
"valid_targets_mean": 2034.2,
"valid_targets_min": 851
},
{
"epoch": 0.581622678396872,
"grad_norm": 0.8090870634352967,
"learning_rate": 3.313807531380754e-05,
"loss": 0.3329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31386953592300415,
"step": 595,
"valid_targets_mean": 2551.9,
"valid_targets_min": 914
},
{
"epoch": 0.5865102639296188,
"grad_norm": 0.7207352022007785,
"learning_rate": 3.341701534170154e-05,
"loss": 0.3237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3386681079864502,
"step": 600,
"valid_targets_mean": 2835.5,
"valid_targets_min": 661
},
{
"epoch": 0.5913978494623656,
"grad_norm": 0.7584008460860305,
"learning_rate": 3.3695955369595536e-05,
"loss": 0.3284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28931134939193726,
"step": 605,
"valid_targets_mean": 2277.4,
"valid_targets_min": 1014
},
{
"epoch": 0.5962854349951124,
"grad_norm": 0.792721139679117,
"learning_rate": 3.397489539748954e-05,
"loss": 0.3312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33046597242355347,
"step": 610,
"valid_targets_mean": 2322.7,
"valid_targets_min": 704
},
{
"epoch": 0.6011730205278593,
"grad_norm": 0.7784271949093392,
"learning_rate": 3.425383542538355e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3591078519821167,
"step": 615,
"valid_targets_mean": 2750.8,
"valid_targets_min": 929
},
{
"epoch": 0.6060606060606061,
"grad_norm": 0.8776498743873912,
"learning_rate": 3.4532775453277546e-05,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33385688066482544,
"step": 620,
"valid_targets_mean": 2140.5,
"valid_targets_min": 642
},
{
"epoch": 0.6109481915933529,
"grad_norm": 0.746820447052271,
"learning_rate": 3.481171548117155e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33402806520462036,
"step": 625,
"valid_targets_mean": 2436.4,
"valid_targets_min": 895
},
{
"epoch": 0.6158357771260997,
"grad_norm": 0.7897960735140778,
"learning_rate": 3.509065550906556e-05,
"loss": 0.3214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31994372606277466,
"step": 630,
"valid_targets_mean": 2388.4,
"valid_targets_min": 915
},
{
"epoch": 0.6207233626588465,
"grad_norm": 0.7255296236144402,
"learning_rate": 3.5369595536959556e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3037095069885254,
"step": 635,
"valid_targets_mean": 2603.6,
"valid_targets_min": 635
},
{
"epoch": 0.6256109481915934,
"grad_norm": 0.8068527468176921,
"learning_rate": 3.564853556485356e-05,
"loss": 0.3123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31424158811569214,
"step": 640,
"valid_targets_mean": 2459.6,
"valid_targets_min": 636
},
{
"epoch": 0.6304985337243402,
"grad_norm": 0.7702625587232006,
"learning_rate": 3.592747559274756e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3524268567562103,
"step": 645,
"valid_targets_mean": 2649.3,
"valid_targets_min": 1140
},
{
"epoch": 0.635386119257087,
"grad_norm": 0.7714466133072925,
"learning_rate": 3.6206415620641566e-05,
"loss": 0.3286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31589627265930176,
"step": 650,
"valid_targets_mean": 2330.5,
"valid_targets_min": 657
},
{
"epoch": 0.6402737047898338,
"grad_norm": 0.7977408416406456,
"learning_rate": 3.648535564853557e-05,
"loss": 0.3244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29703885316848755,
"step": 655,
"valid_targets_mean": 2082.4,
"valid_targets_min": 725
},
{
"epoch": 0.6451612903225806,
"grad_norm": 0.897859600419085,
"learning_rate": 3.676429567642957e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32600027322769165,
"step": 660,
"valid_targets_mean": 2019.0,
"valid_targets_min": 740
},
{
"epoch": 0.6500488758553274,
"grad_norm": 0.8217894407117475,
"learning_rate": 3.704323570432357e-05,
"loss": 0.3197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2989169955253601,
"step": 665,
"valid_targets_mean": 2451.2,
"valid_targets_min": 1105
},
{
"epoch": 0.6549364613880743,
"grad_norm": 0.6967345052464025,
"learning_rate": 3.7322175732217575e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28789329528808594,
"step": 670,
"valid_targets_mean": 2827.7,
"valid_targets_min": 692
},
{
"epoch": 0.6598240469208211,
"grad_norm": 0.730001904109528,
"learning_rate": 3.760111576011158e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31676405668258667,
"step": 675,
"valid_targets_mean": 2389.0,
"valid_targets_min": 660
},
{
"epoch": 0.6647116324535679,
"grad_norm": 0.7898161538858068,
"learning_rate": 3.788005578800558e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29914867877960205,
"step": 680,
"valid_targets_mean": 2101.6,
"valid_targets_min": 894
},
{
"epoch": 0.6695992179863147,
"grad_norm": 0.7857150534119379,
"learning_rate": 3.8158995815899585e-05,
"loss": 0.3295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3327745199203491,
"step": 685,
"valid_targets_mean": 2511.1,
"valid_targets_min": 744
},
{
"epoch": 0.6744868035190615,
"grad_norm": 0.6691932395126847,
"learning_rate": 3.843793584379359e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3309377431869507,
"step": 690,
"valid_targets_mean": 2951.6,
"valid_targets_min": 644
},
{
"epoch": 0.6793743890518084,
"grad_norm": 1.1193866441330809,
"learning_rate": 3.871687587168759e-05,
"loss": 0.3372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36905205249786377,
"step": 695,
"valid_targets_mean": 2194.1,
"valid_targets_min": 818
},
{
"epoch": 0.6842619745845552,
"grad_norm": 0.7857310721423778,
"learning_rate": 3.8995815899581595e-05,
"loss": 0.3273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30003082752227783,
"step": 700,
"valid_targets_mean": 2174.9,
"valid_targets_min": 557
},
{
"epoch": 0.6891495601173021,
"grad_norm": 0.7397963727859,
"learning_rate": 3.9274755927475594e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2808341383934021,
"step": 705,
"valid_targets_mean": 2378.6,
"valid_targets_min": 794
},
{
"epoch": 0.6940371456500489,
"grad_norm": 1.068416619253061,
"learning_rate": 3.95536959553696e-05,
"loss": 0.3241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32398268580436707,
"step": 710,
"valid_targets_mean": 1853.6,
"valid_targets_min": 791
},
{
"epoch": 0.6989247311827957,
"grad_norm": 0.7883949750339846,
"learning_rate": 3.9832635983263605e-05,
"loss": 0.307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3216050863265991,
"step": 715,
"valid_targets_mean": 2201.4,
"valid_targets_min": 661
},
{
"epoch": 0.7038123167155426,
"grad_norm": 0.7210396481396164,
"learning_rate": 3.999999049288738e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32969582080841064,
"step": 720,
"valid_targets_mean": 2724.2,
"valid_targets_min": 572
},
{
"epoch": 0.7086999022482894,
"grad_norm": 0.6780724521617006,
"learning_rate": 3.9999883537974135e-05,
"loss": 0.3123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3392641842365265,
"step": 725,
"valid_targets_mean": 2957.1,
"valid_targets_min": 856
},
{
"epoch": 0.7135874877810362,
"grad_norm": 1.4001056248209713,
"learning_rate": 3.999965774489451e-05,
"loss": 0.3241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31240707635879517,
"step": 730,
"valid_targets_mean": 2448.2,
"valid_targets_min": 740
},
{
"epoch": 0.718475073313783,
"grad_norm": 0.7066267173981833,
"learning_rate": 3.999931311499014e-05,
"loss": 0.2993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2746642827987671,
"step": 735,
"valid_targets_mean": 2677.8,
"valid_targets_min": 1280
},
{
"epoch": 0.7233626588465298,
"grad_norm": 0.9463337394740791,
"learning_rate": 3.999884965030881e-05,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34243521094322205,
"step": 740,
"valid_targets_mean": 1775.4,
"valid_targets_min": 679
},
{
"epoch": 0.7282502443792767,
"grad_norm": 0.7034930040606712,
"learning_rate": 3.9998267353604396e-05,
"loss": 0.3083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3177798390388489,
"step": 745,
"valid_targets_mean": 2800.6,
"valid_targets_min": 920
},
{
"epoch": 0.7331378299120235,
"grad_norm": 0.6916689022053226,
"learning_rate": 3.9997566228336865e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.289054274559021,
"step": 750,
"valid_targets_mean": 2406.8,
"valid_targets_min": 856
},
{
"epoch": 0.7380254154447703,
"grad_norm": 0.7430166452541812,
"learning_rate": 3.999674627867228e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29457688331604004,
"step": 755,
"valid_targets_mean": 2496.6,
"valid_targets_min": 804
},
{
"epoch": 0.7429130009775171,
"grad_norm": 0.7604153844606187,
"learning_rate": 3.9995807509482715e-05,
"loss": 0.3298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37004536390304565,
"step": 760,
"valid_targets_mean": 2459.6,
"valid_targets_min": 910
},
{
"epoch": 0.7478005865102639,
"grad_norm": 0.7783050791408205,
"learning_rate": 3.99947499263463e-05,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26048505306243896,
"step": 765,
"valid_targets_mean": 1702.1,
"valid_targets_min": 641
},
{
"epoch": 0.7526881720430108,
"grad_norm": 0.6842291009472856,
"learning_rate": 3.999357353554712e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2890620529651642,
"step": 770,
"valid_targets_mean": 2460.7,
"valid_targets_min": 741
},
{
"epoch": 0.7575757575757576,
"grad_norm": 0.7667053941772743,
"learning_rate": 3.999227834407523e-05,
"loss": 0.3122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3236725330352783,
"step": 775,
"valid_targets_mean": 2326.1,
"valid_targets_min": 1024
},
{
"epoch": 0.7624633431085044,
"grad_norm": 0.9459473272945332,
"learning_rate": 3.9990864359626586e-05,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2749725580215454,
"step": 780,
"valid_targets_mean": 2354.9,
"valid_targets_min": 914
},
{
"epoch": 0.7673509286412512,
"grad_norm": 0.7184999480991484,
"learning_rate": 3.9989331590603e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3461282253265381,
"step": 785,
"valid_targets_mean": 2811.2,
"valid_targets_min": 725
},
{
"epoch": 0.772238514173998,
"grad_norm": 0.6593556008310089,
"learning_rate": 3.998768004611209e-05,
"loss": 0.3225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35281455516815186,
"step": 790,
"valid_targets_mean": 3194.9,
"valid_targets_min": 1180
},
{
"epoch": 0.7771260997067448,
"grad_norm": 0.7230785157141715,
"learning_rate": 3.998590973596725e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3064287304878235,
"step": 795,
"valid_targets_mean": 2452.0,
"valid_targets_min": 786
},
{
"epoch": 0.7820136852394917,
"grad_norm": 0.6934289312826055,
"learning_rate": 3.998402067068755e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3232996165752411,
"step": 800,
"valid_targets_mean": 2586.8,
"valid_targets_min": 1015
},
{
"epoch": 0.7869012707722385,
"grad_norm": 0.6558930070169424,
"learning_rate": 3.998201286149772e-05,
"loss": 0.3206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33236560225486755,
"step": 805,
"valid_targets_mean": 3404.1,
"valid_targets_min": 660
},
{
"epoch": 0.7917888563049853,
"grad_norm": 0.7295217695663251,
"learning_rate": 3.997988632032805e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3009946346282959,
"step": 810,
"valid_targets_mean": 2459.5,
"valid_targets_min": 970
},
{
"epoch": 0.7966764418377321,
"grad_norm": 0.8584536403730917,
"learning_rate": 3.99776410598143e-05,
"loss": 0.3159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32543686032295227,
"step": 815,
"valid_targets_mean": 2278.4,
"valid_targets_min": 852
},
{
"epoch": 0.8015640273704789,
"grad_norm": 0.7449337414001902,
"learning_rate": 3.997527709329772e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3691062927246094,
"step": 820,
"valid_targets_mean": 2001.3,
"valid_targets_min": 625
},
{
"epoch": 0.8064516129032258,
"grad_norm": 0.7287752989474822,
"learning_rate": 3.997279443482484e-05,
"loss": 0.3146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3165518045425415,
"step": 825,
"valid_targets_mean": 2824.4,
"valid_targets_min": 1123
},
{
"epoch": 0.8113391984359726,
"grad_norm": 0.7414141117963199,
"learning_rate": 3.997019309914747e-05,
"loss": 0.3146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3582077622413635,
"step": 830,
"valid_targets_mean": 2533.0,
"valid_targets_min": 922
},
{
"epoch": 0.8162267839687195,
"grad_norm": 0.6604646667995736,
"learning_rate": 3.996747310172261e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3009747266769409,
"step": 835,
"valid_targets_mean": 2743.4,
"valid_targets_min": 815
},
{
"epoch": 0.8211143695014663,
"grad_norm": 0.7869481152483848,
"learning_rate": 3.996463445871233e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28774186968803406,
"step": 840,
"valid_targets_mean": 2012.9,
"valid_targets_min": 1019
},
{
"epoch": 0.8260019550342131,
"grad_norm": 0.7796967007238236,
"learning_rate": 3.996167718698368e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28823673725128174,
"step": 845,
"valid_targets_mean": 1971.4,
"valid_targets_min": 858
},
{
"epoch": 0.83088954056696,
"grad_norm": 0.7921234290446715,
"learning_rate": 3.9958601304108596e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29436832666397095,
"step": 850,
"valid_targets_mean": 2040.2,
"valid_targets_min": 780
},
{
"epoch": 0.8357771260997068,
"grad_norm": 0.7773209045309674,
"learning_rate": 3.995540682836381e-05,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320604145526886,
"step": 855,
"valid_targets_mean": 2100.3,
"valid_targets_min": 635
},
{
"epoch": 0.8406647116324536,
"grad_norm": 0.7068147985901192,
"learning_rate": 3.99520937787307e-05,
"loss": 0.3111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2897074818611145,
"step": 860,
"valid_targets_mean": 2451.1,
"valid_targets_min": 781
},
{
"epoch": 0.8455522971652004,
"grad_norm": 0.6227835458943253,
"learning_rate": 3.994866217489523e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2862326502799988,
"step": 865,
"valid_targets_mean": 3045.1,
"valid_targets_min": 892
},
{
"epoch": 0.8504398826979472,
"grad_norm": 0.8510089182055716,
"learning_rate": 3.994511203724779e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31772327423095703,
"step": 870,
"valid_targets_mean": 2259.7,
"valid_targets_min": 900
},
{
"epoch": 0.855327468230694,
"grad_norm": 0.7031577446655919,
"learning_rate": 3.9941443386883086e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3305051922798157,
"step": 875,
"valid_targets_mean": 2753.0,
"valid_targets_min": 976
},
{
"epoch": 0.8602150537634409,
"grad_norm": 0.7949638614035321,
"learning_rate": 3.9937656245600044e-05,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3418285846710205,
"step": 880,
"valid_targets_mean": 2385.2,
"valid_targets_min": 804
},
{
"epoch": 0.8651026392961877,
"grad_norm": 0.7305187723607021,
"learning_rate": 3.993375063590164e-05,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128136992454529,
"step": 885,
"valid_targets_mean": 2648.4,
"valid_targets_min": 1208
},
{
"epoch": 0.8699902248289345,
"grad_norm": 1.1746959130401167,
"learning_rate": 3.9929726580994775e-05,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2941882610321045,
"step": 890,
"valid_targets_mean": 2617.6,
"valid_targets_min": 904
},
{
"epoch": 0.8748778103616813,
"grad_norm": 0.7402990200201592,
"learning_rate": 3.992558410479015e-05,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2941339612007141,
"step": 895,
"valid_targets_mean": 2542.5,
"valid_targets_min": 735
},
{
"epoch": 0.8797653958944281,
"grad_norm": 0.7737988843199513,
"learning_rate": 3.992132323190214e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2719045579433441,
"step": 900,
"valid_targets_mean": 1987.3,
"valid_targets_min": 878
},
{
"epoch": 0.884652981427175,
"grad_norm": 0.7582651606562361,
"learning_rate": 3.99169439876486e-05,
"loss": 0.3268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3535369634628296,
"step": 905,
"valid_targets_mean": 2560.1,
"valid_targets_min": 870
},
{
"epoch": 0.8895405669599218,
"grad_norm": 0.7699462585158438,
"learning_rate": 3.991244639805074e-05,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3052283823490143,
"step": 910,
"valid_targets_mean": 2282.6,
"valid_targets_min": 900
},
{
"epoch": 0.8944281524926686,
"grad_norm": 0.7785182577824628,
"learning_rate": 3.9907830489832993e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26899123191833496,
"step": 915,
"valid_targets_mean": 2104.2,
"valid_targets_min": 676
},
{
"epoch": 0.8993157380254154,
"grad_norm": 0.8574210895658473,
"learning_rate": 3.990309629042281e-05,
"loss": 0.3052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2943177819252014,
"step": 920,
"valid_targets_mean": 2444.8,
"valid_targets_min": 1100
},
{
"epoch": 0.9042033235581622,
"grad_norm": 0.7284561255560225,
"learning_rate": 3.989824382795055e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29493361711502075,
"step": 925,
"valid_targets_mean": 2599.8,
"valid_targets_min": 801
},
{
"epoch": 0.9090909090909091,
"grad_norm": 0.6857751641162575,
"learning_rate": 3.989327313124926e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3466421961784363,
"step": 930,
"valid_targets_mean": 2798.0,
"valid_targets_min": 911
},
{
"epoch": 0.9139784946236559,
"grad_norm": 0.7493847771371742,
"learning_rate": 3.9888184229854525e-05,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32370316982269287,
"step": 935,
"valid_targets_mean": 2422.5,
"valid_targets_min": 703
},
{
"epoch": 0.9188660801564027,
"grad_norm": 0.6989351581606708,
"learning_rate": 3.988297715400432e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930717468261719,
"step": 940,
"valid_targets_mean": 2921.4,
"valid_targets_min": 1264
},
{
"epoch": 0.9237536656891495,
"grad_norm": 0.7430743004739445,
"learning_rate": 3.987765193463879e-05,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25492438673973083,
"step": 945,
"valid_targets_mean": 2135.5,
"valid_targets_min": 800
},
{
"epoch": 0.9286412512218963,
"grad_norm": 0.6670033217086339,
"learning_rate": 3.987220860340009e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3239936828613281,
"step": 950,
"valid_targets_mean": 3289.5,
"valid_targets_min": 715
},
{
"epoch": 0.9335288367546432,
"grad_norm": 0.6702989912107715,
"learning_rate": 3.9866647192632176e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33095431327819824,
"step": 955,
"valid_targets_mean": 2921.6,
"valid_targets_min": 1062
},
{
"epoch": 0.9384164222873901,
"grad_norm": 0.6929820388448079,
"learning_rate": 3.986096773538063e-05,
"loss": 0.3096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3430343270301819,
"step": 960,
"valid_targets_mean": 2701.9,
"valid_targets_min": 1179
},
{
"epoch": 0.9433040078201369,
"grad_norm": 0.7185025063166174,
"learning_rate": 3.985517026539247e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29739582538604736,
"step": 965,
"valid_targets_mean": 2256.4,
"valid_targets_min": 980
},
{
"epoch": 0.9481915933528837,
"grad_norm": 0.7330014703291616,
"learning_rate": 3.9849254817115925e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30947941541671753,
"step": 970,
"valid_targets_mean": 2393.1,
"valid_targets_min": 814
},
{
"epoch": 0.9530791788856305,
"grad_norm": 0.692392838579322,
"learning_rate": 3.984322142570026e-05,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2626379728317261,
"step": 975,
"valid_targets_mean": 2232.8,
"valid_targets_min": 854
},
{
"epoch": 0.9579667644183774,
"grad_norm": 0.7858755039683706,
"learning_rate": 3.983707012699554e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31549689173698425,
"step": 980,
"valid_targets_mean": 2162.8,
"valid_targets_min": 967
},
{
"epoch": 0.9628543499511242,
"grad_norm": 1.1798359180734284,
"learning_rate": 3.983080095755242e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30286744236946106,
"step": 985,
"valid_targets_mean": 2232.1,
"valid_targets_min": 612
},
{
"epoch": 0.967741935483871,
"grad_norm": 0.6652279763756077,
"learning_rate": 3.982441395462196e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2915736436843872,
"step": 990,
"valid_targets_mean": 2793.2,
"valid_targets_min": 903
},
{
"epoch": 0.9726295210166178,
"grad_norm": 0.7934359151694675,
"learning_rate": 3.9817909156155364e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128136396408081,
"step": 995,
"valid_targets_mean": 2334.7,
"valid_targets_min": 642
},
{
"epoch": 0.9775171065493646,
"grad_norm": 0.6891936895341518,
"learning_rate": 3.981128660080377e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2969144880771637,
"step": 1000,
"valid_targets_mean": 2541.0,
"valid_targets_min": 634
},
{
"epoch": 0.9824046920821115,
"grad_norm": 0.6463480054438933,
"learning_rate": 3.9804546327918025e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29501742124557495,
"step": 1005,
"valid_targets_mean": 2564.6,
"valid_targets_min": 714
},
{
"epoch": 0.9872922776148583,
"grad_norm": 0.6654896254454947,
"learning_rate": 3.9797688377548443e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30969366431236267,
"step": 1010,
"valid_targets_mean": 3066.6,
"valid_targets_min": 682
},
{
"epoch": 0.9921798631476051,
"grad_norm": 0.6711120956545672,
"learning_rate": 3.979071279044458e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3256608247756958,
"step": 1015,
"valid_targets_mean": 2601.2,
"valid_targets_min": 1157
},
{
"epoch": 0.9970674486803519,
"grad_norm": 0.7414237101887737,
"learning_rate": 3.9783619608054976e-05,
"loss": 0.3275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34451091289520264,
"step": 1020,
"valid_targets_mean": 2595.6,
"valid_targets_min": 1188
},
{
"epoch": 1.0019550342130987,
"grad_norm": 0.6693075231319553,
"learning_rate": 3.977640887252691e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29463478922843933,
"step": 1025,
"valid_targets_mean": 2843.2,
"valid_targets_min": 985
},
{
"epoch": 1.0068426197458455,
"grad_norm": 0.7374854812974025,
"learning_rate": 3.976908062670616e-05,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2664167284965515,
"step": 1030,
"valid_targets_mean": 2574.8,
"valid_targets_min": 1291
},
{
"epoch": 1.0117302052785924,
"grad_norm": 0.7176161611789769,
"learning_rate": 3.976163491413675e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3102620840072632,
"step": 1035,
"valid_targets_mean": 2583.6,
"valid_targets_min": 964
},
{
"epoch": 1.0166177908113392,
"grad_norm": 0.6120097146085149,
"learning_rate": 3.9754071779060674e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29326507449150085,
"step": 1040,
"valid_targets_mean": 3918.3,
"valid_targets_min": 812
},
{
"epoch": 1.021505376344086,
"grad_norm": 0.6381885490796083,
"learning_rate": 3.9746391266417664e-05,
"loss": 0.2767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2916497588157654,
"step": 1045,
"valid_targets_mean": 3250.8,
"valid_targets_min": 672
},
{
"epoch": 1.0263929618768328,
"grad_norm": 0.6912845827934561,
"learning_rate": 3.973859342184487e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3102365732192993,
"step": 1050,
"valid_targets_mean": 3456.9,
"valid_targets_min": 1028
},
{
"epoch": 1.0312805474095796,
"grad_norm": 0.6994698165553925,
"learning_rate": 3.973067829167664e-05,
"loss": 0.2847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2805289030075073,
"step": 1055,
"valid_targets_mean": 2511.4,
"valid_targets_min": 1131
},
{
"epoch": 1.0361681329423265,
"grad_norm": 0.7049190368603762,
"learning_rate": 3.972264592294424e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27423086762428284,
"step": 1060,
"valid_targets_mean": 2325.2,
"valid_targets_min": 617
},
{
"epoch": 1.0410557184750733,
"grad_norm": 0.803585152797481,
"learning_rate": 3.971449636337553e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3054800033569336,
"step": 1065,
"valid_targets_mean": 2130.8,
"valid_targets_min": 633
},
{
"epoch": 1.04594330400782,
"grad_norm": 0.8125386640556346,
"learning_rate": 3.970622966139474e-05,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3040192723274231,
"step": 1070,
"valid_targets_mean": 2165.8,
"valid_targets_min": 726
},
{
"epoch": 1.050830889540567,
"grad_norm": 0.6875765301460454,
"learning_rate": 3.969784586612213e-05,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2739431858062744,
"step": 1075,
"valid_targets_mean": 2306.1,
"valid_targets_min": 750
},
{
"epoch": 1.0557184750733137,
"grad_norm": 0.7590315528229628,
"learning_rate": 3.968934502737375e-05,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28198593854904175,
"step": 1080,
"valid_targets_mean": 2487.6,
"valid_targets_min": 703
},
{
"epoch": 1.0606060606060606,
"grad_norm": 0.767363949833768,
"learning_rate": 3.968072719566108e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2522793114185333,
"step": 1085,
"valid_targets_mean": 1953.9,
"valid_targets_min": 746
},
{
"epoch": 1.0654936461388074,
"grad_norm": 0.763111692809638,
"learning_rate": 3.96719924221908e-05,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31584176421165466,
"step": 1090,
"valid_targets_mean": 2352.2,
"valid_targets_min": 788
},
{
"epoch": 1.0703812316715542,
"grad_norm": 0.7106137161882315,
"learning_rate": 3.966314075886442e-05,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2609940767288208,
"step": 1095,
"valid_targets_mean": 2245.1,
"valid_targets_min": 867
},
{
"epoch": 1.075268817204301,
"grad_norm": 0.8801431366949057,
"learning_rate": 3.9654172258278026e-05,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26888507604599,
"step": 1100,
"valid_targets_mean": 2219.1,
"valid_targets_min": 737
},
{
"epoch": 1.0801564027370478,
"grad_norm": 0.9630113421733234,
"learning_rate": 3.964508697372194e-05,
"loss": 0.2862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2783164083957672,
"step": 1105,
"valid_targets_mean": 2106.6,
"valid_targets_min": 670
},
{
"epoch": 1.0850439882697946,
"grad_norm": 0.7056624571864765,
"learning_rate": 3.96358849591804e-05,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2580503821372986,
"step": 1110,
"valid_targets_mean": 2245.5,
"valid_targets_min": 830
},
{
"epoch": 1.0899315738025415,
"grad_norm": 0.7476404563873276,
"learning_rate": 3.9626566269331254e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25160929560661316,
"step": 1115,
"valid_targets_mean": 2236.5,
"valid_targets_min": 824
},
{
"epoch": 1.0948191593352883,
"grad_norm": 0.7462231828953746,
"learning_rate": 3.9617130959545614e-05,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28869083523750305,
"step": 1120,
"valid_targets_mean": 2205.5,
"valid_targets_min": 548
},
{
"epoch": 1.099706744868035,
"grad_norm": 0.6350210512856392,
"learning_rate": 3.960757908588757e-05,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29355528950691223,
"step": 1125,
"valid_targets_mean": 2905.8,
"valid_targets_min": 990
},
{
"epoch": 1.104594330400782,
"grad_norm": 0.7768451815168522,
"learning_rate": 3.95979107051138e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29628539085388184,
"step": 1130,
"valid_targets_mean": 1995.6,
"valid_targets_min": 796
},
{
"epoch": 1.1094819159335287,
"grad_norm": 0.715701114754943,
"learning_rate": 3.958812587467327e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2757974863052368,
"step": 1135,
"valid_targets_mean": 2513.9,
"valid_targets_min": 795
},
{
"epoch": 1.1143695014662756,
"grad_norm": 0.657177833956688,
"learning_rate": 3.957822465270689e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28396639227867126,
"step": 1140,
"valid_targets_mean": 2740.9,
"valid_targets_min": 1028
},
{
"epoch": 1.1192570869990224,
"grad_norm": 0.7265698253166278,
"learning_rate": 3.9568207098047144e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3029360771179199,
"step": 1145,
"valid_targets_mean": 2664.1,
"valid_targets_min": 1073
},
{
"epoch": 1.1241446725317692,
"grad_norm": 0.6515253109002876,
"learning_rate": 3.9558073270217784e-05,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2731107771396637,
"step": 1150,
"valid_targets_mean": 2830.1,
"valid_targets_min": 815
},
{
"epoch": 1.129032258064516,
"grad_norm": 0.7342300835153387,
"learning_rate": 3.954782322943343e-05,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26124700903892517,
"step": 1155,
"valid_targets_mean": 2346.8,
"valid_targets_min": 728
},
{
"epoch": 1.1339198435972628,
"grad_norm": 0.7264943185964359,
"learning_rate": 3.953745703659924e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29263490438461304,
"step": 1160,
"valid_targets_mean": 2200.6,
"valid_targets_min": 912
},
{
"epoch": 1.1388074291300097,
"grad_norm": 0.7531165993253246,
"learning_rate": 3.952697475331054e-05,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2604370415210724,
"step": 1165,
"valid_targets_mean": 1966.1,
"valid_targets_min": 810
},
{
"epoch": 1.1436950146627567,
"grad_norm": 0.5807064795538424,
"learning_rate": 3.951637644185245e-05,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2689421474933624,
"step": 1170,
"valid_targets_mean": 3077.1,
"valid_targets_min": 663
},
{
"epoch": 1.1485826001955035,
"grad_norm": 0.7320623987196705,
"learning_rate": 3.9505662165199546e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2726061940193176,
"step": 1175,
"valid_targets_mean": 2399.1,
"valid_targets_min": 953
},
{
"epoch": 1.1534701857282503,
"grad_norm": 0.718063434455999,
"learning_rate": 3.949483198701544e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2901926040649414,
"step": 1180,
"valid_targets_mean": 1989.6,
"valid_targets_min": 467
},
{
"epoch": 1.1583577712609971,
"grad_norm": 0.7091718018989998,
"learning_rate": 3.948388597165244e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2814217805862427,
"step": 1185,
"valid_targets_mean": 2682.6,
"valid_targets_min": 977
},
{
"epoch": 1.163245356793744,
"grad_norm": 0.7198188497547705,
"learning_rate": 3.947282418415114e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26243048906326294,
"step": 1190,
"valid_targets_mean": 2464.7,
"valid_targets_min": 1207
},
{
"epoch": 1.1681329423264908,
"grad_norm": 0.8032209187501614,
"learning_rate": 3.946164669024005e-05,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2906745374202728,
"step": 1195,
"valid_targets_mean": 2152.6,
"valid_targets_min": 1274
},
{
"epoch": 1.1730205278592376,
"grad_norm": 0.69719975762219,
"learning_rate": 3.945035355633519e-05,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29841500520706177,
"step": 1200,
"valid_targets_mean": 2345.9,
"valid_targets_min": 886
},
{
"epoch": 1.1779081133919844,
"grad_norm": 0.6974558842300727,
"learning_rate": 3.943894484953974e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29451218247413635,
"step": 1205,
"valid_targets_mean": 2422.9,
"valid_targets_min": 512
},
{
"epoch": 1.1827956989247312,
"grad_norm": 0.7729057032255819,
"learning_rate": 3.9427420637643566e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30238640308380127,
"step": 1210,
"valid_targets_mean": 2235.3,
"valid_targets_min": 1257
},
{
"epoch": 1.187683284457478,
"grad_norm": 0.7935199270678439,
"learning_rate": 3.941578098912288e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25925132632255554,
"step": 1215,
"valid_targets_mean": 1819.3,
"valid_targets_min": 868
},
{
"epoch": 1.1925708699902249,
"grad_norm": 0.7190594576509517,
"learning_rate": 3.940402597313982e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30240678787231445,
"step": 1220,
"valid_targets_mean": 2756.8,
"valid_targets_min": 513
},
{
"epoch": 1.1974584555229717,
"grad_norm": 0.6468704089059654,
"learning_rate": 3.939215565954201e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27174267172813416,
"step": 1225,
"valid_targets_mean": 2537.5,
"valid_targets_min": 842
},
{
"epoch": 1.2023460410557185,
"grad_norm": 0.6638979450727887,
"learning_rate": 3.938017011886217e-05,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25439706444740295,
"step": 1230,
"valid_targets_mean": 2504.9,
"valid_targets_min": 857
},
{
"epoch": 1.2072336265884653,
"grad_norm": 0.7494764475924144,
"learning_rate": 3.936806942231772e-05,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2995947003364563,
"step": 1235,
"valid_targets_mean": 2547.0,
"valid_targets_min": 667
},
{
"epoch": 1.2121212121212122,
"grad_norm": 0.7304687661971925,
"learning_rate": 3.9355853641810286e-05,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.266486793756485,
"step": 1240,
"valid_targets_mean": 2214.6,
"valid_targets_min": 309
},
{
"epoch": 1.217008797653959,
"grad_norm": 0.7022740270462892,
"learning_rate": 3.9343522849925355e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25830769538879395,
"step": 1245,
"valid_targets_mean": 2205.6,
"valid_targets_min": 728
},
{
"epoch": 1.2218963831867058,
"grad_norm": 0.6749560565367534,
"learning_rate": 3.933107711993177e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3063586354255676,
"step": 1250,
"valid_targets_mean": 2899.1,
"valid_targets_min": 1467
},
{
"epoch": 1.2267839687194526,
"grad_norm": 0.640174555103181,
"learning_rate": 3.931851652578137e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26264217495918274,
"step": 1255,
"valid_targets_mean": 2715.5,
"valid_targets_min": 765
},
{
"epoch": 1.2316715542521994,
"grad_norm": 0.7175756349653029,
"learning_rate": 3.930584114210847e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2843489348888397,
"step": 1260,
"valid_targets_mean": 2394.0,
"valid_targets_min": 1130
},
{
"epoch": 1.2365591397849462,
"grad_norm": 0.6471066400554928,
"learning_rate": 3.929305104422949e-05,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25573495030403137,
"step": 1265,
"valid_targets_mean": 2673.3,
"valid_targets_min": 859
},
{
"epoch": 1.241446725317693,
"grad_norm": 0.7057472774221171,
"learning_rate": 3.928014630814245e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29683718085289,
"step": 1270,
"valid_targets_mean": 2584.6,
"valid_targets_min": 704
},
{
"epoch": 1.2463343108504399,
"grad_norm": 0.7027021456995992,
"learning_rate": 3.926712701052656e-05,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23105719685554504,
"step": 1275,
"valid_targets_mean": 2057.8,
"valid_targets_min": 548
},
{
"epoch": 1.2512218963831867,
"grad_norm": 0.8306679586454391,
"learning_rate": 3.925399322874175e-05,
"loss": 0.2842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2782430350780487,
"step": 1280,
"valid_targets_mean": 1920.4,
"valid_targets_min": 782
},
{
"epoch": 1.2561094819159335,
"grad_norm": 0.6271862299342814,
"learning_rate": 3.9240745040828196e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2829798460006714,
"step": 1285,
"valid_targets_mean": 3158.1,
"valid_targets_min": 807
},
{
"epoch": 1.2609970674486803,
"grad_norm": 0.7221564579455654,
"learning_rate": 3.922738252550587e-05,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2566811740398407,
"step": 1290,
"valid_targets_mean": 2186.9,
"valid_targets_min": 659
},
{
"epoch": 1.2658846529814272,
"grad_norm": 0.7065825530165445,
"learning_rate": 3.921390576217408e-05,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27165934443473816,
"step": 1295,
"valid_targets_mean": 2100.2,
"valid_targets_min": 698
},
{
"epoch": 1.270772238514174,
"grad_norm": 0.9761318767014419,
"learning_rate": 3.9200314830910986e-05,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2744409441947937,
"step": 1300,
"valid_targets_mean": 1900.2,
"valid_targets_min": 668
},
{
"epoch": 1.2756598240469208,
"grad_norm": 0.8388053078423351,
"learning_rate": 3.918660981247312e-05,
"loss": 0.2735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2818601727485657,
"step": 1305,
"valid_targets_mean": 1785.4,
"valid_targets_min": 769
},
{
"epoch": 1.2805474095796676,
"grad_norm": 0.613252199578922,
"learning_rate": 3.9172790788294924e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25405043363571167,
"step": 1310,
"valid_targets_mean": 2779.4,
"valid_targets_min": 875
},
{
"epoch": 1.2854349951124144,
"grad_norm": 0.702566015145273,
"learning_rate": 3.9158857840488253e-05,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2808951437473297,
"step": 1315,
"valid_targets_mean": 2675.1,
"valid_targets_min": 770
},
{
"epoch": 1.2903225806451613,
"grad_norm": 0.7219389062248595,
"learning_rate": 3.914481105184188e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27677303552627563,
"step": 1320,
"valid_targets_mean": 2169.5,
"valid_targets_min": 789
},
{
"epoch": 1.295210166177908,
"grad_norm": 0.6230877367684657,
"learning_rate": 3.913065050582103e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2999587059020996,
"step": 1325,
"valid_targets_mean": 3419.2,
"valid_targets_min": 722
},
{
"epoch": 1.300097751710655,
"grad_norm": 0.6833998876959554,
"learning_rate": 3.911637628656685e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252625048160553,
"step": 1330,
"valid_targets_mean": 2527.4,
"valid_targets_min": 849
},
{
"epoch": 1.3049853372434017,
"grad_norm": 0.7469165884381328,
"learning_rate": 3.910198847889595e-05,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2838708162307739,
"step": 1335,
"valid_targets_mean": 2485.5,
"valid_targets_min": 622
},
{
"epoch": 1.3098729227761485,
"grad_norm": 0.6617163563012934,
"learning_rate": 3.908748716829984e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29781484603881836,
"step": 1340,
"valid_targets_mean": 3058.6,
"valid_targets_min": 961
},
{
"epoch": 1.3147605083088953,
"grad_norm": 0.6917934222962383,
"learning_rate": 3.90728724409445e-05,
"loss": 0.2703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23285894095897675,
"step": 1345,
"valid_targets_mean": 2165.1,
"valid_targets_min": 689
},
{
"epoch": 1.3196480938416422,
"grad_norm": 0.8112229286729639,
"learning_rate": 3.90581443836698e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2841215133666992,
"step": 1350,
"valid_targets_mean": 2388.8,
"valid_targets_min": 972
},
{
"epoch": 1.324535679374389,
"grad_norm": 0.7050055286781818,
"learning_rate": 3.9043303083989e-05,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2793377935886383,
"step": 1355,
"valid_targets_mean": 2531.8,
"valid_targets_min": 839
},
{
"epoch": 1.3294232649071358,
"grad_norm": 0.7692436746915501,
"learning_rate": 3.9028348630088285e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29042643308639526,
"step": 1360,
"valid_targets_mean": 2408.2,
"valid_targets_min": 972
},
{
"epoch": 1.3343108504398826,
"grad_norm": 0.7453876083199784,
"learning_rate": 3.9013281110826146e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25248265266418457,
"step": 1365,
"valid_targets_mean": 2040.0,
"valid_targets_min": 996
},
{
"epoch": 1.3391984359726294,
"grad_norm": 0.6300162995824621,
"learning_rate": 3.899810061573293e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27708175778388977,
"step": 1370,
"valid_targets_mean": 2868.4,
"valid_targets_min": 1109
},
{
"epoch": 1.3440860215053765,
"grad_norm": 0.6688370034426764,
"learning_rate": 3.898280723501027e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2765743136405945,
"step": 1375,
"valid_targets_mean": 2953.6,
"valid_targets_min": 960
},
{
"epoch": 1.3489736070381233,
"grad_norm": 0.6214024065518173,
"learning_rate": 3.896740105953056e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2931886911392212,
"step": 1380,
"valid_targets_mean": 3082.7,
"valid_targets_min": 1298
},
{
"epoch": 1.3538611925708701,
"grad_norm": 0.6750814309638632,
"learning_rate": 3.895188218083641e-05,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23927871882915497,
"step": 1385,
"valid_targets_mean": 2085.7,
"valid_targets_min": 605
},
{
"epoch": 1.358748778103617,
"grad_norm": 1.0887637501386116,
"learning_rate": 3.893625069114013e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28028884530067444,
"step": 1390,
"valid_targets_mean": 2176.3,
"valid_targets_min": 999
},
{
"epoch": 1.3636363636363638,
"grad_norm": 0.773730842008043,
"learning_rate": 3.892050668332312e-05,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27753153443336487,
"step": 1395,
"valid_targets_mean": 2301.8,
"valid_targets_min": 816
},
{
"epoch": 1.3685239491691106,
"grad_norm": 0.7189179648090815,
"learning_rate": 3.890465025093538e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30436086654663086,
"step": 1400,
"valid_targets_mean": 2609.4,
"valid_targets_min": 869
},
{
"epoch": 1.3734115347018574,
"grad_norm": 0.6426850788526689,
"learning_rate": 3.8888681488194934e-05,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3102635145187378,
"step": 1405,
"valid_targets_mean": 3093.6,
"valid_targets_min": 1107
},
{
"epoch": 1.3782991202346042,
"grad_norm": 0.734389179384258,
"learning_rate": 3.887260048998726e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2662855386734009,
"step": 1410,
"valid_targets_mean": 2011.6,
"valid_targets_min": 684
},
{
"epoch": 1.383186705767351,
"grad_norm": 0.6225396878904635,
"learning_rate": 3.885640735186472e-05,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2845187783241272,
"step": 1415,
"valid_targets_mean": 3417.9,
"valid_targets_min": 1093
},
{
"epoch": 1.3880742913000979,
"grad_norm": 0.789834712593994,
"learning_rate": 3.884010217004601e-05,
"loss": 0.2823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29228654503822327,
"step": 1420,
"valid_targets_mean": 2669.8,
"valid_targets_min": 1027
},
{
"epoch": 1.3929618768328447,
"grad_norm": 0.7464915480075731,
"learning_rate": 3.882368504141562e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28257280588150024,
"step": 1425,
"valid_targets_mean": 2574.6,
"valid_targets_min": 1474
},
{
"epoch": 1.3978494623655915,
"grad_norm": 0.7059861573051313,
"learning_rate": 3.8807156063523164e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2998770475387573,
"step": 1430,
"valid_targets_mean": 2475.3,
"valid_targets_min": 570
},
{
"epoch": 1.4027370478983383,
"grad_norm": 0.6645964659054957,
"learning_rate": 3.879051533458289e-05,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769964933395386,
"step": 1435,
"valid_targets_mean": 2476.9,
"valid_targets_min": 657
},
{
"epoch": 1.4076246334310851,
"grad_norm": 0.7558136295073548,
"learning_rate": 3.8773762953473066e-05,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2779275178909302,
"step": 1440,
"valid_targets_mean": 1848.9,
"valid_targets_min": 762
},
{
"epoch": 1.412512218963832,
"grad_norm": 0.6943029966676353,
"learning_rate": 3.8756899019735385e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2840909957885742,
"step": 1445,
"valid_targets_mean": 2471.9,
"valid_targets_min": 772
},
{
"epoch": 1.4173998044965788,
"grad_norm": 0.6342596835576019,
"learning_rate": 3.873992363357437e-05,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2653612196445465,
"step": 1450,
"valid_targets_mean": 2900.2,
"valid_targets_min": 1140
},
{
"epoch": 1.4222873900293256,
"grad_norm": 0.579209777162739,
"learning_rate": 3.8722836895856814e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24776488542556763,
"step": 1455,
"valid_targets_mean": 2874.0,
"valid_targets_min": 632
},
{
"epoch": 1.4271749755620724,
"grad_norm": 0.6564233693786774,
"learning_rate": 3.870563890811111e-05,
"loss": 0.2847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3028268814086914,
"step": 1460,
"valid_targets_mean": 3045.8,
"valid_targets_min": 891
},
{
"epoch": 1.4320625610948192,
"grad_norm": 0.6629636773046359,
"learning_rate": 3.868832977252675e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27365946769714355,
"step": 1465,
"valid_targets_mean": 2735.8,
"valid_targets_min": 799
},
{
"epoch": 1.436950146627566,
"grad_norm": 0.6785573010408985,
"learning_rate": 3.86709095919536e-05,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2917429804801941,
"step": 1470,
"valid_targets_mean": 2449.4,
"valid_targets_min": 756
},
{
"epoch": 1.4418377321603129,
"grad_norm": 0.6465288698245589,
"learning_rate": 3.86533784699014e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25123557448387146,
"step": 1475,
"valid_targets_mean": 2389.1,
"valid_targets_min": 696
},
{
"epoch": 1.4467253176930597,
"grad_norm": 0.7015331893695984,
"learning_rate": 3.8635736510539065e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2667387127876282,
"step": 1480,
"valid_targets_mean": 2461.5,
"valid_targets_min": 717
},
{
"epoch": 1.4516129032258065,
"grad_norm": 0.7629144665484076,
"learning_rate": 3.861798381869412e-05,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29424476623535156,
"step": 1485,
"valid_targets_mean": 2159.1,
"valid_targets_min": 763
},
{
"epoch": 1.4565004887585533,
"grad_norm": 0.752596217358227,
"learning_rate": 3.860012049985204e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25024765729904175,
"step": 1490,
"valid_targets_mean": 1827.2,
"valid_targets_min": 888
},
{
"epoch": 1.4613880742913001,
"grad_norm": 0.700994546408206,
"learning_rate": 3.858214666015565e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29054421186447144,
"step": 1495,
"valid_targets_mean": 2365.5,
"valid_targets_min": 695
},
{
"epoch": 1.466275659824047,
"grad_norm": 0.7116021660360209,
"learning_rate": 3.856406240640448e-05,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2625944912433624,
"step": 1500,
"valid_targets_mean": 2130.0,
"valid_targets_min": 684
},
{
"epoch": 1.4711632453567938,
"grad_norm": 0.7684258462239429,
"learning_rate": 3.8545867846054126e-05,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2951001524925232,
"step": 1505,
"valid_targets_mean": 2052.4,
"valid_targets_min": 1064
},
{
"epoch": 1.4760508308895406,
"grad_norm": 0.6507083544953332,
"learning_rate": 3.8527563087215634e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2922488749027252,
"step": 1510,
"valid_targets_mean": 2769.5,
"valid_targets_min": 843
},
{
"epoch": 1.4809384164222874,
"grad_norm": 0.7751727870506968,
"learning_rate": 3.8509148238654824e-05,
"loss": 0.2716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24178072810173035,
"step": 1515,
"valid_targets_mean": 1849.9,
"valid_targets_min": 780
},
{
"epoch": 1.4858260019550342,
"grad_norm": 0.5854852127584044,
"learning_rate": 3.84906234097917e-05,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27021411061286926,
"step": 1520,
"valid_targets_mean": 3099.3,
"valid_targets_min": 1029
},
{
"epoch": 1.490713587487781,
"grad_norm": 0.6358169347672091,
"learning_rate": 3.8471988710699715e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26537126302719116,
"step": 1525,
"valid_targets_mean": 2957.4,
"valid_targets_min": 802
},
{
"epoch": 1.4956011730205279,
"grad_norm": 0.6204632468552115,
"learning_rate": 3.8453244252105194e-05,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769279181957245,
"step": 1530,
"valid_targets_mean": 3130.9,
"valid_targets_min": 737
},
{
"epoch": 1.5004887585532747,
"grad_norm": 0.6411624274507086,
"learning_rate": 3.843439014538664e-05,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26065292954444885,
"step": 1535,
"valid_targets_mean": 2861.7,
"valid_targets_min": 1023
},
{
"epoch": 1.5053763440860215,
"grad_norm": 0.7050285259422795,
"learning_rate": 3.841542650257408e-05,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24625875055789948,
"step": 1540,
"valid_targets_mean": 2171.6,
"valid_targets_min": 1054
},
{
"epoch": 1.5102639296187683,
"grad_norm": 0.7521045411153422,
"learning_rate": 3.83963534363484e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3168919086456299,
"step": 1545,
"valid_targets_mean": 2370.8,
"valid_targets_min": 842
},
{
"epoch": 1.5151515151515151,
"grad_norm": 0.7217702499392185,
"learning_rate": 3.8377171060040666e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27114635705947876,
"step": 1550,
"valid_targets_mean": 2131.9,
"valid_targets_min": 783
},
{
"epoch": 1.520039100684262,
"grad_norm": 0.7137936454079413,
"learning_rate": 3.835787948763147e-05,
"loss": 0.2767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25275540351867676,
"step": 1555,
"valid_targets_mean": 2113.8,
"valid_targets_min": 748
},
{
"epoch": 1.5249266862170088,
"grad_norm": 0.9545717948909013,
"learning_rate": 3.833847883375022e-05,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2564704716205597,
"step": 1560,
"valid_targets_mean": 2187.5,
"valid_targets_min": 739
},
{
"epoch": 1.5298142717497556,
"grad_norm": 0.7470839745811981,
"learning_rate": 3.831896921367451e-05,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2791537940502167,
"step": 1565,
"valid_targets_mean": 1975.1,
"valid_targets_min": 686
},
{
"epoch": 1.5347018572825024,
"grad_norm": 0.7647266073732814,
"learning_rate": 3.829935074332938e-05,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24994492530822754,
"step": 1570,
"valid_targets_mean": 2233.8,
"valid_targets_min": 837
},
{
"epoch": 1.5395894428152492,
"grad_norm": 0.7045036581823351,
"learning_rate": 3.827962353928667e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26855552196502686,
"step": 1575,
"valid_targets_mean": 2261.9,
"valid_targets_min": 763
},
{
"epoch": 1.544477028347996,
"grad_norm": 0.7143743531724757,
"learning_rate": 3.825978771876428e-05,
"loss": 0.2873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018741011619568,
"step": 1580,
"valid_targets_mean": 2336.8,
"valid_targets_min": 663
},
{
"epoch": 1.5493646138807429,
"grad_norm": 0.6475010659041159,
"learning_rate": 3.823984339962554e-05,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29907166957855225,
"step": 1585,
"valid_targets_mean": 2830.2,
"valid_targets_min": 732
},
{
"epoch": 1.5542521994134897,
"grad_norm": 0.6898759516125273,
"learning_rate": 3.821979070037846e-05,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2999107241630554,
"step": 1590,
"valid_targets_mean": 2604.1,
"valid_targets_min": 631
},
{
"epoch": 1.5591397849462365,
"grad_norm": 0.6572278395987295,
"learning_rate": 3.8199629740175017e-05,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2730094790458679,
"step": 1595,
"valid_targets_mean": 2485.9,
"valid_targets_min": 804
},
{
"epoch": 1.5640273704789833,
"grad_norm": 0.7008441805523876,
"learning_rate": 3.8179360638810503e-05,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2944326102733612,
"step": 1600,
"valid_targets_mean": 2188.3,
"valid_targets_min": 669
},
{
"epoch": 1.5689149560117301,
"grad_norm": 0.5571584829883734,
"learning_rate": 3.815898351672275e-05,
"loss": 0.2667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22917650640010834,
"step": 1605,
"valid_targets_mean": 3037.3,
"valid_targets_min": 765
},
{
"epoch": 1.573802541544477,
"grad_norm": 0.7410724781542547,
"learning_rate": 3.813849849499146e-05,
"loss": 0.2616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24475133419036865,
"step": 1610,
"valid_targets_mean": 1836.8,
"valid_targets_min": 741
},
{
"epoch": 1.5786901270772238,
"grad_norm": 0.7170995982719762,
"learning_rate": 3.811790569533746e-05,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2909032106399536,
"step": 1615,
"valid_targets_mean": 2271.4,
"valid_targets_min": 689
},
{
"epoch": 1.5835777126099706,
"grad_norm": 0.7023440780016095,
"learning_rate": 3.8097205240121994e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3244866132736206,
"step": 1620,
"valid_targets_mean": 2630.7,
"valid_targets_min": 752
},
{
"epoch": 1.5884652981427174,
"grad_norm": 0.7145272097523425,
"learning_rate": 3.807639725234598e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28274455666542053,
"step": 1625,
"valid_targets_mean": 2337.7,
"valid_targets_min": 1045
},
{
"epoch": 1.5933528836754642,
"grad_norm": 0.6483060882499405,
"learning_rate": 3.8055481855649295e-05,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898852825164795,
"step": 1630,
"valid_targets_mean": 2868.5,
"valid_targets_min": 1718
},
{
"epoch": 1.598240469208211,
"grad_norm": 0.6154123007304795,
"learning_rate": 3.8034459174310034e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24204128980636597,
"step": 1635,
"valid_targets_mean": 2880.8,
"valid_targets_min": 791
},
{
"epoch": 1.6031280547409579,
"grad_norm": 0.7242965707991273,
"learning_rate": 3.8013329333243765e-05,
"loss": 0.2746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3221800923347473,
"step": 1640,
"valid_targets_mean": 2574.4,
"valid_targets_min": 836
},
{
"epoch": 1.6080156402737047,
"grad_norm": 0.8256849875812563,
"learning_rate": 3.7992092458002813e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2468244880437851,
"step": 1645,
"valid_targets_mean": 2232.7,
"valid_targets_min": 659
},
{
"epoch": 1.6129032258064515,
"grad_norm": 0.8957983328042407,
"learning_rate": 3.797074867477545e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2847079038619995,
"step": 1650,
"valid_targets_mean": 1988.9,
"valid_targets_min": 1107
},
{
"epoch": 1.6177908113391983,
"grad_norm": 0.7320454198900345,
"learning_rate": 3.794929811038525e-05,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25967937707901,
"step": 1655,
"valid_targets_mean": 2044.0,
"valid_targets_min": 732
},
{
"epoch": 1.6226783968719452,
"grad_norm": 0.7944386390316857,
"learning_rate": 3.7927740892290225e-05,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29300451278686523,
"step": 1660,
"valid_targets_mean": 1941.6,
"valid_targets_min": 584
},
{
"epoch": 1.627565982404692,
"grad_norm": 0.7033843489197059,
"learning_rate": 3.790607714858213e-05,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27778416872024536,
"step": 1665,
"valid_targets_mean": 2372.6,
"valid_targets_min": 625
},
{
"epoch": 1.6324535679374388,
"grad_norm": 0.713583282306689,
"learning_rate": 3.78843070079857e-05,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2961004972457886,
"step": 1670,
"valid_targets_mean": 2199.5,
"valid_targets_min": 867
},
{
"epoch": 1.6373411534701856,
"grad_norm": 0.6811625348127058,
"learning_rate": 3.786243059985787e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24486398696899414,
"step": 1675,
"valid_targets_mean": 2072.9,
"valid_targets_min": 739
},
{
"epoch": 1.6422287390029324,
"grad_norm": 0.6214013174128027,
"learning_rate": 3.7840448054187004e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2856760323047638,
"step": 1680,
"valid_targets_mean": 2886.9,
"valid_targets_min": 868
},
{
"epoch": 1.6471163245356792,
"grad_norm": 0.6763894621818294,
"learning_rate": 3.781835950159214e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2664475739002228,
"step": 1685,
"valid_targets_mean": 2352.6,
"valid_targets_min": 647
},
{
"epoch": 1.652003910068426,
"grad_norm": 0.7476808183243178,
"learning_rate": 3.7796165073322194e-05,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24394232034683228,
"step": 1690,
"valid_targets_mean": 1998.0,
"valid_targets_min": 857
},
{
"epoch": 1.6568914956011729,
"grad_norm": 0.6654065406280266,
"learning_rate": 3.777386490125518e-05,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2673056721687317,
"step": 1695,
"valid_targets_mean": 2774.7,
"valid_targets_min": 941
},
{
"epoch": 1.6617790811339197,
"grad_norm": 1.0447139479563154,
"learning_rate": 3.7751459117897466e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29265016317367554,
"step": 1700,
"valid_targets_mean": 2134.6,
"valid_targets_min": 856
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.6756696155203493,
"learning_rate": 3.772894785638292e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29080730676651,
"step": 1705,
"valid_targets_mean": 2770.5,
"valid_targets_min": 1168
},
{
"epoch": 1.6715542521994133,
"grad_norm": 0.6063804591260533,
"learning_rate": 3.770633125047219e-05,
"loss": 0.2756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29159295558929443,
"step": 1710,
"valid_targets_mean": 3060.3,
"valid_targets_min": 1237
},
{
"epoch": 1.6764418377321602,
"grad_norm": 0.7088620832664758,
"learning_rate": 3.768360943455185e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26422443985939026,
"step": 1715,
"valid_targets_mean": 2225.6,
"valid_targets_min": 727
},
{
"epoch": 1.681329423264907,
"grad_norm": 0.8121289862781522,
"learning_rate": 3.7660782543633634e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.271615207195282,
"step": 1720,
"valid_targets_mean": 2280.4,
"valid_targets_min": 639
},
{
"epoch": 1.6862170087976538,
"grad_norm": 0.6721466708752135,
"learning_rate": 3.763785071335362e-05,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2757419943809509,
"step": 1725,
"valid_targets_mean": 2551.2,
"valid_targets_min": 1072
},
{
"epoch": 1.6911045943304008,
"grad_norm": 0.7511340865178172,
"learning_rate": 3.761481407997144e-05,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3051798939704895,
"step": 1730,
"valid_targets_mean": 2232.9,
"valid_targets_min": 884
},
{
"epoch": 1.6959921798631477,
"grad_norm": 0.7709735641548016,
"learning_rate": 3.759167278036945e-05,
"loss": 0.2687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28466472029685974,
"step": 1735,
"valid_targets_mean": 2116.8,
"valid_targets_min": 746
},
{
"epoch": 1.7008797653958945,
"grad_norm": 0.6541200445160277,
"learning_rate": 3.7568426952051936e-05,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24498885869979858,
"step": 1740,
"valid_targets_mean": 2278.2,
"valid_targets_min": 615
},
{
"epoch": 1.7057673509286413,
"grad_norm": 0.8540951314910903,
"learning_rate": 3.754507673314429e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2802680730819702,
"step": 1745,
"valid_targets_mean": 2895.8,
"valid_targets_min": 834
},
{
"epoch": 1.710654936461388,
"grad_norm": 0.6993627250812203,
"learning_rate": 3.752162226239216e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2634274363517761,
"step": 1750,
"valid_targets_mean": 2296.5,
"valid_targets_min": 641
},
{
"epoch": 1.715542521994135,
"grad_norm": 0.7122786881252015,
"learning_rate": 3.749806367916069e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29387813806533813,
"step": 1755,
"valid_targets_mean": 2420.0,
"valid_targets_min": 719
},
{
"epoch": 1.7204301075268817,
"grad_norm": 0.6950186797619158,
"learning_rate": 3.747440112343363e-05,
"loss": 0.272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.284950315952301,
"step": 1760,
"valid_targets_mean": 2666.9,
"valid_targets_min": 694
},
{
"epoch": 1.7253176930596286,
"grad_norm": 0.6540823928470759,
"learning_rate": 3.745063473581254e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26305273175239563,
"step": 1765,
"valid_targets_mean": 2482.1,
"valid_targets_min": 522
},
{
"epoch": 1.7302052785923754,
"grad_norm": 0.6533343607539351,
"learning_rate": 3.7426764657515926e-05,
"loss": 0.288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32014939188957214,
"step": 1770,
"valid_targets_mean": 2911.1,
"valid_targets_min": 1390
},
{
"epoch": 1.7350928641251222,
"grad_norm": 0.681180973864994,
"learning_rate": 3.7402791030378446e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26099470257759094,
"step": 1775,
"valid_targets_mean": 2321.4,
"valid_targets_min": 514
},
{
"epoch": 1.739980449657869,
"grad_norm": 0.8019831916932382,
"learning_rate": 3.737871399685001e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27410048246383667,
"step": 1780,
"valid_targets_mean": 1795.9,
"valid_targets_min": 760
},
{
"epoch": 1.7448680351906158,
"grad_norm": 0.6599982007782187,
"learning_rate": 3.735453369999499e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2654041647911072,
"step": 1785,
"valid_targets_mean": 2488.9,
"valid_targets_min": 780
},
{
"epoch": 1.7497556207233627,
"grad_norm": 0.6985853935310431,
"learning_rate": 3.7330250283491316e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2721864581108093,
"step": 1790,
"valid_targets_mean": 2234.3,
"valid_targets_min": 892
},
{
"epoch": 1.7546432062561095,
"grad_norm": 0.7815807491097794,
"learning_rate": 3.730586389162968e-05,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2551916241645813,
"step": 1795,
"valid_targets_mean": 2119.4,
"valid_targets_min": 741
},
{
"epoch": 1.7595307917888563,
"grad_norm": 0.6983319157355613,
"learning_rate": 3.728137466931262e-05,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26075512170791626,
"step": 1800,
"valid_targets_mean": 1934.5,
"valid_targets_min": 790
},
{
"epoch": 1.7644183773216031,
"grad_norm": 0.6167013764000374,
"learning_rate": 3.72567827620537e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2760656476020813,
"step": 1805,
"valid_targets_mean": 3027.8,
"valid_targets_min": 1151
},
{
"epoch": 1.76930596285435,
"grad_norm": 0.6509730292742568,
"learning_rate": 3.723208831597663e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.275715172290802,
"step": 1810,
"valid_targets_mean": 2570.6,
"valid_targets_min": 881
},
{
"epoch": 1.7741935483870968,
"grad_norm": 0.6845280114796127,
"learning_rate": 3.720729147781438e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28714922070503235,
"step": 1815,
"valid_targets_mean": 2509.2,
"valid_targets_min": 842
},
{
"epoch": 1.7790811339198436,
"grad_norm": 0.692569209787489,
"learning_rate": 3.718239239490838e-05,
"loss": 0.2746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29387450218200684,
"step": 1820,
"valid_targets_mean": 2449.2,
"valid_targets_min": 648
},
{
"epoch": 1.7839687194525904,
"grad_norm": 0.6702820731559377,
"learning_rate": 3.715739121520754e-05,
"loss": 0.2842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28223657608032227,
"step": 1825,
"valid_targets_mean": 2757.1,
"valid_targets_min": 758
},
{
"epoch": 1.7888563049853372,
"grad_norm": 0.7241156064899832,
"learning_rate": 3.7132288087267444e-05,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525007128715515,
"step": 1830,
"valid_targets_mean": 1929.8,
"valid_targets_min": 824
},
{
"epoch": 1.793743890518084,
"grad_norm": 0.6959493990441359,
"learning_rate": 3.710708316024945e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29006555676460266,
"step": 1835,
"valid_targets_mean": 2522.8,
"valid_targets_min": 887
},
{
"epoch": 1.7986314760508308,
"grad_norm": 1.0690505659751939,
"learning_rate": 3.708177658391979e-05,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26409053802490234,
"step": 1840,
"valid_targets_mean": 2085.5,
"valid_targets_min": 898
},
{
"epoch": 1.8035190615835777,
"grad_norm": 0.6416781900383685,
"learning_rate": 3.70563685086487e-05,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2942282557487488,
"step": 1845,
"valid_targets_mean": 2790.2,
"valid_targets_min": 518
},
{
"epoch": 1.8084066471163245,
"grad_norm": 0.6292212211636715,
"learning_rate": 3.70308590854095e-05,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2690730392932892,
"step": 1850,
"valid_targets_mean": 2605.3,
"valid_targets_min": 627
},
{
"epoch": 1.8132942326490715,
"grad_norm": 0.7563881415657474,
"learning_rate": 3.7005248465777753e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26602309942245483,
"step": 1855,
"valid_targets_mean": 1989.0,
"valid_targets_min": 880
},
{
"epoch": 1.8181818181818183,
"grad_norm": 0.6636462614146774,
"learning_rate": 3.697953680193028e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2749035358428955,
"step": 1860,
"valid_targets_mean": 2244.6,
"valid_targets_min": 1017
},
{
"epoch": 1.8230694037145652,
"grad_norm": 1.7607977847503449,
"learning_rate": 3.695372424664433e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29794639348983765,
"step": 1865,
"valid_targets_mean": 2888.2,
"valid_targets_min": 843
},
{
"epoch": 1.827956989247312,
"grad_norm": 0.6664158354412304,
"learning_rate": 3.692781095329662e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31028884649276733,
"step": 1870,
"valid_targets_mean": 2667.8,
"valid_targets_min": 774
},
{
"epoch": 1.8328445747800588,
"grad_norm": 0.6484592517147627,
"learning_rate": 3.690179707586247e-05,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2612004578113556,
"step": 1875,
"valid_targets_mean": 2415.0,
"valid_targets_min": 817
},
{
"epoch": 1.8377321603128056,
"grad_norm": 0.6881093759344453,
"learning_rate": 3.6875682768914847e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2743026912212372,
"step": 1880,
"valid_targets_mean": 3187.6,
"valid_targets_min": 1503
},
{
"epoch": 1.8426197458455524,
"grad_norm": 0.7092531777121036,
"learning_rate": 3.684946818762349e-05,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24219094216823578,
"step": 1885,
"valid_targets_mean": 1849.3,
"valid_targets_min": 538
},
{
"epoch": 1.8475073313782993,
"grad_norm": 0.7102034739129834,
"learning_rate": 3.682315348775392e-05,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2451900839805603,
"step": 1890,
"valid_targets_mean": 2226.6,
"valid_targets_min": 742
},
{
"epoch": 1.852394916911046,
"grad_norm": 0.6976435032370457,
"learning_rate": 3.6796738825666606e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34835338592529297,
"step": 1895,
"valid_targets_mean": 2488.8,
"valid_targets_min": 821
},
{
"epoch": 1.857282502443793,
"grad_norm": 0.8345683696586109,
"learning_rate": 3.6770224358315945e-05,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3025885820388794,
"step": 1900,
"valid_targets_mean": 2416.9,
"valid_targets_min": 544
},
{
"epoch": 1.8621700879765397,
"grad_norm": 0.6734416069076511,
"learning_rate": 3.674361024324939e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2562083601951599,
"step": 1905,
"valid_targets_mean": 2252.0,
"valid_targets_min": 1040
},
{
"epoch": 1.8670576735092865,
"grad_norm": 0.7258976397773823,
"learning_rate": 3.67168966386065e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29352593421936035,
"step": 1910,
"valid_targets_mean": 2220.9,
"valid_targets_min": 770
},
{
"epoch": 1.8719452590420333,
"grad_norm": 0.8267516235866793,
"learning_rate": 3.669008370311798e-05,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26839086413383484,
"step": 1915,
"valid_targets_mean": 2146.9,
"valid_targets_min": 906
},
{
"epoch": 1.8768328445747802,
"grad_norm": 0.9090846152816757,
"learning_rate": 3.666317159610478e-05,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2196088433265686,
"step": 1920,
"valid_targets_mean": 1943.8,
"valid_targets_min": 627
},
{
"epoch": 1.881720430107527,
"grad_norm": 0.6328104571501864,
"learning_rate": 3.6636160477477084e-05,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26850637793540955,
"step": 1925,
"valid_targets_mean": 2655.1,
"valid_targets_min": 1260
},
{
"epoch": 1.8866080156402738,
"grad_norm": 0.734256137030361,
"learning_rate": 3.6609050507733434e-05,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2635309100151062,
"step": 1930,
"valid_targets_mean": 2196.3,
"valid_targets_min": 865
},
{
"epoch": 1.8914956011730206,
"grad_norm": 0.6466263966198653,
"learning_rate": 3.6581841847959704e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23648956418037415,
"step": 1935,
"valid_targets_mean": 2312.8,
"valid_targets_min": 571
},
{
"epoch": 1.8963831867057674,
"grad_norm": 0.6012794126830221,
"learning_rate": 3.6554534659828214e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2779013514518738,
"step": 1940,
"valid_targets_mean": 2929.6,
"valid_targets_min": 682
},
{
"epoch": 1.9012707722385143,
"grad_norm": 0.7694228039973774,
"learning_rate": 3.652712910559671e-05,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2838958203792572,
"step": 1945,
"valid_targets_mean": 2658.0,
"valid_targets_min": 1149
},
{
"epoch": 1.906158357771261,
"grad_norm": 0.6786164917053215,
"learning_rate": 3.649962534810743e-05,
"loss": 0.2663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2658728361129761,
"step": 1950,
"valid_targets_mean": 2249.3,
"valid_targets_min": 714
},
{
"epoch": 1.911045943304008,
"grad_norm": 0.6234672172314177,
"learning_rate": 3.647202355078614e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2740452289581299,
"step": 1955,
"valid_targets_mean": 2578.2,
"valid_targets_min": 720
},
{
"epoch": 1.9159335288367547,
"grad_norm": 0.6515984804744183,
"learning_rate": 3.644432387764113e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28338634967803955,
"step": 1960,
"valid_targets_mean": 2537.2,
"valid_targets_min": 781
},
{
"epoch": 1.9208211143695015,
"grad_norm": 0.6925882408989057,
"learning_rate": 3.641652649326228e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28017061948776245,
"step": 1965,
"valid_targets_mean": 2322.9,
"valid_targets_min": 790
},
{
"epoch": 1.9257086999022484,
"grad_norm": 0.721478062577497,
"learning_rate": 3.638863156282007e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2587317228317261,
"step": 1970,
"valid_targets_mean": 1998.3,
"valid_targets_min": 818
},
{
"epoch": 1.9305962854349952,
"grad_norm": 0.670482355423357,
"learning_rate": 3.6360639252064576e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28506842255592346,
"step": 1975,
"valid_targets_mean": 2706.6,
"valid_targets_min": 804
},
{
"epoch": 1.935483870967742,
"grad_norm": 0.7503529232237587,
"learning_rate": 3.633254972732452e-05,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2652524411678314,
"step": 1980,
"valid_targets_mean": 2164.6,
"valid_targets_min": 1087
},
{
"epoch": 1.9403714565004888,
"grad_norm": 0.6787558928888673,
"learning_rate": 3.630436315550624e-05,
"loss": 0.2794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24034081399440765,
"step": 1985,
"valid_targets_mean": 2107.4,
"valid_targets_min": 771
},
{
"epoch": 1.9452590420332356,
"grad_norm": 0.7914047009085244,
"learning_rate": 3.6276079704092755e-05,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2761124074459076,
"step": 1990,
"valid_targets_mean": 2557.2,
"valid_targets_min": 836
},
{
"epoch": 1.9501466275659824,
"grad_norm": 0.6934610377236305,
"learning_rate": 3.6247699541142705e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2904479503631592,
"step": 1995,
"valid_targets_mean": 2472.5,
"valid_targets_min": 620
},
{
"epoch": 1.9550342130987293,
"grad_norm": 0.7028198944986546,
"learning_rate": 3.62192228352894e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30306535959243774,
"step": 2000,
"valid_targets_mean": 2393.2,
"valid_targets_min": 820
},
{
"epoch": 1.959921798631476,
"grad_norm": 0.6656505685896379,
"learning_rate": 3.6190649755739803e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27111366391181946,
"step": 2005,
"valid_targets_mean": 2641.5,
"valid_targets_min": 655
},
{
"epoch": 1.964809384164223,
"grad_norm": 0.6548401411079302,
"learning_rate": 3.616198047227353e-05,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26000118255615234,
"step": 2010,
"valid_targets_mean": 2489.2,
"valid_targets_min": 1225
},
{
"epoch": 1.9696969696969697,
"grad_norm": 0.7088864087296969,
"learning_rate": 3.613321515524181e-05,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2879897654056549,
"step": 2015,
"valid_targets_mean": 2197.8,
"valid_targets_min": 916
},
{
"epoch": 1.9745845552297165,
"grad_norm": 0.7810945047814258,
"learning_rate": 3.610435397556653e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25487759709358215,
"step": 2020,
"valid_targets_mean": 1809.1,
"valid_targets_min": 1181
},
{
"epoch": 1.9794721407624634,
"grad_norm": 0.6618807198434398,
"learning_rate": 3.607539710473916e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2809375524520874,
"step": 2025,
"valid_targets_mean": 2645.9,
"valid_targets_min": 714
},
{
"epoch": 1.9843597262952102,
"grad_norm": 0.6889464103259075,
"learning_rate": 3.6046344714819786e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27869024872779846,
"step": 2030,
"valid_targets_mean": 2894.4,
"valid_targets_min": 612
},
{
"epoch": 1.989247311827957,
"grad_norm": 0.7597436857623857,
"learning_rate": 3.601719697843604e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24141916632652283,
"step": 2035,
"valid_targets_mean": 1800.8,
"valid_targets_min": 648
},
{
"epoch": 1.9941348973607038,
"grad_norm": 0.6357417452126822,
"learning_rate": 3.5987954068782114e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28626328706741333,
"step": 2040,
"valid_targets_mean": 3067.6,
"valid_targets_min": 824
},
{
"epoch": 1.9990224828934506,
"grad_norm": 0.6268686861206388,
"learning_rate": 3.595861615961771e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25856465101242065,
"step": 2045,
"valid_targets_mean": 2928.6,
"valid_targets_min": 1156
},
{
"epoch": 2.0039100684261975,
"grad_norm": 0.5633104622128313,
"learning_rate": 3.5929183425267e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2239726036787033,
"step": 2050,
"valid_targets_mean": 2999.4,
"valid_targets_min": 631
},
{
"epoch": 2.0087976539589443,
"grad_norm": 0.7030082756993576,
"learning_rate": 3.589965604061762e-05,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26195091009140015,
"step": 2055,
"valid_targets_mean": 2908.1,
"valid_targets_min": 793
},
{
"epoch": 2.013685239491691,
"grad_norm": 0.7032018693280796,
"learning_rate": 3.5870034181119605e-05,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23086042702198029,
"step": 2060,
"valid_targets_mean": 2292.1,
"valid_targets_min": 748
},
{
"epoch": 2.018572825024438,
"grad_norm": 0.8062986669540131,
"learning_rate": 3.5840318022784345e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24330705404281616,
"step": 2065,
"valid_targets_mean": 2035.7,
"valid_targets_min": 804
},
{
"epoch": 2.0234604105571847,
"grad_norm": 0.7456760467454644,
"learning_rate": 3.5810507742183555e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24097514152526855,
"step": 2070,
"valid_targets_mean": 2251.5,
"valid_targets_min": 656
},
{
"epoch": 2.0283479960899315,
"grad_norm": 0.7974068850160627,
"learning_rate": 3.5780603516448235e-05,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25509095191955566,
"step": 2075,
"valid_targets_mean": 2308.2,
"valid_targets_min": 842
},
{
"epoch": 2.0332355816226784,
"grad_norm": 0.7027608391523197,
"learning_rate": 3.575060552326758e-05,
"loss": 0.2605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26107388734817505,
"step": 2080,
"valid_targets_mean": 2641.1,
"valid_targets_min": 702
},
{
"epoch": 2.038123167155425,
"grad_norm": 0.6771926382902913,
"learning_rate": 3.572051394088795e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.254364550113678,
"step": 2085,
"valid_targets_mean": 3093.8,
"valid_targets_min": 1095
},
{
"epoch": 2.043010752688172,
"grad_norm": 0.7920555868975577,
"learning_rate": 3.569032894811182e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25785136222839355,
"step": 2090,
"valid_targets_mean": 2053.3,
"valid_targets_min": 803
},
{
"epoch": 2.047898338220919,
"grad_norm": 0.6836448197530809,
"learning_rate": 3.566005072429668e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21475102007389069,
"step": 2095,
"valid_targets_mean": 2353.8,
"valid_targets_min": 976
},
{
"epoch": 2.0527859237536656,
"grad_norm": 0.712116095288442,
"learning_rate": 3.562967944935402e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23862826824188232,
"step": 2100,
"valid_targets_mean": 2316.5,
"valid_targets_min": 768
},
{
"epoch": 2.0576735092864125,
"grad_norm": 0.7340036820210002,
"learning_rate": 3.559921530374821e-05,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2310110479593277,
"step": 2105,
"valid_targets_mean": 2313.2,
"valid_targets_min": 763
},
{
"epoch": 2.0625610948191593,
"grad_norm": 0.7950851146965314,
"learning_rate": 3.556865846849547e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24690885841846466,
"step": 2110,
"valid_targets_mean": 1923.8,
"valid_targets_min": 684
},
{
"epoch": 2.067448680351906,
"grad_norm": 0.9485462964048043,
"learning_rate": 3.5538009125162774e-05,
"loss": 0.2383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2360670119524002,
"step": 2115,
"valid_targets_mean": 2597.2,
"valid_targets_min": 1328
},
{
"epoch": 2.072336265884653,
"grad_norm": 0.6042905131795798,
"learning_rate": 3.550726745586677e-05,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24113643169403076,
"step": 2120,
"valid_targets_mean": 3059.4,
"valid_targets_min": 884
},
{
"epoch": 2.0772238514173997,
"grad_norm": 0.6939861915048151,
"learning_rate": 3.5476433643272695e-05,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23294597864151,
"step": 2125,
"valid_targets_mean": 2400.4,
"valid_targets_min": 863
},
{
"epoch": 2.0821114369501466,
"grad_norm": 0.7426227574519302,
"learning_rate": 3.5445507870593315e-05,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2383473813533783,
"step": 2130,
"valid_targets_mean": 2200.8,
"valid_targets_min": 670
},
{
"epoch": 2.0869990224828934,
"grad_norm": 0.6868218935296267,
"learning_rate": 3.54144903215878e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2236156016588211,
"step": 2135,
"valid_targets_mean": 2512.4,
"valid_targets_min": 522
},
{
"epoch": 2.09188660801564,
"grad_norm": 0.734071113886848,
"learning_rate": 3.538338118056065e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26370787620544434,
"step": 2140,
"valid_targets_mean": 2402.6,
"valid_targets_min": 731
},
{
"epoch": 2.096774193548387,
"grad_norm": 0.7089461463159339,
"learning_rate": 3.5352180632360614e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.212519571185112,
"step": 2145,
"valid_targets_mean": 2266.1,
"valid_targets_min": 504
},
{
"epoch": 2.101661779081134,
"grad_norm": 0.791032807011372,
"learning_rate": 3.532088886237956e-05,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2348712533712387,
"step": 2150,
"valid_targets_mean": 2305.6,
"valid_targets_min": 746
},
{
"epoch": 2.1065493646138806,
"grad_norm": 0.6579340652769179,
"learning_rate": 3.5289506056551414e-05,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27510562539100647,
"step": 2155,
"valid_targets_mean": 2961.9,
"valid_targets_min": 680
},
{
"epoch": 2.1114369501466275,
"grad_norm": 0.7467367590945104,
"learning_rate": 3.5258032401351005e-05,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22451433539390564,
"step": 2160,
"valid_targets_mean": 2105.4,
"valid_targets_min": 765
},
{
"epoch": 2.1163245356793743,
"grad_norm": 0.9754841406665122,
"learning_rate": 3.522646808379299e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2368217408657074,
"step": 2165,
"valid_targets_mean": 2108.7,
"valid_targets_min": 618
},
{
"epoch": 2.121212121212121,
"grad_norm": 0.679630597898811,
"learning_rate": 3.519481329143076e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23734697699546814,
"step": 2170,
"valid_targets_mean": 2571.5,
"valid_targets_min": 1089
},
{
"epoch": 2.126099706744868,
"grad_norm": 0.658153760353656,
"learning_rate": 3.5163068212355274e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.256761372089386,
"step": 2175,
"valid_targets_mean": 2925.9,
"valid_targets_min": 803
},
{
"epoch": 2.1309872922776147,
"grad_norm": 0.7475086838003469,
"learning_rate": 3.513123303519397e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22203174233436584,
"step": 2180,
"valid_targets_mean": 1844.1,
"valid_targets_min": 692
},
{
"epoch": 2.1358748778103616,
"grad_norm": 0.6041239999536051,
"learning_rate": 3.509930794910967e-05,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22519180178642273,
"step": 2185,
"valid_targets_mean": 3204.3,
"valid_targets_min": 946
},
{
"epoch": 2.1407624633431084,
"grad_norm": 0.7509582157797575,
"learning_rate": 3.506729314379941e-05,
"loss": 0.2274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25604188442230225,
"step": 2190,
"valid_targets_mean": 2394.9,
"valid_targets_min": 677
},
{
"epoch": 2.145650048875855,
"grad_norm": 0.6750872876590103,
"learning_rate": 3.5035188809493335e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22361913323402405,
"step": 2195,
"valid_targets_mean": 2691.1,
"valid_targets_min": 791
},
{
"epoch": 2.150537634408602,
"grad_norm": 0.6447663759799113,
"learning_rate": 3.500299513695356e-05,
"loss": 0.2355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22863362729549408,
"step": 2200,
"valid_targets_mean": 2783.2,
"valid_targets_min": 853
},
{
"epoch": 2.155425219941349,
"grad_norm": 0.7166550535292393,
"learning_rate": 3.497071231747306e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25535690784454346,
"step": 2205,
"valid_targets_mean": 2722.8,
"valid_targets_min": 989
},
{
"epoch": 2.1603128054740957,
"grad_norm": 0.8862852553501419,
"learning_rate": 3.493834054287449e-05,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24125589430332184,
"step": 2210,
"valid_targets_mean": 2089.8,
"valid_targets_min": 787
},
{
"epoch": 2.1652003910068425,
"grad_norm": 0.7210539973246137,
"learning_rate": 3.490588000550911e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26080626249313354,
"step": 2215,
"valid_targets_mean": 2307.4,
"valid_targets_min": 995
},
{
"epoch": 2.1700879765395893,
"grad_norm": 0.6876101039598905,
"learning_rate": 3.4873330898255556e-05,
"loss": 0.2342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22508588433265686,
"step": 2220,
"valid_targets_mean": 2578.5,
"valid_targets_min": 551
},
{
"epoch": 2.174975562072336,
"grad_norm": 0.679616490089902,
"learning_rate": 3.4840693414518776e-05,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22549769282341003,
"step": 2225,
"valid_targets_mean": 2478.4,
"valid_targets_min": 1293
},
{
"epoch": 2.179863147605083,
"grad_norm": 0.6885669807827226,
"learning_rate": 3.4807967748228844e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21673941612243652,
"step": 2230,
"valid_targets_mean": 2484.1,
"valid_targets_min": 1140
},
{
"epoch": 2.1847507331378297,
"grad_norm": 0.6971954496384682,
"learning_rate": 3.477515409383979e-05,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22069767117500305,
"step": 2235,
"valid_targets_mean": 2294.4,
"valid_targets_min": 914
},
{
"epoch": 2.1896383186705766,
"grad_norm": 0.7601614406567037,
"learning_rate": 3.474225264632847e-05,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20157967507839203,
"step": 2240,
"valid_targets_mean": 1873.1,
"valid_targets_min": 615
},
{
"epoch": 2.1945259042033234,
"grad_norm": 0.6527427792093988,
"learning_rate": 3.470926360119343e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22357343137264252,
"step": 2245,
"valid_targets_mean": 2597.2,
"valid_targets_min": 720
},
{
"epoch": 2.19941348973607,
"grad_norm": 1.2913533556146168,
"learning_rate": 3.467618715445367e-05,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2719864845275879,
"step": 2250,
"valid_targets_mean": 2356.8,
"valid_targets_min": 1038
},
{
"epoch": 2.204301075268817,
"grad_norm": 0.6982533310800236,
"learning_rate": 3.464302350264756e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23422983288764954,
"step": 2255,
"valid_targets_mean": 2767.9,
"valid_targets_min": 753
},
{
"epoch": 2.209188660801564,
"grad_norm": 0.7221984393019797,
"learning_rate": 3.460977284283162e-05,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.266290545463562,
"step": 2260,
"valid_targets_mean": 2269.7,
"valid_targets_min": 822
},
{
"epoch": 2.2140762463343107,
"grad_norm": 0.7114567359248741,
"learning_rate": 3.457643537257938e-05,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19123372435569763,
"step": 2265,
"valid_targets_mean": 1872.2,
"valid_targets_min": 570
},
{
"epoch": 2.2189638318670575,
"grad_norm": 0.6540588887195975,
"learning_rate": 3.454301128998018e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2638104259967804,
"step": 2270,
"valid_targets_mean": 3022.8,
"valid_targets_min": 987
},
{
"epoch": 2.2238514173998043,
"grad_norm": 0.6898490839976488,
"learning_rate": 3.4509500793638015e-05,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2437189519405365,
"step": 2275,
"valid_targets_mean": 2453.7,
"valid_targets_min": 656
},
{
"epoch": 2.228739002932551,
"grad_norm": 0.7463219837340317,
"learning_rate": 3.447590408267034e-05,
"loss": 0.2394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21820449829101562,
"step": 2280,
"valid_targets_mean": 2064.9,
"valid_targets_min": 748
},
{
"epoch": 2.233626588465298,
"grad_norm": 0.7810585743007555,
"learning_rate": 3.444222135670688e-05,
"loss": 0.2394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2506566643714905,
"step": 2285,
"valid_targets_mean": 2264.9,
"valid_targets_min": 820
},
{
"epoch": 2.2385141739980448,
"grad_norm": 0.7468906966516604,
"learning_rate": 3.44084528158885e-05,
"loss": 0.2261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22076962888240814,
"step": 2290,
"valid_targets_mean": 2084.4,
"valid_targets_min": 721
},
{
"epoch": 2.2434017595307916,
"grad_norm": 0.7194591472281033,
"learning_rate": 3.437459866086591e-05,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23915450274944305,
"step": 2295,
"valid_targets_mean": 2377.3,
"valid_targets_min": 650
},
{
"epoch": 2.2482893450635384,
"grad_norm": 0.7180690575974027,
"learning_rate": 3.4340659092798594e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2506748139858246,
"step": 2300,
"valid_targets_mean": 2737.3,
"valid_targets_min": 567
},
{
"epoch": 2.253176930596285,
"grad_norm": 0.6309852432550281,
"learning_rate": 3.4306634313353504e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2439078688621521,
"step": 2305,
"valid_targets_mean": 3100.8,
"valid_targets_min": 914
},
{
"epoch": 2.258064516129032,
"grad_norm": 0.7572600999737557,
"learning_rate": 3.427252452470395e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2431081384420395,
"step": 2310,
"valid_targets_mean": 1790.9,
"valid_targets_min": 640
},
{
"epoch": 2.262952101661779,
"grad_norm": 0.683772308399432,
"learning_rate": 3.423832992952836e-05,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24556618928909302,
"step": 2315,
"valid_targets_mean": 2683.7,
"valid_targets_min": 801
},
{
"epoch": 2.2678396871945257,
"grad_norm": 0.8397527577042548,
"learning_rate": 3.420405073100905e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.254273384809494,
"step": 2320,
"valid_targets_mean": 2155.0,
"valid_targets_min": 867
},
{
"epoch": 2.2727272727272725,
"grad_norm": 0.851065317435724,
"learning_rate": 3.416968713283105e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2502952814102173,
"step": 2325,
"valid_targets_mean": 2122.0,
"valid_targets_min": 684
},
{
"epoch": 2.2776148582600193,
"grad_norm": 0.6985298739440852,
"learning_rate": 3.413523933918093e-05,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22682811319828033,
"step": 2330,
"valid_targets_mean": 2159.1,
"valid_targets_min": 795
},
{
"epoch": 2.2825024437927666,
"grad_norm": 0.8111962594657017,
"learning_rate": 3.4100707554745495e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24102097749710083,
"step": 2335,
"valid_targets_mean": 2234.1,
"valid_targets_min": 705
},
{
"epoch": 2.2873900293255134,
"grad_norm": 0.5993930502127762,
"learning_rate": 3.406609198471064e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18438704311847687,
"step": 2340,
"valid_targets_mean": 2438.3,
"valid_targets_min": 1216
},
{
"epoch": 2.29227761485826,
"grad_norm": 0.7265646225215977,
"learning_rate": 3.403139283476011e-05,
"loss": 0.2342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2278384566307068,
"step": 2345,
"valid_targets_mean": 2198.9,
"valid_targets_min": 1056
},
{
"epoch": 2.297165200391007,
"grad_norm": 0.6075073209468058,
"learning_rate": 3.3996610311074266e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2122841477394104,
"step": 2350,
"valid_targets_mean": 2752.8,
"valid_targets_min": 762
},
{
"epoch": 2.302052785923754,
"grad_norm": 0.6706963737298545,
"learning_rate": 3.396174462032888e-05,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.241616889834404,
"step": 2355,
"valid_targets_mean": 2314.3,
"valid_targets_min": 637
},
{
"epoch": 2.3069403714565007,
"grad_norm": 1.1053006675938248,
"learning_rate": 3.392679596969391e-05,
"loss": 0.2285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.232365682721138,
"step": 2360,
"valid_targets_mean": 2931.2,
"valid_targets_min": 1234
},
{
"epoch": 2.3118279569892475,
"grad_norm": 0.68661451987901,
"learning_rate": 3.389176456683222e-05,
"loss": 0.2406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2415533810853958,
"step": 2365,
"valid_targets_mean": 2462.8,
"valid_targets_min": 748
},
{
"epoch": 2.3167155425219943,
"grad_norm": 0.7999782604502889,
"learning_rate": 3.385665061989842e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21598216891288757,
"step": 2370,
"valid_targets_mean": 1724.7,
"valid_targets_min": 662
},
{
"epoch": 2.321603128054741,
"grad_norm": 0.7182473780722957,
"learning_rate": 3.382145433753758e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27340924739837646,
"step": 2375,
"valid_targets_mean": 2582.8,
"valid_targets_min": 774
},
{
"epoch": 2.326490713587488,
"grad_norm": 0.7676223492166587,
"learning_rate": 3.3786175928883994e-05,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21359305083751678,
"step": 2380,
"valid_targets_mean": 1934.9,
"valid_targets_min": 646
},
{
"epoch": 2.3313782991202348,
"grad_norm": 0.701569446945032,
"learning_rate": 3.375081560355996e-05,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24448227882385254,
"step": 2385,
"valid_targets_mean": 2355.2,
"valid_targets_min": 700
},
{
"epoch": 2.3362658846529816,
"grad_norm": 0.668238001789143,
"learning_rate": 3.3715373571674495e-05,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24243560433387756,
"step": 2390,
"valid_targets_mean": 2480.6,
"valid_targets_min": 1062
},
{
"epoch": 2.3411534701857284,
"grad_norm": 0.7311150815773109,
"learning_rate": 3.367985004382216e-05,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22406163811683655,
"step": 2395,
"valid_targets_mean": 1759.3,
"valid_targets_min": 1058
},
{
"epoch": 2.346041055718475,
"grad_norm": 0.6489801175202864,
"learning_rate": 3.36442452310817e-05,
"loss": 0.2393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2665456533432007,
"step": 2400,
"valid_targets_mean": 2741.1,
"valid_targets_min": 772
},
{
"epoch": 2.350928641251222,
"grad_norm": 0.6383014149144618,
"learning_rate": 3.36085593450149e-05,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23392713069915771,
"step": 2405,
"valid_targets_mean": 2465.8,
"valid_targets_min": 697
},
{
"epoch": 2.355816226783969,
"grad_norm": 0.6749587378319567,
"learning_rate": 3.3572792597665244e-05,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2573961019515991,
"step": 2410,
"valid_targets_mean": 2782.9,
"valid_targets_min": 888
},
{
"epoch": 2.3607038123167157,
"grad_norm": 0.9440638611034704,
"learning_rate": 3.353694520155672e-05,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24345912039279938,
"step": 2415,
"valid_targets_mean": 2128.4,
"valid_targets_min": 1012
},
{
"epoch": 2.3655913978494625,
"grad_norm": 0.7148978990158092,
"learning_rate": 3.350101736969249e-05,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2735242247581482,
"step": 2420,
"valid_targets_mean": 2309.9,
"valid_targets_min": 771
},
{
"epoch": 2.3704789833822093,
"grad_norm": 0.8017459949388398,
"learning_rate": 3.346500931555369e-05,
"loss": 0.23,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2165670096874237,
"step": 2425,
"valid_targets_mean": 2131.1,
"valid_targets_min": 708
},
{
"epoch": 2.375366568914956,
"grad_norm": 0.6221765808255351,
"learning_rate": 3.3428921253098126e-05,
"loss": 0.2281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26252031326293945,
"step": 2430,
"valid_targets_mean": 3323.1,
"valid_targets_min": 1030
},
{
"epoch": 2.380254154447703,
"grad_norm": 0.6740618705615318,
"learning_rate": 3.3392753396759e-05,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23797520995140076,
"step": 2435,
"valid_targets_mean": 2207.9,
"valid_targets_min": 734
},
{
"epoch": 2.3851417399804498,
"grad_norm": 0.7273981487589926,
"learning_rate": 3.3356505961443644e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23226913809776306,
"step": 2440,
"valid_targets_mean": 2119.9,
"valid_targets_min": 685
},
{
"epoch": 2.3900293255131966,
"grad_norm": 0.7495183220790104,
"learning_rate": 3.332017916253227e-05,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2352924793958664,
"step": 2445,
"valid_targets_mean": 2707.6,
"valid_targets_min": 714
},
{
"epoch": 2.3949169110459434,
"grad_norm": 0.7842291061024107,
"learning_rate": 3.328377321587662e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22039464116096497,
"step": 2450,
"valid_targets_mean": 1844.9,
"valid_targets_min": 544
},
{
"epoch": 2.39980449657869,
"grad_norm": 0.6173507633048779,
"learning_rate": 3.324728833779876e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23128989338874817,
"step": 2455,
"valid_targets_mean": 2820.6,
"valid_targets_min": 1219
},
{
"epoch": 2.404692082111437,
"grad_norm": 0.7009098945991525,
"learning_rate": 3.3210724745089757e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20386609435081482,
"step": 2460,
"valid_targets_mean": 2477.1,
"valid_targets_min": 622
},
{
"epoch": 2.409579667644184,
"grad_norm": 0.7651345366780957,
"learning_rate": 3.31740826550084e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2441290318965912,
"step": 2465,
"valid_targets_mean": 2235.6,
"valid_targets_min": 783
},
{
"epoch": 2.4144672531769307,
"grad_norm": 0.7279723174495759,
"learning_rate": 3.313736228527987e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2114153504371643,
"step": 2470,
"valid_targets_mean": 2223.0,
"valid_targets_min": 761
},
{
"epoch": 2.4193548387096775,
"grad_norm": 0.7868641978840135,
"learning_rate": 3.310056385409453e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26033109426498413,
"step": 2475,
"valid_targets_mean": 2057.3,
"valid_targets_min": 770
},
{
"epoch": 2.4242424242424243,
"grad_norm": 0.6636689132066698,
"learning_rate": 3.3063687580106544e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2515316903591156,
"step": 2480,
"valid_targets_mean": 2834.2,
"valid_targets_min": 750
},
{
"epoch": 2.429130009775171,
"grad_norm": 0.7145023267491682,
"learning_rate": 3.302673368243264e-05,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2276870310306549,
"step": 2485,
"valid_targets_mean": 2252.9,
"valid_targets_min": 668
},
{
"epoch": 2.434017595307918,
"grad_norm": 0.6488982935705684,
"learning_rate": 3.298970238065077e-05,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.250893771648407,
"step": 2490,
"valid_targets_mean": 2848.4,
"valid_targets_min": 1069
},
{
"epoch": 2.4389051808406648,
"grad_norm": 0.6730474280370319,
"learning_rate": 3.2952593894798796e-05,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22307783365249634,
"step": 2495,
"valid_targets_mean": 2428.5,
"valid_targets_min": 934
},
{
"epoch": 2.4437927663734116,
"grad_norm": 0.7947851421243562,
"learning_rate": 3.291540844537324e-05,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2531839907169342,
"step": 2500,
"valid_targets_mean": 1988.7,
"valid_targets_min": 690
},
{
"epoch": 2.4486803519061584,
"grad_norm": 0.6648566470243608,
"learning_rate": 3.287814625332792e-05,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2527335286140442,
"step": 2505,
"valid_targets_mean": 2601.8,
"valid_targets_min": 1007
},
{
"epoch": 2.4535679374389052,
"grad_norm": 0.7237098939276865,
"learning_rate": 3.2840807540072644e-05,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24128659069538116,
"step": 2510,
"valid_targets_mean": 2112.2,
"valid_targets_min": 1071
},
{
"epoch": 2.458455522971652,
"grad_norm": 0.671690132960215,
"learning_rate": 3.280339252747192e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24696272611618042,
"step": 2515,
"valid_targets_mean": 2795.6,
"valid_targets_min": 610
},
{
"epoch": 2.463343108504399,
"grad_norm": 0.6700935950794794,
"learning_rate": 3.276590143784362e-05,
"loss": 0.2486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21841683983802795,
"step": 2520,
"valid_targets_mean": 2417.8,
"valid_targets_min": 676
},
{
"epoch": 2.4682306940371457,
"grad_norm": 0.6719669379309949,
"learning_rate": 3.2728334493957654e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22499142587184906,
"step": 2525,
"valid_targets_mean": 2297.1,
"valid_targets_min": 699
},
{
"epoch": 2.4731182795698925,
"grad_norm": 0.6892705433904501,
"learning_rate": 3.269069191903466e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22186297178268433,
"step": 2530,
"valid_targets_mean": 2068.8,
"valid_targets_min": 740
},
{
"epoch": 2.4780058651026393,
"grad_norm": 0.7393767252579292,
"learning_rate": 3.2652973936744667e-05,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2544059157371521,
"step": 2535,
"valid_targets_mean": 2338.4,
"valid_targets_min": 722
},
{
"epoch": 2.482893450635386,
"grad_norm": 0.7561597467756237,
"learning_rate": 3.261518077120578e-05,
"loss": 0.2435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21395118534564972,
"step": 2540,
"valid_targets_mean": 1770.1,
"valid_targets_min": 589
},
{
"epoch": 2.487781036168133,
"grad_norm": 0.753579094986984,
"learning_rate": 3.257731264698283e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21489103138446808,
"step": 2545,
"valid_targets_mean": 1672.8,
"valid_targets_min": 755
},
{
"epoch": 2.4926686217008798,
"grad_norm": 0.6589858003710982,
"learning_rate": 3.253936978908604e-05,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24498148262500763,
"step": 2550,
"valid_targets_mean": 3218.2,
"valid_targets_min": 1118
},
{
"epoch": 2.4975562072336266,
"grad_norm": 0.7002768152776646,
"learning_rate": 3.250135242296971e-05,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2629767060279846,
"step": 2555,
"valid_targets_mean": 2427.2,
"valid_targets_min": 796
},
{
"epoch": 2.5024437927663734,
"grad_norm": 0.786673139351379,
"learning_rate": 3.246326077453087e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22290992736816406,
"step": 2560,
"valid_targets_mean": 1889.1,
"valid_targets_min": 717
},
{
"epoch": 2.5073313782991202,
"grad_norm": 0.6164870341662336,
"learning_rate": 3.242509507010791e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23814159631729126,
"step": 2565,
"valid_targets_mean": 3004.0,
"valid_targets_min": 792
},
{
"epoch": 2.512218963831867,
"grad_norm": 0.7245474670367238,
"learning_rate": 3.238685553647927e-05,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21552202105522156,
"step": 2570,
"valid_targets_mean": 1887.2,
"valid_targets_min": 753
},
{
"epoch": 2.517106549364614,
"grad_norm": 0.7481756056168739,
"learning_rate": 3.2348542400862075e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2534748911857605,
"step": 2575,
"valid_targets_mean": 2268.9,
"valid_targets_min": 632
},
{
"epoch": 2.5219941348973607,
"grad_norm": 0.7224008501321807,
"learning_rate": 3.231015589091079e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2531392574310303,
"step": 2580,
"valid_targets_mean": 2338.6,
"valid_targets_min": 882
},
{
"epoch": 2.5268817204301075,
"grad_norm": 0.7291916308037362,
"learning_rate": 3.2271696234715866e-05,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2746545374393463,
"step": 2585,
"valid_targets_mean": 2363.4,
"valid_targets_min": 843
},
{
"epoch": 2.5317693059628543,
"grad_norm": 1.0380167495946064,
"learning_rate": 3.2233163660802387e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21444106101989746,
"step": 2590,
"valid_targets_mean": 1598.9,
"valid_targets_min": 732
},
{
"epoch": 2.536656891495601,
"grad_norm": 0.6544024445784333,
"learning_rate": 3.219455839812871e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21233348548412323,
"step": 2595,
"valid_targets_mean": 2456.2,
"valid_targets_min": 1190
},
{
"epoch": 2.541544477028348,
"grad_norm": 0.628273229393255,
"learning_rate": 3.21558806760851e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2087693214416504,
"step": 2600,
"valid_targets_mean": 2745.5,
"valid_targets_min": 700
},
{
"epoch": 2.5464320625610948,
"grad_norm": 0.6030343066322286,
"learning_rate": 3.211713072449236e-05,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22888022661209106,
"step": 2605,
"valid_targets_mean": 2916.0,
"valid_targets_min": 884
},
{
"epoch": 2.5513196480938416,
"grad_norm": 0.7152526807779622,
"learning_rate": 3.207830877360051e-05,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22312462329864502,
"step": 2610,
"valid_targets_mean": 2152.1,
"valid_targets_min": 924
},
{
"epoch": 2.5562072336265884,
"grad_norm": 0.6731642169381366,
"learning_rate": 3.203941505408736e-05,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21658943593502045,
"step": 2615,
"valid_targets_mean": 2331.7,
"valid_targets_min": 911
},
{
"epoch": 2.5610948191593352,
"grad_norm": 0.6639073922224608,
"learning_rate": 3.200044979705717e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22162654995918274,
"step": 2620,
"valid_targets_mean": 2536.9,
"valid_targets_min": 765
},
{
"epoch": 2.565982404692082,
"grad_norm": 0.7471285143763177,
"learning_rate": 3.1961413234039267e-05,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24290457367897034,
"step": 2625,
"valid_targets_mean": 2320.9,
"valid_targets_min": 970
},
{
"epoch": 2.570869990224829,
"grad_norm": 0.7014404171599978,
"learning_rate": 3.192230559698669e-05,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2300807237625122,
"step": 2630,
"valid_targets_mean": 2163.2,
"valid_targets_min": 1099
},
{
"epoch": 2.5757575757575757,
"grad_norm": 0.7689908471529473,
"learning_rate": 3.1883127118274795e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22766678035259247,
"step": 2635,
"valid_targets_mean": 2223.1,
"valid_targets_min": 758
},
{
"epoch": 2.5806451612903225,
"grad_norm": 0.7524156572486015,
"learning_rate": 3.1843878030699843e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22420425713062286,
"step": 2640,
"valid_targets_mean": 2231.3,
"valid_targets_min": 900
},
{
"epoch": 2.5855327468230693,
"grad_norm": 0.6206868507870091,
"learning_rate": 3.180455856747768e-05,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23075121641159058,
"step": 2645,
"valid_targets_mean": 2600.9,
"valid_targets_min": 1010
},
{
"epoch": 2.590420332355816,
"grad_norm": 0.90695340921089,
"learning_rate": 3.1765168962242314e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2378099113702774,
"step": 2650,
"valid_targets_mean": 3146.6,
"valid_targets_min": 656
},
{
"epoch": 2.595307917888563,
"grad_norm": 0.7522437194650009,
"learning_rate": 3.172570944904454e-05,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24361330270767212,
"step": 2655,
"valid_targets_mean": 1933.7,
"valid_targets_min": 607
},
{
"epoch": 2.60019550342131,
"grad_norm": 0.7385794100286881,
"learning_rate": 3.168618026235052e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2449553906917572,
"step": 2660,
"valid_targets_mean": 2196.0,
"valid_targets_min": 734
},
{
"epoch": 2.6050830889540566,
"grad_norm": 0.6811321355025456,
"learning_rate": 3.164658163704044e-05,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2384980171918869,
"step": 2665,
"valid_targets_mean": 2501.2,
"valid_targets_min": 826
},
{
"epoch": 2.6099706744868034,
"grad_norm": 0.7081141329414362,
"learning_rate": 3.160691380840705e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22777023911476135,
"step": 2670,
"valid_targets_mean": 2467.4,
"valid_targets_min": 747
},
{
"epoch": 2.6148582600195502,
"grad_norm": 0.6830393989705583,
"learning_rate": 3.156717701215433e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21992099285125732,
"step": 2675,
"valid_targets_mean": 2317.6,
"valid_targets_min": 950
},
{
"epoch": 2.619745845552297,
"grad_norm": 0.8012433854096802,
"learning_rate": 3.152737148439608e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27927660942077637,
"step": 2680,
"valid_targets_mean": 2117.2,
"valid_targets_min": 789
},
{
"epoch": 2.624633431085044,
"grad_norm": 0.6934903380108935,
"learning_rate": 3.1487497461654435e-05,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25259506702423096,
"step": 2685,
"valid_targets_mean": 2417.8,
"valid_targets_min": 791
},
{
"epoch": 2.6295210166177907,
"grad_norm": 0.7359216165404469,
"learning_rate": 3.144755518085859e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24347510933876038,
"step": 2690,
"valid_targets_mean": 2227.3,
"valid_targets_min": 1027
},
{
"epoch": 2.6344086021505375,
"grad_norm": 0.7767880726332548,
"learning_rate": 3.1407544879343284e-05,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24625647068023682,
"step": 2695,
"valid_targets_mean": 1754.9,
"valid_targets_min": 689
},
{
"epoch": 2.6392961876832843,
"grad_norm": 0.696674510993026,
"learning_rate": 3.136746679484746e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2380523532629013,
"step": 2700,
"valid_targets_mean": 2332.2,
"valid_targets_min": 790
},
{
"epoch": 2.644183773216031,
"grad_norm": 0.6694545044109874,
"learning_rate": 3.1327321165512784e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2502917945384979,
"step": 2705,
"valid_targets_mean": 2535.8,
"valid_targets_min": 1282
},
{
"epoch": 2.649071358748778,
"grad_norm": 0.6987439481563695,
"learning_rate": 3.128710822988231e-05,
"loss": 0.2343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21862663328647614,
"step": 2710,
"valid_targets_mean": 1921.0,
"valid_targets_min": 823
},
{
"epoch": 2.653958944281525,
"grad_norm": 0.6914300177187406,
"learning_rate": 3.1246828226899e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22969259321689606,
"step": 2715,
"valid_targets_mean": 2253.5,
"valid_targets_min": 824
},
{
"epoch": 2.6588465298142716,
"grad_norm": 0.602200287873372,
"learning_rate": 3.120648139590435e-05,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24584728479385376,
"step": 2720,
"valid_targets_mean": 3155.4,
"valid_targets_min": 1278
},
{
"epoch": 2.6637341153470184,
"grad_norm": 0.7075447193702563,
"learning_rate": 3.1166067976636906e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2338378131389618,
"step": 2725,
"valid_targets_mean": 2341.6,
"valid_targets_min": 533
},
{
"epoch": 2.6686217008797652,
"grad_norm": 0.6716820653818237,
"learning_rate": 3.1125588209230914e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.234563410282135,
"step": 2730,
"valid_targets_mean": 2494.7,
"valid_targets_min": 756
},
{
"epoch": 2.673509286412512,
"grad_norm": 0.6350189009309046,
"learning_rate": 3.108504233421482e-05,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2456614375114441,
"step": 2735,
"valid_targets_mean": 2821.6,
"valid_targets_min": 761
},
{
"epoch": 2.678396871945259,
"grad_norm": 0.6980749472004388,
"learning_rate": 3.104443059250992e-05,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24124208092689514,
"step": 2740,
"valid_targets_mean": 2521.0,
"valid_targets_min": 992
},
{
"epoch": 2.6832844574780057,
"grad_norm": 0.67259645483737,
"learning_rate": 3.1003753225428855e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22315667569637299,
"step": 2745,
"valid_targets_mean": 2475.1,
"valid_targets_min": 859
},
{
"epoch": 2.688172043010753,
"grad_norm": 0.6681313606790765,
"learning_rate": 3.0963010474674217e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.247651606798172,
"step": 2750,
"valid_targets_mean": 2558.2,
"valid_targets_min": 634
},
{
"epoch": 2.6930596285435,
"grad_norm": 0.6859361683493692,
"learning_rate": 3.0922202582337115e-05,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19534924626350403,
"step": 2755,
"valid_targets_mean": 2257.4,
"valid_targets_min": 876
},
{
"epoch": 2.6979472140762466,
"grad_norm": 0.6985818000049671,
"learning_rate": 3.08813297908957e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25439029932022095,
"step": 2760,
"valid_targets_mean": 2687.1,
"valid_targets_min": 958
},
{
"epoch": 2.7028347996089934,
"grad_norm": 0.6566705673923328,
"learning_rate": 3.084039234321379e-05,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2557886242866516,
"step": 2765,
"valid_targets_mean": 2698.4,
"valid_targets_min": 549
},
{
"epoch": 2.7077223851417402,
"grad_norm": 0.6165188909289334,
"learning_rate": 3.079939048253934e-05,
"loss": 0.2493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24600160121917725,
"step": 2770,
"valid_targets_mean": 2858.0,
"valid_targets_min": 978
},
{
"epoch": 2.712609970674487,
"grad_norm": 0.6790410549127608,
"learning_rate": 3.0758324452503065e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2445409744977951,
"step": 2775,
"valid_targets_mean": 2667.5,
"valid_targets_min": 740
},
{
"epoch": 2.717497556207234,
"grad_norm": 0.6974981732520593,
"learning_rate": 3.071719449711699e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23706629872322083,
"step": 2780,
"valid_targets_mean": 2513.4,
"valid_targets_min": 1093
},
{
"epoch": 2.7223851417399807,
"grad_norm": 0.6737555976917173,
"learning_rate": 3.0676000860772956e-05,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2328021228313446,
"step": 2785,
"valid_targets_mean": 2313.6,
"valid_targets_min": 684
},
{
"epoch": 2.7272727272727275,
"grad_norm": 1.2575294841809628,
"learning_rate": 3.063474378824119e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23096132278442383,
"step": 2790,
"valid_targets_mean": 1920.2,
"valid_targets_min": 891
},
{
"epoch": 2.7321603128054743,
"grad_norm": 0.6273895966528873,
"learning_rate": 3.0593423524668864e-05,
"loss": 0.2443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23225541412830353,
"step": 2795,
"valid_targets_mean": 2795.9,
"valid_targets_min": 815
},
{
"epoch": 2.737047898338221,
"grad_norm": 0.750013291851974,
"learning_rate": 3.055204031557863e-05,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19314704835414886,
"step": 2800,
"valid_targets_mean": 1944.0,
"valid_targets_min": 839
},
{
"epoch": 2.741935483870968,
"grad_norm": 0.665083340706297,
"learning_rate": 3.0510594406867153e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23232056200504303,
"step": 2805,
"valid_targets_mean": 2747.2,
"valid_targets_min": 893
},
{
"epoch": 2.746823069403715,
"grad_norm": 0.6430016293534321,
"learning_rate": 3.0469086044803663e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22754496335983276,
"step": 2810,
"valid_targets_mean": 2441.9,
"valid_targets_min": 697
},
{
"epoch": 2.7517106549364616,
"grad_norm": 0.6672184525189786,
"learning_rate": 3.0427515476028468e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2377731204032898,
"step": 2815,
"valid_targets_mean": 2553.1,
"valid_targets_min": 1144
},
{
"epoch": 2.7565982404692084,
"grad_norm": 0.6337998207855043,
"learning_rate": 3.038588294755151e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2279859483242035,
"step": 2820,
"valid_targets_mean": 2683.7,
"valid_targets_min": 597
},
{
"epoch": 2.7614858260019552,
"grad_norm": 0.6415879365422061,
"learning_rate": 3.034418870675092e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25901520252227783,
"step": 2825,
"valid_targets_mean": 3471.3,
"valid_targets_min": 771
},
{
"epoch": 2.766373411534702,
"grad_norm": 0.6903646046533939,
"learning_rate": 3.0302433001371475e-05,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2619539499282837,
"step": 2830,
"valid_targets_mean": 2333.2,
"valid_targets_min": 890
},
{
"epoch": 2.771260997067449,
"grad_norm": 0.6243991438233805,
"learning_rate": 3.02606160795232e-05,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2319139838218689,
"step": 2835,
"valid_targets_mean": 2468.5,
"valid_targets_min": 646
},
{
"epoch": 2.7761485826001957,
"grad_norm": 0.640200588738358,
"learning_rate": 3.021873818967986e-05,
"loss": 0.2408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20535393059253693,
"step": 2840,
"valid_targets_mean": 3473.6,
"valid_targets_min": 978
},
{
"epoch": 2.7810361681329425,
"grad_norm": 0.6766646508609335,
"learning_rate": 3.0176799580677477e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23535458743572235,
"step": 2845,
"valid_targets_mean": 2393.3,
"valid_targets_min": 861
},
{
"epoch": 2.7859237536656893,
"grad_norm": 0.6733786925421605,
"learning_rate": 3.013480050171289e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23346024751663208,
"step": 2850,
"valid_targets_mean": 2390.7,
"valid_targets_min": 728
},
{
"epoch": 2.790811339198436,
"grad_norm": 0.724460745453377,
"learning_rate": 3.009274120234221e-05,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2303357571363449,
"step": 2855,
"valid_targets_mean": 2362.2,
"valid_targets_min": 786
},
{
"epoch": 2.795698924731183,
"grad_norm": 0.6645986334487373,
"learning_rate": 3.0050621932479402e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22619573771953583,
"step": 2860,
"valid_targets_mean": 2401.0,
"valid_targets_min": 832
},
{
"epoch": 2.80058651026393,
"grad_norm": 0.6600838806245943,
"learning_rate": 3.0008442942394763e-05,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26058539748191833,
"step": 2865,
"valid_targets_mean": 2661.4,
"valid_targets_min": 1131
},
{
"epoch": 2.8054740957966766,
"grad_norm": 0.64943249977253,
"learning_rate": 2.9966204482713447e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22463732957839966,
"step": 2870,
"valid_targets_mean": 2495.8,
"valid_targets_min": 680
},
{
"epoch": 2.8103616813294234,
"grad_norm": 0.6786818865745439,
"learning_rate": 2.9923906804413966e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2178959995508194,
"step": 2875,
"valid_targets_mean": 2419.3,
"valid_targets_min": 826
},
{
"epoch": 2.8152492668621703,
"grad_norm": 0.5944406321947248,
"learning_rate": 2.988155015882671e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23274701833724976,
"step": 2880,
"valid_targets_mean": 3016.2,
"valid_targets_min": 906
},
{
"epoch": 2.820136852394917,
"grad_norm": 0.7333620836779235,
"learning_rate": 2.9839134797632448e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2247675657272339,
"step": 2885,
"valid_targets_mean": 1883.5,
"valid_targets_min": 635
},
{
"epoch": 2.825024437927664,
"grad_norm": 0.6805311682642338,
"learning_rate": 2.9796660972860843e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23136526346206665,
"step": 2890,
"valid_targets_mean": 2278.5,
"valid_targets_min": 807
},
{
"epoch": 2.8299120234604107,
"grad_norm": 0.7830726431275282,
"learning_rate": 2.975412893688893e-05,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24189212918281555,
"step": 2895,
"valid_targets_mean": 1769.8,
"valid_targets_min": 663
},
{
"epoch": 2.8347996089931575,
"grad_norm": 0.6769811140537966,
"learning_rate": 2.9711538942439637e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22272557020187378,
"step": 2900,
"valid_targets_mean": 2156.8,
"valid_targets_min": 876
},
{
"epoch": 2.8396871945259043,
"grad_norm": 0.7674529053801956,
"learning_rate": 2.9668891242580287e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2575834095478058,
"step": 2905,
"valid_targets_mean": 2216.5,
"valid_targets_min": 744
},
{
"epoch": 2.844574780058651,
"grad_norm": 0.6658603801212766,
"learning_rate": 2.962618609072108e-05,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25467610359191895,
"step": 2910,
"valid_targets_mean": 2915.1,
"valid_targets_min": 694
},
{
"epoch": 2.849462365591398,
"grad_norm": 0.62994164165599,
"learning_rate": 2.9583423740613583e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25572115182876587,
"step": 2915,
"valid_targets_mean": 2733.2,
"valid_targets_min": 1002
},
{
"epoch": 2.854349951124145,
"grad_norm": 0.7802082469784795,
"learning_rate": 2.954060444634924e-05,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21022462844848633,
"step": 2920,
"valid_targets_mean": 1662.9,
"valid_targets_min": 749
},
{
"epoch": 2.8592375366568916,
"grad_norm": 0.7025252669117502,
"learning_rate": 2.9497728462357854e-05,
"loss": 0.2285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2211170792579651,
"step": 2925,
"valid_targets_mean": 1993.3,
"valid_targets_min": 695
},
{
"epoch": 2.8641251221896384,
"grad_norm": 0.5702454921369775,
"learning_rate": 2.9454796043406082e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22452156245708466,
"step": 2930,
"valid_targets_mean": 3428.3,
"valid_targets_min": 765
},
{
"epoch": 2.8690127077223853,
"grad_norm": 0.737348955153242,
"learning_rate": 2.9411807444595903e-05,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21879072487354279,
"step": 2935,
"valid_targets_mean": 2037.2,
"valid_targets_min": 636
},
{
"epoch": 2.873900293255132,
"grad_norm": 0.7194505785174569,
"learning_rate": 2.936876292136311e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2638698220252991,
"step": 2940,
"valid_targets_mean": 2237.4,
"valid_targets_min": 834
},
{
"epoch": 2.878787878787879,
"grad_norm": 0.7215626747806759,
"learning_rate": 2.9325662729475808e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24015557765960693,
"step": 2945,
"valid_targets_mean": 2293.9,
"valid_targets_min": 752
},
{
"epoch": 2.8836754643206257,
"grad_norm": 0.6723838618072419,
"learning_rate": 2.928250712503288e-05,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21491815149784088,
"step": 2950,
"valid_targets_mean": 2184.8,
"valid_targets_min": 979
},
{
"epoch": 2.8885630498533725,
"grad_norm": 0.7739998699952924,
"learning_rate": 2.9239296364462467e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25200653076171875,
"step": 2955,
"valid_targets_mean": 2104.8,
"valid_targets_min": 815
},
{
"epoch": 2.8934506353861194,
"grad_norm": 0.6661883736388912,
"learning_rate": 2.919603070452043e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24104368686676025,
"step": 2960,
"valid_targets_mean": 2636.2,
"valid_targets_min": 821
},
{
"epoch": 2.898338220918866,
"grad_norm": 0.777296307434507,
"learning_rate": 2.915271040228886e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22833505272865295,
"step": 2965,
"valid_targets_mean": 1935.4,
"valid_targets_min": 892
},
{
"epoch": 2.903225806451613,
"grad_norm": 0.6089518142750111,
"learning_rate": 2.9109335715174517e-05,
"loss": 0.233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23753002285957336,
"step": 2970,
"valid_targets_mean": 3033.2,
"valid_targets_min": 1109
},
{
"epoch": 2.90811339198436,
"grad_norm": 0.782726714582175,
"learning_rate": 2.9065906900907318e-05,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23450714349746704,
"step": 2975,
"valid_targets_mean": 1985.1,
"valid_targets_min": 770
},
{
"epoch": 2.9130009775171066,
"grad_norm": 0.6413112020747412,
"learning_rate": 2.9022424217538797e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2412833422422409,
"step": 2980,
"valid_targets_mean": 2716.9,
"valid_targets_min": 985
},
{
"epoch": 2.9178885630498534,
"grad_norm": 0.6854532986235314,
"learning_rate": 2.8978887923440573e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23968929052352905,
"step": 2985,
"valid_targets_mean": 2625.2,
"valid_targets_min": 940
},
{
"epoch": 2.9227761485826003,
"grad_norm": 0.6876034052530781,
"learning_rate": 2.8935298277302827e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24147212505340576,
"step": 2990,
"valid_targets_mean": 2415.8,
"valid_targets_min": 727
},
{
"epoch": 2.927663734115347,
"grad_norm": 0.6592399161754122,
"learning_rate": 2.8891655538132747e-05,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24528644979000092,
"step": 2995,
"valid_targets_mean": 2493.1,
"valid_targets_min": 879
},
{
"epoch": 2.932551319648094,
"grad_norm": 0.7330835802360961,
"learning_rate": 2.8847959965252997e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24110592901706696,
"step": 3000,
"valid_targets_mean": 2464.8,
"valid_targets_min": 714
},
{
"epoch": 2.9374389051808407,
"grad_norm": 0.9963806436549506,
"learning_rate": 2.8804211818300175e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24917423725128174,
"step": 3005,
"valid_targets_mean": 2112.3,
"valid_targets_min": 635
},
{
"epoch": 2.9423264907135875,
"grad_norm": 0.7093645468792228,
"learning_rate": 2.8760411357223274e-05,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.256412148475647,
"step": 3010,
"valid_targets_mean": 2230.4,
"valid_targets_min": 514
},
{
"epoch": 2.9472140762463344,
"grad_norm": 0.6313278112245672,
"learning_rate": 2.8716558842282133e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21212854981422424,
"step": 3015,
"valid_targets_mean": 2637.0,
"valid_targets_min": 916
},
{
"epoch": 2.952101661779081,
"grad_norm": 0.5943727879588198,
"learning_rate": 2.8672654534045893e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22816044092178345,
"step": 3020,
"valid_targets_mean": 3090.9,
"valid_targets_min": 819
},
{
"epoch": 2.956989247311828,
"grad_norm": 0.6972022185831341,
"learning_rate": 2.8628698693391454e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24018850922584534,
"step": 3025,
"valid_targets_mean": 2340.3,
"valid_targets_min": 807
},
{
"epoch": 2.961876832844575,
"grad_norm": 0.6777221287793921,
"learning_rate": 2.8584691581501904e-05,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22792454063892365,
"step": 3030,
"valid_targets_mean": 2147.8,
"valid_targets_min": 929
},
{
"epoch": 2.9667644183773216,
"grad_norm": 0.608921349958511,
"learning_rate": 2.8540633459864984e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22310322523117065,
"step": 3035,
"valid_targets_mean": 2694.1,
"valid_targets_min": 714
},
{
"epoch": 2.9716520039100685,
"grad_norm": 0.6960978391554294,
"learning_rate": 2.8496524590271558e-05,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25981682538986206,
"step": 3040,
"valid_targets_mean": 2517.1,
"valid_targets_min": 940
},
{
"epoch": 2.9765395894428153,
"grad_norm": 0.7378583701878564,
"learning_rate": 2.8452365234813992e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1961268186569214,
"step": 3045,
"valid_targets_mean": 2311.8,
"valid_targets_min": 740
},
{
"epoch": 2.981427174975562,
"grad_norm": 0.6720248721061973,
"learning_rate": 2.8408155655884666e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2390064001083374,
"step": 3050,
"valid_targets_mean": 2484.6,
"valid_targets_min": 1076
},
{
"epoch": 2.986314760508309,
"grad_norm": 0.6878264817723515,
"learning_rate": 2.836389611617437e-05,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2337898164987564,
"step": 3055,
"valid_targets_mean": 2284.5,
"valid_targets_min": 1266
},
{
"epoch": 2.9912023460410557,
"grad_norm": 0.6966111553176655,
"learning_rate": 2.8319586878670767e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22837823629379272,
"step": 3060,
"valid_targets_mean": 2068.6,
"valid_targets_min": 772
},
{
"epoch": 2.9960899315738025,
"grad_norm": 0.6945196129457747,
"learning_rate": 2.827522820665681e-05,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2056921422481537,
"step": 3065,
"valid_targets_mean": 2009.1,
"valid_targets_min": 612
},
{
"epoch": 3.0009775171065494,
"grad_norm": 0.6719993247544616,
"learning_rate": 2.82308203637092e-05,
"loss": 0.2409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2267838567495346,
"step": 3070,
"valid_targets_mean": 2419.8,
"valid_targets_min": 732
},
{
"epoch": 3.005865102639296,
"grad_norm": 0.6667645399427046,
"learning_rate": 2.8186363613696807e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22658130526542664,
"step": 3075,
"valid_targets_mean": 2837.1,
"valid_targets_min": 648
},
{
"epoch": 3.010752688172043,
"grad_norm": 0.6995064995237391,
"learning_rate": 2.81418582207791e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21117915213108063,
"step": 3080,
"valid_targets_mean": 2488.8,
"valid_targets_min": 746
},
{
"epoch": 3.01564027370479,
"grad_norm": 0.7816935143677926,
"learning_rate": 2.809730444940459e-05,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19485579431056976,
"step": 3085,
"valid_targets_mean": 1877.2,
"valid_targets_min": 585
},
{
"epoch": 3.0205278592375366,
"grad_norm": 0.6280789848534472,
"learning_rate": 2.8052702564309232e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18880394101142883,
"step": 3090,
"valid_targets_mean": 2680.8,
"valid_targets_min": 754
},
{
"epoch": 3.0254154447702835,
"grad_norm": 0.7246655595987659,
"learning_rate": 2.8008052830514882e-05,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21295440196990967,
"step": 3095,
"valid_targets_mean": 2274.8,
"valid_targets_min": 788
},
{
"epoch": 3.0303030303030303,
"grad_norm": 0.7042756737696498,
"learning_rate": 2.7963355513327717e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23234760761260986,
"step": 3100,
"valid_targets_mean": 2904.4,
"valid_targets_min": 708
},
{
"epoch": 3.035190615835777,
"grad_norm": 0.7467994069578198,
"learning_rate": 2.7918610878336644e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22012445330619812,
"step": 3105,
"valid_targets_mean": 2543.5,
"valid_targets_min": 893
},
{
"epoch": 3.040078201368524,
"grad_norm": 0.6581294580719984,
"learning_rate": 2.7873819191411732e-05,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1838349997997284,
"step": 3110,
"valid_targets_mean": 2560.5,
"valid_targets_min": 1434
},
{
"epoch": 3.0449657869012707,
"grad_norm": 0.6275202980378985,
"learning_rate": 2.782898071870261e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1899479627609253,
"step": 3115,
"valid_targets_mean": 2978.4,
"valid_targets_min": 723
},
{
"epoch": 3.0498533724340176,
"grad_norm": 0.708666227527697,
"learning_rate": 2.7784095726636945e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2058933973312378,
"step": 3120,
"valid_targets_mean": 2619.5,
"valid_targets_min": 1038
},
{
"epoch": 3.0547409579667644,
"grad_norm": 0.7252823344406546,
"learning_rate": 2.773916448191879e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2228691130876541,
"step": 3125,
"valid_targets_mean": 2502.4,
"valid_targets_min": 855
},
{
"epoch": 3.059628543499511,
"grad_norm": 0.6775893290948455,
"learning_rate": 2.7694187251527034e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20811831951141357,
"step": 3130,
"valid_targets_mean": 2852.7,
"valid_targets_min": 834
},
{
"epoch": 3.064516129032258,
"grad_norm": 0.6750667682794524,
"learning_rate": 2.7649164302713818e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2103792279958725,
"step": 3135,
"valid_targets_mean": 2695.4,
"valid_targets_min": 1083
},
{
"epoch": 3.069403714565005,
"grad_norm": 0.6452750671952329,
"learning_rate": 2.7604095903002925e-05,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19791629910469055,
"step": 3140,
"valid_targets_mean": 2622.8,
"valid_targets_min": 851
},
{
"epoch": 3.0742913000977516,
"grad_norm": 0.6855575675327805,
"learning_rate": 2.7558982320188228e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20340736210346222,
"step": 3145,
"valid_targets_mean": 2924.1,
"valid_targets_min": 858
},
{
"epoch": 3.0791788856304985,
"grad_norm": 0.7823747155692843,
"learning_rate": 2.7513823822332044e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19628237187862396,
"step": 3150,
"valid_targets_mean": 1840.7,
"valid_targets_min": 759
},
{
"epoch": 3.0840664711632453,
"grad_norm": 0.8146578281379756,
"learning_rate": 2.74686206777636e-05,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20766061544418335,
"step": 3155,
"valid_targets_mean": 1969.3,
"valid_targets_min": 918
},
{
"epoch": 3.088954056695992,
"grad_norm": 0.6883738938370201,
"learning_rate": 2.7423373155077403e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18747478723526,
"step": 3160,
"valid_targets_mean": 2373.4,
"valid_targets_min": 856
},
{
"epoch": 3.093841642228739,
"grad_norm": 0.7077726637761635,
"learning_rate": 2.7378081523131644e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20626375079154968,
"step": 3165,
"valid_targets_mean": 2385.8,
"valid_targets_min": 683
},
{
"epoch": 3.0987292277614857,
"grad_norm": 0.8627305595439234,
"learning_rate": 2.7332746051046616e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21347269415855408,
"step": 3170,
"valid_targets_mean": 2014.2,
"valid_targets_min": 734
},
{
"epoch": 3.1036168132942326,
"grad_norm": 0.7893777089075921,
"learning_rate": 2.72873670082031e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2146587371826172,
"step": 3175,
"valid_targets_mean": 2289.4,
"valid_targets_min": 642
},
{
"epoch": 3.1085043988269794,
"grad_norm": 0.8273291714086848,
"learning_rate": 2.7241944664240792e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16076461970806122,
"step": 3180,
"valid_targets_mean": 1337.8,
"valid_targets_min": 514
},
{
"epoch": 3.113391984359726,
"grad_norm": 0.729684484993837,
"learning_rate": 2.719647928905666e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20329692959785461,
"step": 3185,
"valid_targets_mean": 2202.4,
"valid_targets_min": 1251
},
{
"epoch": 3.118279569892473,
"grad_norm": 0.6526019445711841,
"learning_rate": 2.715097115280337e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19159898161888123,
"step": 3190,
"valid_targets_mean": 2702.8,
"valid_targets_min": 793
},
{
"epoch": 3.12316715542522,
"grad_norm": 0.7498464955317224,
"learning_rate": 2.7105420525887667e-05,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2095525860786438,
"step": 3195,
"valid_targets_mean": 2154.8,
"valid_targets_min": 916
},
{
"epoch": 3.1280547409579667,
"grad_norm": 0.7063138314214019,
"learning_rate": 2.7059827678968775e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19605648517608643,
"step": 3200,
"valid_targets_mean": 2327.6,
"valid_targets_min": 916
},
{
"epoch": 3.1329423264907135,
"grad_norm": 0.759819492933154,
"learning_rate": 2.7014192882956795e-05,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2000146508216858,
"step": 3205,
"valid_targets_mean": 2217.5,
"valid_targets_min": 682
},
{
"epoch": 3.1378299120234603,
"grad_norm": 0.7249197896837959,
"learning_rate": 2.6968516409011073e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2277396023273468,
"step": 3210,
"valid_targets_mean": 2899.7,
"valid_targets_min": 905
},
{
"epoch": 3.142717497556207,
"grad_norm": 0.6645341527478739,
"learning_rate": 2.6922798528538615e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1898479163646698,
"step": 3215,
"valid_targets_mean": 2493.7,
"valid_targets_min": 697
},
{
"epoch": 3.147605083088954,
"grad_norm": 0.7890579447239405,
"learning_rate": 2.6877039513192452e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1876201033592224,
"step": 3220,
"valid_targets_mean": 2037.3,
"valid_targets_min": 916
},
{
"epoch": 3.1524926686217007,
"grad_norm": 0.7907814247477751,
"learning_rate": 2.6831239634870044e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19796785712242126,
"step": 3225,
"valid_targets_mean": 1733.1,
"valid_targets_min": 742
},
{
"epoch": 3.1573802541544476,
"grad_norm": 0.7070573564286917,
"learning_rate": 2.6785399165711662e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19448038935661316,
"step": 3230,
"valid_targets_mean": 2516.5,
"valid_targets_min": 1012
},
{
"epoch": 3.1622678396871944,
"grad_norm": 0.7496403178879768,
"learning_rate": 2.673951837809874e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20808371901512146,
"step": 3235,
"valid_targets_mean": 2226.3,
"valid_targets_min": 702
},
{
"epoch": 3.167155425219941,
"grad_norm": 0.7481396583011426,
"learning_rate": 2.669359754465231e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20283767580986023,
"step": 3240,
"valid_targets_mean": 2323.2,
"valid_targets_min": 618
},
{
"epoch": 3.172043010752688,
"grad_norm": 0.7195578782630686,
"learning_rate": 2.6647636938231342e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21234679222106934,
"step": 3245,
"valid_targets_mean": 2472.0,
"valid_targets_min": 642
},
{
"epoch": 3.176930596285435,
"grad_norm": 0.7513145461378141,
"learning_rate": 2.6601636831931134e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21580851078033447,
"step": 3250,
"valid_targets_mean": 2293.7,
"valid_targets_min": 521
},
{
"epoch": 3.1818181818181817,
"grad_norm": 0.7021834829360021,
"learning_rate": 2.6555597499081694e-05,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2086678445339203,
"step": 3255,
"valid_targets_mean": 2655.6,
"valid_targets_min": 921
},
{
"epoch": 3.1867057673509285,
"grad_norm": 0.7337259433387169,
"learning_rate": 2.6509519213246107e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19709116220474243,
"step": 3260,
"valid_targets_mean": 2152.6,
"valid_targets_min": 661
},
{
"epoch": 3.1915933528836753,
"grad_norm": 0.7732965615576772,
"learning_rate": 2.646340224821892e-05,
"loss": 0.1973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17325511574745178,
"step": 3265,
"valid_targets_mean": 1718.6,
"valid_targets_min": 757
},
{
"epoch": 3.196480938416422,
"grad_norm": 0.7642020533927616,
"learning_rate": 2.64172468780245e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21912142634391785,
"step": 3270,
"valid_targets_mean": 1914.9,
"valid_targets_min": 762
},
{
"epoch": 3.201368523949169,
"grad_norm": 0.7137081449723205,
"learning_rate": 2.6371053376915442e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1930808126926422,
"step": 3275,
"valid_targets_mean": 2530.1,
"valid_targets_min": 1259
},
{
"epoch": 3.2062561094819158,
"grad_norm": 0.7965252099837399,
"learning_rate": 2.6324822019370874e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20748776197433472,
"step": 3280,
"valid_targets_mean": 2264.4,
"valid_targets_min": 801
},
{
"epoch": 3.2111436950146626,
"grad_norm": 0.7194214666441809,
"learning_rate": 2.6278553080094887e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22017285227775574,
"step": 3285,
"valid_targets_mean": 2692.5,
"valid_targets_min": 794
},
{
"epoch": 3.2160312805474094,
"grad_norm": 0.7245863184684226,
"learning_rate": 2.6232246834014876e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1813446581363678,
"step": 3290,
"valid_targets_mean": 2046.6,
"valid_targets_min": 659
},
{
"epoch": 3.220918866080156,
"grad_norm": 0.7908976384173254,
"learning_rate": 2.618590355627992e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2101239562034607,
"step": 3295,
"valid_targets_mean": 2258.9,
"valid_targets_min": 1006
},
{
"epoch": 3.225806451612903,
"grad_norm": 0.7977860033215038,
"learning_rate": 2.613952352225912e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18104560673236847,
"step": 3300,
"valid_targets_mean": 1767.8,
"valid_targets_min": 484
},
{
"epoch": 3.23069403714565,
"grad_norm": 0.6115674983154584,
"learning_rate": 2.6093107007539998e-05,
"loss": 0.1965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17804718017578125,
"step": 3305,
"valid_targets_mean": 3087.1,
"valid_targets_min": 818
},
{
"epoch": 3.2355816226783967,
"grad_norm": 0.6099669179614807,
"learning_rate": 2.604665428792683e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20128144323825836,
"step": 3310,
"valid_targets_mean": 3071.8,
"valid_targets_min": 1057
},
{
"epoch": 3.2404692082111435,
"grad_norm": 0.7754454106550883,
"learning_rate": 2.600016563943904e-05,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.216938778758049,
"step": 3315,
"valid_targets_mean": 2073.1,
"valid_targets_min": 740
},
{
"epoch": 3.2453567937438903,
"grad_norm": 0.7143546354659018,
"learning_rate": 2.5953641338309496e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19034463167190552,
"step": 3320,
"valid_targets_mean": 2202.1,
"valid_targets_min": 737
},
{
"epoch": 3.250244379276637,
"grad_norm": 0.8320544699825392,
"learning_rate": 2.590708166098296e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20066097378730774,
"step": 3325,
"valid_targets_mean": 2138.4,
"valid_targets_min": 985
},
{
"epoch": 3.255131964809384,
"grad_norm": 0.7253333750300228,
"learning_rate": 2.586048688411437e-05,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23125603795051575,
"step": 3330,
"valid_targets_mean": 2893.1,
"valid_targets_min": 1018
},
{
"epoch": 3.2600195503421308,
"grad_norm": 0.730875427222105,
"learning_rate": 2.5813857284567237e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19738978147506714,
"step": 3335,
"valid_targets_mean": 2522.3,
"valid_targets_min": 859
},
{
"epoch": 3.2649071358748776,
"grad_norm": 0.7298430353490984,
"learning_rate": 2.5767193139411964e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20270711183547974,
"step": 3340,
"valid_targets_mean": 2434.2,
"valid_targets_min": 467
},
{
"epoch": 3.2697947214076244,
"grad_norm": 1.083616521939471,
"learning_rate": 2.5720494725924257e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21499906480312347,
"step": 3345,
"valid_targets_mean": 1869.0,
"valid_targets_min": 724
},
{
"epoch": 3.274682306940371,
"grad_norm": 0.6154395147501789,
"learning_rate": 2.5673762321583415e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21717801690101624,
"step": 3350,
"valid_targets_mean": 3228.8,
"valid_targets_min": 974
},
{
"epoch": 3.279569892473118,
"grad_norm": 0.7777446446492675,
"learning_rate": 2.5626996204070714e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.207222580909729,
"step": 3355,
"valid_targets_mean": 2294.8,
"valid_targets_min": 705
},
{
"epoch": 3.2844574780058653,
"grad_norm": 0.626315557736335,
"learning_rate": 2.558019665126777e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18110740184783936,
"step": 3360,
"valid_targets_mean": 2922.9,
"valid_targets_min": 607
},
{
"epoch": 3.289345063538612,
"grad_norm": 0.6898177043479149,
"learning_rate": 2.5533363941254826e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18781378865242004,
"step": 3365,
"valid_targets_mean": 2249.1,
"valid_targets_min": 740
},
{
"epoch": 3.294232649071359,
"grad_norm": 0.7219158135860761,
"learning_rate": 2.5486498352309194e-05,
"loss": 0.1993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19829457998275757,
"step": 3370,
"valid_targets_mean": 2316.6,
"valid_targets_min": 896
},
{
"epoch": 3.2991202346041058,
"grad_norm": 0.7339876884452256,
"learning_rate": 2.5439600162903527e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2177194505929947,
"step": 3375,
"valid_targets_mean": 2257.8,
"valid_targets_min": 726
},
{
"epoch": 3.3040078201368526,
"grad_norm": 0.6776390716226277,
"learning_rate": 2.5392669651704185e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19257496297359467,
"step": 3380,
"valid_targets_mean": 2925.8,
"valid_targets_min": 1060
},
{
"epoch": 3.3088954056695994,
"grad_norm": 0.759226279377635,
"learning_rate": 2.5345707097569586e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1948852837085724,
"step": 3385,
"valid_targets_mean": 2035.1,
"valid_targets_min": 679
},
{
"epoch": 3.313782991202346,
"grad_norm": 0.7681252041823609,
"learning_rate": 2.529871277954854e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.219600647687912,
"step": 3390,
"valid_targets_mean": 2099.7,
"valid_targets_min": 798
},
{
"epoch": 3.318670576735093,
"grad_norm": 0.7587652122936347,
"learning_rate": 2.5251686976878618e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18549835681915283,
"step": 3395,
"valid_targets_mean": 2503.0,
"valid_targets_min": 847
},
{
"epoch": 3.32355816226784,
"grad_norm": 0.6848113837428216,
"learning_rate": 2.5204629968984443e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21900366246700287,
"step": 3400,
"valid_targets_mean": 2764.0,
"valid_targets_min": 651
},
{
"epoch": 3.3284457478005867,
"grad_norm": 0.6897084263388162,
"learning_rate": 2.5157542035476077e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19517606496810913,
"step": 3405,
"valid_targets_mean": 2661.6,
"valid_targets_min": 960
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.7517965693921952,
"learning_rate": 2.5110423456147322e-05,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21612215042114258,
"step": 3410,
"valid_targets_mean": 2433.1,
"valid_targets_min": 975
},
{
"epoch": 3.3382209188660803,
"grad_norm": 0.7318661225517749,
"learning_rate": 2.50632745109741e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1917639672756195,
"step": 3415,
"valid_targets_mean": 1934.4,
"valid_targets_min": 771
},
{
"epoch": 3.343108504398827,
"grad_norm": 0.7445802916995302,
"learning_rate": 2.501609548011275e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1921059787273407,
"step": 3420,
"valid_targets_mean": 2087.8,
"valid_targets_min": 692
},
{
"epoch": 3.347996089931574,
"grad_norm": 0.6673062277647884,
"learning_rate": 2.4968886643898366e-05,
"loss": 0.1905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18176676332950592,
"step": 3425,
"valid_targets_mean": 2963.6,
"valid_targets_min": 1007
},
{
"epoch": 3.3528836754643208,
"grad_norm": 0.9097050470991745,
"learning_rate": 2.4921648282843176e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18103784322738647,
"step": 3430,
"valid_targets_mean": 2004.6,
"valid_targets_min": 628
},
{
"epoch": 3.3577712609970676,
"grad_norm": 0.7122931954083914,
"learning_rate": 2.4874380677634817e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19356971979141235,
"step": 3435,
"valid_targets_mean": 2382.2,
"valid_targets_min": 914
},
{
"epoch": 3.3626588465298144,
"grad_norm": 0.7088171184773836,
"learning_rate": 2.4827084109134697e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20455177128314972,
"step": 3440,
"valid_targets_mean": 2174.6,
"valid_targets_min": 657
},
{
"epoch": 3.367546432062561,
"grad_norm": 0.6612005144692485,
"learning_rate": 2.477975885837634e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21015259623527527,
"step": 3445,
"valid_targets_mean": 2880.4,
"valid_targets_min": 648
},
{
"epoch": 3.372434017595308,
"grad_norm": 0.7655924949272598,
"learning_rate": 2.473240520656367e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2177879959344864,
"step": 3450,
"valid_targets_mean": 2229.4,
"valid_targets_min": 836
},
{
"epoch": 3.377321603128055,
"grad_norm": 0.7618724000532252,
"learning_rate": 2.4685023435069388e-05,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23734396696090698,
"step": 3455,
"valid_targets_mean": 2332.8,
"valid_targets_min": 621
},
{
"epoch": 3.3822091886608017,
"grad_norm": 0.8143707345252376,
"learning_rate": 2.4637613825433277e-05,
"loss": 0.1896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19915053248405457,
"step": 3460,
"valid_targets_mean": 1512.4,
"valid_targets_min": 668
},
{
"epoch": 3.3870967741935485,
"grad_norm": 0.8158876268350879,
"learning_rate": 2.4590176659360538e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22826993465423584,
"step": 3465,
"valid_targets_mean": 2035.4,
"valid_targets_min": 650
},
{
"epoch": 3.3919843597262953,
"grad_norm": 0.6759338161481376,
"learning_rate": 2.4542712218720093e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18781697750091553,
"step": 3470,
"valid_targets_mean": 2423.6,
"valid_targets_min": 738
},
{
"epoch": 3.396871945259042,
"grad_norm": 0.6931462841032442,
"learning_rate": 2.449522078554294e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20876827836036682,
"step": 3475,
"valid_targets_mean": 2486.4,
"valid_targets_min": 610
},
{
"epoch": 3.401759530791789,
"grad_norm": 0.656880638760444,
"learning_rate": 2.444770264202047e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21965506672859192,
"step": 3480,
"valid_targets_mean": 2932.4,
"valid_targets_min": 924
},
{
"epoch": 3.4066471163245358,
"grad_norm": 0.7793846246855756,
"learning_rate": 2.4400158070502773e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2179027497768402,
"step": 3485,
"valid_targets_mean": 2128.7,
"valid_targets_min": 807
},
{
"epoch": 3.4115347018572826,
"grad_norm": 0.6366727057551457,
"learning_rate": 2.435258735349699e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.207027405500412,
"step": 3490,
"valid_targets_mean": 3005.8,
"valid_targets_min": 901
},
{
"epoch": 3.4164222873900294,
"grad_norm": 0.8083254712829566,
"learning_rate": 2.4304990773665587e-05,
"loss": 0.2094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22201141715049744,
"step": 3495,
"valid_targets_mean": 2266.4,
"valid_targets_min": 790
},
{
"epoch": 3.421309872922776,
"grad_norm": 0.7883137521426757,
"learning_rate": 2.4257368613824745e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18446215987205505,
"step": 3500,
"valid_targets_mean": 1863.5,
"valid_targets_min": 1075
},
{
"epoch": 3.426197458455523,
"grad_norm": 0.7729853988513622,
"learning_rate": 2.4209721156942615e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1607511341571808,
"step": 3505,
"valid_targets_mean": 1680.6,
"valid_targets_min": 792
},
{
"epoch": 3.43108504398827,
"grad_norm": 0.7615871115872819,
"learning_rate": 2.416204868613765e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2097199559211731,
"step": 3510,
"valid_targets_mean": 2369.9,
"valid_targets_min": 809
},
{
"epoch": 3.4359726295210167,
"grad_norm": 0.7886947243326079,
"learning_rate": 2.4114351484676975e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22828155755996704,
"step": 3515,
"valid_targets_mean": 2259.6,
"valid_targets_min": 702
},
{
"epoch": 3.4408602150537635,
"grad_norm": 0.6428893882305308,
"learning_rate": 2.4066629835974614e-05,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22016070783138275,
"step": 3520,
"valid_targets_mean": 3275.2,
"valid_targets_min": 1265
},
{
"epoch": 3.4457478005865103,
"grad_norm": 0.822974697294548,
"learning_rate": 2.40188840235899e-05,
"loss": 0.2002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20060139894485474,
"step": 3525,
"valid_targets_mean": 1830.9,
"valid_targets_min": 692
},
{
"epoch": 3.450635386119257,
"grad_norm": 0.6770812059975508,
"learning_rate": 2.3971114331225715e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20556485652923584,
"step": 3530,
"valid_targets_mean": 2694.8,
"valid_targets_min": 642
},
{
"epoch": 3.455522971652004,
"grad_norm": 0.7786397671656108,
"learning_rate": 2.392332104272684e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2165582925081253,
"step": 3535,
"valid_targets_mean": 2489.4,
"valid_targets_min": 786
},
{
"epoch": 3.4604105571847508,
"grad_norm": 0.7323225666730152,
"learning_rate": 2.3875504442078282e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21573954820632935,
"step": 3540,
"valid_targets_mean": 2259.0,
"valid_targets_min": 713
},
{
"epoch": 3.4652981427174976,
"grad_norm": 0.6799054356460841,
"learning_rate": 2.3827664813403537e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1902822107076645,
"step": 3545,
"valid_targets_mean": 2551.8,
"valid_targets_min": 627
},
{
"epoch": 3.4701857282502444,
"grad_norm": 0.7472013601982304,
"learning_rate": 2.3779802440962958e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20308758318424225,
"step": 3550,
"valid_targets_mean": 2375.5,
"valid_targets_min": 982
},
{
"epoch": 3.4750733137829912,
"grad_norm": 0.7391959529865234,
"learning_rate": 2.3731917609152023e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21505077183246613,
"step": 3555,
"valid_targets_mean": 2454.9,
"valid_targets_min": 704
},
{
"epoch": 3.479960899315738,
"grad_norm": 0.6408227234028441,
"learning_rate": 2.3684010602499675e-05,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18841466307640076,
"step": 3560,
"valid_targets_mean": 2844.4,
"valid_targets_min": 736
},
{
"epoch": 3.484848484848485,
"grad_norm": 0.6995274259824635,
"learning_rate": 2.363608170566661e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19288122653961182,
"step": 3565,
"valid_targets_mean": 2298.1,
"valid_targets_min": 593
},
{
"epoch": 3.4897360703812317,
"grad_norm": 0.712559649636414,
"learning_rate": 2.35881312034436e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18562278151512146,
"step": 3570,
"valid_targets_mean": 2527.5,
"valid_targets_min": 1190
},
{
"epoch": 3.4946236559139785,
"grad_norm": 0.7601682130608852,
"learning_rate": 2.3540159380749794e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18290041387081146,
"step": 3575,
"valid_targets_mean": 1959.9,
"valid_targets_min": 244
},
{
"epoch": 3.4995112414467253,
"grad_norm": 0.6518733256350043,
"learning_rate": 2.349216652263101e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1879890263080597,
"step": 3580,
"valid_targets_mean": 2892.5,
"valid_targets_min": 788
},
{
"epoch": 3.504398826979472,
"grad_norm": 0.6632097525792074,
"learning_rate": 2.3444152914258087e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19737496972084045,
"step": 3585,
"valid_targets_mean": 2592.2,
"valid_targets_min": 694
},
{
"epoch": 3.509286412512219,
"grad_norm": 0.701914967587876,
"learning_rate": 2.339611884092514e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21197064220905304,
"step": 3590,
"valid_targets_mean": 2489.3,
"valid_targets_min": 763
},
{
"epoch": 3.5141739980449658,
"grad_norm": 0.7664935207947431,
"learning_rate": 2.3348064588047893e-05,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19324423372745514,
"step": 3595,
"valid_targets_mean": 1855.3,
"valid_targets_min": 635
},
{
"epoch": 3.5190615835777126,
"grad_norm": 0.7141259014048177,
"learning_rate": 2.329999044116197e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21774733066558838,
"step": 3600,
"valid_targets_mean": 2392.5,
"valid_targets_min": 682
},
{
"epoch": 3.5239491691104594,
"grad_norm": 0.6730829479768565,
"learning_rate": 2.3251896685921205e-05,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19916030764579773,
"step": 3605,
"valid_targets_mean": 2920.2,
"valid_targets_min": 821
},
{
"epoch": 3.5288367546432062,
"grad_norm": 0.7671142376386617,
"learning_rate": 2.3203783608095954e-05,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23348473012447357,
"step": 3610,
"valid_targets_mean": 2295.7,
"valid_targets_min": 959
},
{
"epoch": 3.533724340175953,
"grad_norm": 0.7689072632328403,
"learning_rate": 2.3155651493571382e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20937813818454742,
"step": 3615,
"valid_targets_mean": 2182.8,
"valid_targets_min": 1082
},
{
"epoch": 3.5386119257087,
"grad_norm": 0.7292242265860919,
"learning_rate": 2.3107500628345756e-05,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22746799886226654,
"step": 3620,
"valid_targets_mean": 2486.5,
"valid_targets_min": 730
},
{
"epoch": 3.5434995112414467,
"grad_norm": 0.7976787109769994,
"learning_rate": 2.3059331298528776e-05,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2245236039161682,
"step": 3625,
"valid_targets_mean": 1958.8,
"valid_targets_min": 1215
},
{
"epoch": 3.5483870967741935,
"grad_norm": 0.7468841302577356,
"learning_rate": 2.301114379033984e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18756568431854248,
"step": 3630,
"valid_targets_mean": 1843.2,
"valid_targets_min": 900
},
{
"epoch": 3.5532746823069403,
"grad_norm": 0.7052365263985373,
"learning_rate": 2.2962938390106388e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.190373957157135,
"step": 3635,
"valid_targets_mean": 2208.5,
"valid_targets_min": 672
},
{
"epoch": 3.558162267839687,
"grad_norm": 0.7861655797997658,
"learning_rate": 2.291471538426214e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21023714542388916,
"step": 3640,
"valid_targets_mean": 2122.3,
"valid_targets_min": 654
},
{
"epoch": 3.563049853372434,
"grad_norm": 0.7654010417442486,
"learning_rate": 2.2866475059345453e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21987277269363403,
"step": 3645,
"valid_targets_mean": 2314.6,
"valid_targets_min": 872
},
{
"epoch": 3.567937438905181,
"grad_norm": 0.7329153965811843,
"learning_rate": 2.2818217701997577e-05,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19848138093948364,
"step": 3650,
"valid_targets_mean": 2325.4,
"valid_targets_min": 815
},
{
"epoch": 3.5728250244379276,
"grad_norm": 0.6582062601819844,
"learning_rate": 2.276994359896099e-05,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20447036623954773,
"step": 3655,
"valid_targets_mean": 2623.2,
"valid_targets_min": 985
},
{
"epoch": 3.5777126099706744,
"grad_norm": 0.6885840936099205,
"learning_rate": 2.2721653037077645e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2211674004793167,
"step": 3660,
"valid_targets_mean": 2750.7,
"valid_targets_min": 701
},
{
"epoch": 3.5826001955034212,
"grad_norm": 0.7022727114163723,
"learning_rate": 2.2673346303287297e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19418203830718994,
"step": 3665,
"valid_targets_mean": 2241.1,
"valid_targets_min": 548
},
{
"epoch": 3.587487781036168,
"grad_norm": 0.6929148877932964,
"learning_rate": 2.262502368462582e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22029688954353333,
"step": 3670,
"valid_targets_mean": 2660.6,
"valid_targets_min": 729
},
{
"epoch": 3.592375366568915,
"grad_norm": 0.6443170990968766,
"learning_rate": 2.2576685468223444e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18446439504623413,
"step": 3675,
"valid_targets_mean": 2688.0,
"valid_targets_min": 692
},
{
"epoch": 3.5972629521016617,
"grad_norm": 0.600440286447225,
"learning_rate": 2.2528331941303093e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19318996369838715,
"step": 3680,
"valid_targets_mean": 3134.5,
"valid_targets_min": 1041
},
{
"epoch": 3.6021505376344085,
"grad_norm": 0.7844338847583994,
"learning_rate": 2.2479963391178657e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21118606626987457,
"step": 3685,
"valid_targets_mean": 2066.8,
"valid_targets_min": 814
},
{
"epoch": 3.6070381231671553,
"grad_norm": 0.7215085805201092,
"learning_rate": 2.2431580105253313e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20135241746902466,
"step": 3690,
"valid_targets_mean": 2184.1,
"valid_targets_min": 722
},
{
"epoch": 3.611925708699902,
"grad_norm": 0.6656818554741202,
"learning_rate": 2.238318237101778e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20373103022575378,
"step": 3695,
"valid_targets_mean": 2753.5,
"valid_targets_min": 975
},
{
"epoch": 3.616813294232649,
"grad_norm": 0.7180482881493666,
"learning_rate": 2.233477047604863e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1976693719625473,
"step": 3700,
"valid_targets_mean": 2586.9,
"valid_targets_min": 692
},
{
"epoch": 3.621700879765396,
"grad_norm": 0.6461550790717755,
"learning_rate": 2.2286344708006578e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20432640612125397,
"step": 3705,
"valid_targets_mean": 3076.8,
"valid_targets_min": 952
},
{
"epoch": 3.6265884652981426,
"grad_norm": 0.7135365897281873,
"learning_rate": 2.2237905354634775e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21222619712352753,
"step": 3710,
"valid_targets_mean": 2544.2,
"valid_targets_min": 1058
},
{
"epoch": 3.6314760508308894,
"grad_norm": 0.7106647598992838,
"learning_rate": 2.2189452703757097e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1919505000114441,
"step": 3715,
"valid_targets_mean": 2239.9,
"valid_targets_min": 700
},
{
"epoch": 3.6363636363636362,
"grad_norm": 0.7370346403284481,
"learning_rate": 2.214098704327643e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2074413299560547,
"step": 3720,
"valid_targets_mean": 2248.9,
"valid_targets_min": 504
},
{
"epoch": 3.641251221896383,
"grad_norm": 0.6946560980334792,
"learning_rate": 2.2092508661172957e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18183276057243347,
"step": 3725,
"valid_targets_mean": 2272.8,
"valid_targets_min": 746
},
{
"epoch": 3.64613880742913,
"grad_norm": 0.6384613289501591,
"learning_rate": 2.204401784550246e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18616612255573273,
"step": 3730,
"valid_targets_mean": 2584.4,
"valid_targets_min": 684
},
{
"epoch": 3.6510263929618767,
"grad_norm": 0.6909767548097899,
"learning_rate": 2.1995514884394596e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1910645067691803,
"step": 3735,
"valid_targets_mean": 2587.4,
"valid_targets_min": 771
},
{
"epoch": 3.6559139784946235,
"grad_norm": 0.8148464145542923,
"learning_rate": 2.1947000066051204e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20611697435379028,
"step": 3740,
"valid_targets_mean": 1887.4,
"valid_targets_min": 730
},
{
"epoch": 3.6608015640273703,
"grad_norm": 0.7056151602431089,
"learning_rate": 2.189847367874454e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21500477194786072,
"step": 3745,
"valid_targets_mean": 2486.1,
"valid_targets_min": 1001
},
{
"epoch": 3.665689149560117,
"grad_norm": 1.0531242937391503,
"learning_rate": 2.1849936010815653e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21067142486572266,
"step": 3750,
"valid_targets_mean": 1737.8,
"valid_targets_min": 714
},
{
"epoch": 3.670576735092864,
"grad_norm": 0.7901950772244742,
"learning_rate": 2.1801387350672577e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20664237439632416,
"step": 3755,
"valid_targets_mean": 2177.6,
"valid_targets_min": 627
},
{
"epoch": 3.675464320625611,
"grad_norm": 0.7840380182400347,
"learning_rate": 2.175282798678869e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21524584293365479,
"step": 3760,
"valid_targets_mean": 2213.3,
"valid_targets_min": 722
},
{
"epoch": 3.6803519061583576,
"grad_norm": 0.7134090806306669,
"learning_rate": 2.170425820770096e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20987609028816223,
"step": 3765,
"valid_targets_mean": 2505.4,
"valid_targets_min": 1124
},
{
"epoch": 3.6852394916911044,
"grad_norm": 0.7246436271430389,
"learning_rate": 2.1655678302008232e-05,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20697399973869324,
"step": 3770,
"valid_targets_mean": 2323.0,
"valid_targets_min": 753
},
{
"epoch": 3.6901270772238517,
"grad_norm": 0.6770013885437635,
"learning_rate": 2.160708855836954e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1982710063457489,
"step": 3775,
"valid_targets_mean": 2790.8,
"valid_targets_min": 715
},
{
"epoch": 3.6950146627565985,
"grad_norm": 0.799738720478482,
"learning_rate": 2.1558489265502373e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.220750093460083,
"step": 3780,
"valid_targets_mean": 2273.8,
"valid_targets_min": 750
},
{
"epoch": 3.6999022482893453,
"grad_norm": 0.6508927329830108,
"learning_rate": 2.1509880712180946e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20443478226661682,
"step": 3785,
"valid_targets_mean": 2857.2,
"valid_targets_min": 874
},
{
"epoch": 3.704789833822092,
"grad_norm": 0.6802733863979533,
"learning_rate": 2.1461263187234515e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20990541577339172,
"step": 3790,
"valid_targets_mean": 2561.4,
"valid_targets_min": 705
},
{
"epoch": 3.709677419354839,
"grad_norm": 0.7028949057842757,
"learning_rate": 2.141263697954563e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2133583277463913,
"step": 3795,
"valid_targets_mean": 2545.5,
"valid_targets_min": 881
},
{
"epoch": 3.714565004887586,
"grad_norm": 0.6847821139141917,
"learning_rate": 2.1364002378048446e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20359432697296143,
"step": 3800,
"valid_targets_mean": 2529.1,
"valid_targets_min": 914
},
{
"epoch": 3.7194525904203326,
"grad_norm": 0.7683431448503167,
"learning_rate": 2.1315359671726994e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20140613615512848,
"step": 3805,
"valid_targets_mean": 2015.9,
"valid_targets_min": 740
},
{
"epoch": 3.7243401759530794,
"grad_norm": 0.6765983248131439,
"learning_rate": 2.1266709149613448e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19246436655521393,
"step": 3810,
"valid_targets_mean": 2428.9,
"valid_targets_min": 870
},
{
"epoch": 3.7292277614858262,
"grad_norm": 0.9226737395699486,
"learning_rate": 2.1218051100786443e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1814860701560974,
"step": 3815,
"valid_targets_mean": 1909.5,
"valid_targets_min": 779
},
{
"epoch": 3.734115347018573,
"grad_norm": 0.8000270533236249,
"learning_rate": 2.1169385814369317e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22426359355449677,
"step": 3820,
"valid_targets_mean": 1909.4,
"valid_targets_min": 711
},
{
"epoch": 3.73900293255132,
"grad_norm": 0.6753953556756007,
"learning_rate": 2.112071357952844e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1894885152578354,
"step": 3825,
"valid_targets_mean": 2391.7,
"valid_targets_min": 696
},
{
"epoch": 3.7438905180840667,
"grad_norm": 0.7747404427802933,
"learning_rate": 2.1072034685471442e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2056509256362915,
"step": 3830,
"valid_targets_mean": 1816.9,
"valid_targets_min": 548
},
{
"epoch": 3.7487781036168135,
"grad_norm": 0.7637718123929285,
"learning_rate": 2.1023349421445532e-05,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20844748616218567,
"step": 3835,
"valid_targets_mean": 2643.7,
"valid_targets_min": 793
},
{
"epoch": 3.7536656891495603,
"grad_norm": 0.6354837562399616,
"learning_rate": 2.0974658076735767e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1894562840461731,
"step": 3840,
"valid_targets_mean": 2781.6,
"valid_targets_min": 1309
},
{
"epoch": 3.758553274682307,
"grad_norm": 0.6766758246484479,
"learning_rate": 2.0925960940663356e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19174224138259888,
"step": 3845,
"valid_targets_mean": 2529.0,
"valid_targets_min": 987
},
{
"epoch": 3.763440860215054,
"grad_norm": 0.6892947666726518,
"learning_rate": 2.087725830258389e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2084968388080597,
"step": 3850,
"valid_targets_mean": 2646.6,
"valid_targets_min": 655
},
{
"epoch": 3.768328445747801,
"grad_norm": 0.70291002815775,
"learning_rate": 2.082855045188565e-05,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20856565237045288,
"step": 3855,
"valid_targets_mean": 2704.9,
"valid_targets_min": 789
},
{
"epoch": 3.7732160312805476,
"grad_norm": 0.7692739550745331,
"learning_rate": 2.0779837677987927e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19723054766654968,
"step": 3860,
"valid_targets_mean": 1855.1,
"valid_targets_min": 1118
},
{
"epoch": 3.7781036168132944,
"grad_norm": 0.7101378522156258,
"learning_rate": 2.073112027033923e-05,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21212387084960938,
"step": 3865,
"valid_targets_mean": 2229.6,
"valid_targets_min": 1150
},
{
"epoch": 3.7829912023460412,
"grad_norm": 0.795515076642536,
"learning_rate": 2.068239851841563e-05,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20189426839351654,
"step": 3870,
"valid_targets_mean": 2010.2,
"valid_targets_min": 768
},
{
"epoch": 3.787878787878788,
"grad_norm": 0.8748951610329812,
"learning_rate": 2.0633672711718975e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20840033888816833,
"step": 3875,
"valid_targets_mean": 2443.8,
"valid_targets_min": 1158
},
{
"epoch": 3.792766373411535,
"grad_norm": 0.6476901318697162,
"learning_rate": 2.0584943139775237e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1948857605457306,
"step": 3880,
"valid_targets_mean": 2858.7,
"valid_targets_min": 882
},
{
"epoch": 3.7976539589442817,
"grad_norm": 0.7397815710205294,
"learning_rate": 2.053621009213276e-05,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21412993967533112,
"step": 3885,
"valid_targets_mean": 2184.9,
"valid_targets_min": 997
},
{
"epoch": 3.8025415444770285,
"grad_norm": 0.7146555857159458,
"learning_rate": 2.0487473858360515e-05,
"loss": 0.1965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18842893838882446,
"step": 3890,
"valid_targets_mean": 2270.2,
"valid_targets_min": 713
},
{
"epoch": 3.8074291300097753,
"grad_norm": 0.65940562297892,
"learning_rate": 2.0438734728046432e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18981792032718658,
"step": 3895,
"valid_targets_mean": 2287.4,
"valid_targets_min": 1016
},
{
"epoch": 3.812316715542522,
"grad_norm": 0.8426072348378402,
"learning_rate": 2.0389992990795632e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22454825043678284,
"step": 3900,
"valid_targets_mean": 1866.6,
"valid_targets_min": 537
},
{
"epoch": 3.817204301075269,
"grad_norm": 0.7342198247089646,
"learning_rate": 2.0341248936228748e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2228454351425171,
"step": 3905,
"valid_targets_mean": 2335.3,
"valid_targets_min": 1021
},
{
"epoch": 3.822091886608016,
"grad_norm": 0.6636543015733303,
"learning_rate": 2.0292502853980164e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20288674533367157,
"step": 3910,
"valid_targets_mean": 2667.2,
"valid_targets_min": 791
},
{
"epoch": 3.8269794721407626,
"grad_norm": 0.7610090323169763,
"learning_rate": 2.0243755033696313e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20183882117271423,
"step": 3915,
"valid_targets_mean": 2155.2,
"valid_targets_min": 632
},
{
"epoch": 3.8318670576735094,
"grad_norm": 0.6831492165378048,
"learning_rate": 2.019500576503397e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1926528513431549,
"step": 3920,
"valid_targets_mean": 2656.8,
"valid_targets_min": 1210
},
{
"epoch": 3.8367546432062563,
"grad_norm": 0.7402425571751615,
"learning_rate": 2.0146255337658494e-05,
"loss": 0.1996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21684202551841736,
"step": 3925,
"valid_targets_mean": 2248.5,
"valid_targets_min": 420
},
{
"epoch": 3.841642228739003,
"grad_norm": 0.6921612269978583,
"learning_rate": 2.009750404124216e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20540589094161987,
"step": 3930,
"valid_targets_mean": 2690.6,
"valid_targets_min": 697
},
{
"epoch": 3.84652981427175,
"grad_norm": 0.7529950655294566,
"learning_rate": 2.0048752165462373e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21762652695178986,
"step": 3935,
"valid_targets_mean": 2733.9,
"valid_targets_min": 844
},
{
"epoch": 3.8514173998044967,
"grad_norm": 0.6580479552711862,
"learning_rate": 2e-05,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1937936544418335,
"step": 3940,
"valid_targets_mean": 2622.9,
"valid_targets_min": 632
},
{
"epoch": 3.8563049853372435,
"grad_norm": 0.8321134334974649,
"learning_rate": 1.9951247834537634e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21654708683490753,
"step": 3945,
"valid_targets_mean": 2118.2,
"valid_targets_min": 594
},
{
"epoch": 3.8611925708699903,
"grad_norm": 0.8110075847407984,
"learning_rate": 1.9902495958757844e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21147048473358154,
"step": 3950,
"valid_targets_mean": 2464.2,
"valid_targets_min": 775
},
{
"epoch": 3.866080156402737,
"grad_norm": 0.8481527474330096,
"learning_rate": 1.985374466234151e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1752730906009674,
"step": 3955,
"valid_targets_mean": 1691.5,
"valid_targets_min": 680
},
{
"epoch": 3.870967741935484,
"grad_norm": 0.7391679144111151,
"learning_rate": 1.9804994234966036e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2055065929889679,
"step": 3960,
"valid_targets_mean": 2255.8,
"valid_targets_min": 1006
},
{
"epoch": 3.875855327468231,
"grad_norm": 0.6879643282262666,
"learning_rate": 1.9756244966303693e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21640875935554504,
"step": 3965,
"valid_targets_mean": 2545.9,
"valid_targets_min": 750
},
{
"epoch": 3.8807429130009776,
"grad_norm": 0.682330103660924,
"learning_rate": 1.9707497146019846e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17964300513267517,
"step": 3970,
"valid_targets_mean": 2946.8,
"valid_targets_min": 750
},
{
"epoch": 3.8856304985337244,
"grad_norm": 0.6624662717730248,
"learning_rate": 1.9658751063771255e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20151904225349426,
"step": 3975,
"valid_targets_mean": 3265.1,
"valid_targets_min": 711
},
{
"epoch": 3.8905180840664713,
"grad_norm": 0.7423253354159347,
"learning_rate": 1.961000700920437e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19609767198562622,
"step": 3980,
"valid_targets_mean": 2088.9,
"valid_targets_min": 780
},
{
"epoch": 3.895405669599218,
"grad_norm": 0.9813652565552392,
"learning_rate": 1.956126527195358e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2142195701599121,
"step": 3985,
"valid_targets_mean": 2652.4,
"valid_targets_min": 759
},
{
"epoch": 3.900293255131965,
"grad_norm": 0.5712086066191886,
"learning_rate": 1.9512526141639492e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16019731760025024,
"step": 3990,
"valid_targets_mean": 3155.6,
"valid_targets_min": 770
},
{
"epoch": 3.9051808406647117,
"grad_norm": 0.7587001616327813,
"learning_rate": 1.9463789907867248e-05,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25113722681999207,
"step": 3995,
"valid_targets_mean": 2617.2,
"valid_targets_min": 869
},
{
"epoch": 3.9100684261974585,
"grad_norm": 0.7046294004069471,
"learning_rate": 1.941505686022476e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18923306465148926,
"step": 4000,
"valid_targets_mean": 2173.3,
"valid_targets_min": 929
},
{
"epoch": 3.9149560117302054,
"grad_norm": 0.6934724921753709,
"learning_rate": 1.936632728828103e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20533259212970734,
"step": 4005,
"valid_targets_mean": 2358.2,
"valid_targets_min": 898
},
{
"epoch": 3.919843597262952,
"grad_norm": 0.8196595601053237,
"learning_rate": 1.9317601481584383e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2104458212852478,
"step": 4010,
"valid_targets_mean": 1972.3,
"valid_targets_min": 725
},
{
"epoch": 3.924731182795699,
"grad_norm": 0.7849322123412164,
"learning_rate": 1.926887972966077e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.269350528717041,
"step": 4015,
"valid_targets_mean": 2177.9,
"valid_targets_min": 819
},
{
"epoch": 3.929618768328446,
"grad_norm": 0.7525483327532918,
"learning_rate": 1.922016232201208e-05,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21186742186546326,
"step": 4020,
"valid_targets_mean": 2130.6,
"valid_targets_min": 548
},
{
"epoch": 3.9345063538611926,
"grad_norm": 0.6367950186766983,
"learning_rate": 1.917144954811435e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19727790355682373,
"step": 4025,
"valid_targets_mean": 2766.4,
"valid_targets_min": 817
},
{
"epoch": 3.9393939393939394,
"grad_norm": 0.7362334474471227,
"learning_rate": 1.9122741697416122e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.206711083650589,
"step": 4030,
"valid_targets_mean": 2190.1,
"valid_targets_min": 771
},
{
"epoch": 3.9442815249266863,
"grad_norm": 0.6272342072403345,
"learning_rate": 1.9074039059336654e-05,
"loss": 0.2031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19984391331672668,
"step": 4035,
"valid_targets_mean": 2838.1,
"valid_targets_min": 614
},
{
"epoch": 3.949169110459433,
"grad_norm": 0.6758572832963811,
"learning_rate": 1.902534192326423e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21952173113822937,
"step": 4040,
"valid_targets_mean": 2742.6,
"valid_targets_min": 1552
},
{
"epoch": 3.95405669599218,
"grad_norm": 0.6455921997950347,
"learning_rate": 1.8976650578554475e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17914989590644836,
"step": 4045,
"valid_targets_mean": 2462.2,
"valid_targets_min": 1012
},
{
"epoch": 3.9589442815249267,
"grad_norm": 0.7064643550905159,
"learning_rate": 1.892796531452857e-05,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22437229752540588,
"step": 4050,
"valid_targets_mean": 2798.8,
"valid_targets_min": 572
},
{
"epoch": 3.9638318670576735,
"grad_norm": 0.7269435964183898,
"learning_rate": 1.8879286420471562e-05,
"loss": 0.2105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22988593578338623,
"step": 4055,
"valid_targets_mean": 2328.2,
"valid_targets_min": 584
},
{
"epoch": 3.9687194525904204,
"grad_norm": 0.6243634215768921,
"learning_rate": 1.8830614185630686e-05,
"loss": 0.2017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19760319590568542,
"step": 4060,
"valid_targets_mean": 3104.0,
"valid_targets_min": 665
},
{
"epoch": 3.973607038123167,
"grad_norm": 0.7229402835170321,
"learning_rate": 1.8781948899213563e-05,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19763663411140442,
"step": 4065,
"valid_targets_mean": 2293.1,
"valid_targets_min": 1080
},
{
"epoch": 3.978494623655914,
"grad_norm": 0.7692945667783568,
"learning_rate": 1.8733290850386556e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2350245714187622,
"step": 4070,
"valid_targets_mean": 2153.9,
"valid_targets_min": 522
},
{
"epoch": 3.983382209188661,
"grad_norm": 0.7485634972600307,
"learning_rate": 1.8684640328273013e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2132551074028015,
"step": 4075,
"valid_targets_mean": 2146.8,
"valid_targets_min": 533
},
{
"epoch": 3.9882697947214076,
"grad_norm": 0.7868285556946475,
"learning_rate": 1.8635997621951554e-05,
"loss": 0.2055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21789923310279846,
"step": 4080,
"valid_targets_mean": 1982.0,
"valid_targets_min": 1146
},
{
"epoch": 3.9931573802541545,
"grad_norm": 0.6520687750578001,
"learning_rate": 1.858736302045438e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2020658552646637,
"step": 4085,
"valid_targets_mean": 2626.5,
"valid_targets_min": 1214
},
{
"epoch": 3.9980449657869013,
"grad_norm": 0.6705009639669899,
"learning_rate": 1.8538736812765495e-05,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2510734796524048,
"step": 4090,
"valid_targets_mean": 2900.7,
"valid_targets_min": 823
},
{
"epoch": 4.002932551319648,
"grad_norm": 0.6983984686970028,
"learning_rate": 1.8490119287819058e-05,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1645195633172989,
"step": 4095,
"valid_targets_mean": 2202.6,
"valid_targets_min": 706
},
{
"epoch": 4.007820136852395,
"grad_norm": 0.7590415869647605,
"learning_rate": 1.844151073449763e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1695270985364914,
"step": 4100,
"valid_targets_mean": 2045.4,
"valid_targets_min": 484
},
{
"epoch": 4.012707722385142,
"grad_norm": 0.8500063167328339,
"learning_rate": 1.8392911441630458e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1960211545228958,
"step": 4105,
"valid_targets_mean": 1932.2,
"valid_targets_min": 886
},
{
"epoch": 4.0175953079178885,
"grad_norm": 0.6876315958843118,
"learning_rate": 1.8344321697991775e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17042392492294312,
"step": 4110,
"valid_targets_mean": 2488.9,
"valid_targets_min": 984
},
{
"epoch": 4.022482893450635,
"grad_norm": 0.6267560608434691,
"learning_rate": 1.8295741792299054e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1570637822151184,
"step": 4115,
"valid_targets_mean": 2911.5,
"valid_targets_min": 998
},
{
"epoch": 4.027370478983382,
"grad_norm": 0.6860515522522642,
"learning_rate": 1.8247172013211316e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17035432159900665,
"step": 4120,
"valid_targets_mean": 2804.3,
"valid_targets_min": 1062
},
{
"epoch": 4.032258064516129,
"grad_norm": 0.658990742688263,
"learning_rate": 1.819861264932743e-05,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1729648858308792,
"step": 4125,
"valid_targets_mean": 3242.4,
"valid_targets_min": 952
},
{
"epoch": 4.037145650048876,
"grad_norm": 0.8278627891112406,
"learning_rate": 1.815006398918435e-05,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17281252145767212,
"step": 4130,
"valid_targets_mean": 1954.6,
"valid_targets_min": 746
},
{
"epoch": 4.042033235581623,
"grad_norm": 0.7070945916212567,
"learning_rate": 1.8101526321255464e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18609067797660828,
"step": 4135,
"valid_targets_mean": 2809.1,
"valid_targets_min": 725
},
{
"epoch": 4.0469208211143695,
"grad_norm": 0.732269604211766,
"learning_rate": 1.805299993394881e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1601986289024353,
"step": 4140,
"valid_targets_mean": 2153.6,
"valid_targets_min": 895
},
{
"epoch": 4.051808406647116,
"grad_norm": 0.7644694368274649,
"learning_rate": 1.8004485115605407e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17084315419197083,
"step": 4145,
"valid_targets_mean": 2271.1,
"valid_targets_min": 900
},
{
"epoch": 4.056695992179863,
"grad_norm": 0.680277205771116,
"learning_rate": 1.7955982154497545e-05,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18231913447380066,
"step": 4150,
"valid_targets_mean": 2801.8,
"valid_targets_min": 1152
},
{
"epoch": 4.06158357771261,
"grad_norm": 0.7619020216747033,
"learning_rate": 1.7907491338827053e-05,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17396214604377747,
"step": 4155,
"valid_targets_mean": 2283.8,
"valid_targets_min": 649
},
{
"epoch": 4.066471163245357,
"grad_norm": 0.7954884604214785,
"learning_rate": 1.7859012956723577e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17803660035133362,
"step": 4160,
"valid_targets_mean": 2164.9,
"valid_targets_min": 784
},
{
"epoch": 4.0713587487781036,
"grad_norm": 0.70348085226897,
"learning_rate": 1.781054729624291e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16010019183158875,
"step": 4165,
"valid_targets_mean": 2553.6,
"valid_targets_min": 843
},
{
"epoch": 4.07624633431085,
"grad_norm": 1.026152425313603,
"learning_rate": 1.7762094645365225e-05,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18153509497642517,
"step": 4170,
"valid_targets_mean": 2432.5,
"valid_targets_min": 615
},
{
"epoch": 4.081133919843597,
"grad_norm": 0.7254831762036433,
"learning_rate": 1.7713655291993426e-05,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20568543672561646,
"step": 4175,
"valid_targets_mean": 2840.9,
"valid_targets_min": 881
},
{
"epoch": 4.086021505376344,
"grad_norm": 0.697671859067687,
"learning_rate": 1.766522952395138e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19269169867038727,
"step": 4180,
"valid_targets_mean": 3086.3,
"valid_targets_min": 746
},
{
"epoch": 4.090909090909091,
"grad_norm": 0.7479636389963256,
"learning_rate": 1.7616817628982225e-05,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16542398929595947,
"step": 4185,
"valid_targets_mean": 2449.9,
"valid_targets_min": 1025
},
{
"epoch": 4.095796676441838,
"grad_norm": 0.8012001808352684,
"learning_rate": 1.7568419894746694e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15177610516548157,
"step": 4190,
"valid_targets_mean": 1801.7,
"valid_targets_min": 567
},
{
"epoch": 4.1006842619745845,
"grad_norm": 0.6599199969261322,
"learning_rate": 1.7520036608821343e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16316524147987366,
"step": 4195,
"valid_targets_mean": 2802.2,
"valid_targets_min": 607
},
{
"epoch": 4.105571847507331,
"grad_norm": 0.660475255360126,
"learning_rate": 1.7471668058696917e-05,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16640618443489075,
"step": 4200,
"valid_targets_mean": 2976.4,
"valid_targets_min": 821
},
{
"epoch": 4.110459433040078,
"grad_norm": 0.7767208027973069,
"learning_rate": 1.7423314531776566e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16882777214050293,
"step": 4205,
"valid_targets_mean": 2222.6,
"valid_targets_min": 627
},
{
"epoch": 4.115347018572825,
"grad_norm": 0.6976329404563815,
"learning_rate": 1.737497631537418e-05,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17232577502727509,
"step": 4210,
"valid_targets_mean": 2611.0,
"valid_targets_min": 869
},
{
"epoch": 4.120234604105572,
"grad_norm": 0.8087989717723046,
"learning_rate": 1.7326653696712706e-05,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1771789789199829,
"step": 4215,
"valid_targets_mean": 2261.4,
"valid_targets_min": 551
},
{
"epoch": 4.125122189638319,
"grad_norm": 0.7223726297736563,
"learning_rate": 1.7278346962922365e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17196297645568848,
"step": 4220,
"valid_targets_mean": 2553.8,
"valid_targets_min": 791
},
{
"epoch": 4.130009775171065,
"grad_norm": 0.8038120785795847,
"learning_rate": 1.7230056401039014e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1827443540096283,
"step": 4225,
"valid_targets_mean": 1950.0,
"valid_targets_min": 744
},
{
"epoch": 4.134897360703812,
"grad_norm": 0.8507666081146841,
"learning_rate": 1.7181782298002426e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1930236965417862,
"step": 4230,
"valid_targets_mean": 1955.8,
"valid_targets_min": 837
},
{
"epoch": 4.139784946236559,
"grad_norm": 0.72829350980729,
"learning_rate": 1.713352494065455e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1770409643650055,
"step": 4235,
"valid_targets_mean": 2629.4,
"valid_targets_min": 728
},
{
"epoch": 4.144672531769306,
"grad_norm": 0.8739112255295849,
"learning_rate": 1.708528461573787e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17912176251411438,
"step": 4240,
"valid_targets_mean": 1731.5,
"valid_targets_min": 829
},
{
"epoch": 4.149560117302053,
"grad_norm": 0.6736533471138151,
"learning_rate": 1.703706160989362e-05,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17516711354255676,
"step": 4245,
"valid_targets_mean": 3023.8,
"valid_targets_min": 726
},
{
"epoch": 4.1544477028347995,
"grad_norm": 0.7146049815510215,
"learning_rate": 1.6988856209660162e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18740811944007874,
"step": 4250,
"valid_targets_mean": 3117.8,
"valid_targets_min": 895
},
{
"epoch": 4.159335288367546,
"grad_norm": 0.8287505524072367,
"learning_rate": 1.694066870147123e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17309562861919403,
"step": 4255,
"valid_targets_mean": 2429.8,
"valid_targets_min": 613
},
{
"epoch": 4.164222873900293,
"grad_norm": 0.8384682014231488,
"learning_rate": 1.689249937165425e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17695944011211395,
"step": 4260,
"valid_targets_mean": 1893.6,
"valid_targets_min": 622
},
{
"epoch": 4.16911045943304,
"grad_norm": 0.8023347194519758,
"learning_rate": 1.6844348506428624e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1862003207206726,
"step": 4265,
"valid_targets_mean": 2379.9,
"valid_targets_min": 996
},
{
"epoch": 4.173998044965787,
"grad_norm": 0.7189754762701044,
"learning_rate": 1.679621639190405e-05,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18278726935386658,
"step": 4270,
"valid_targets_mean": 2820.7,
"valid_targets_min": 981
},
{
"epoch": 4.178885630498534,
"grad_norm": 0.7689815704124234,
"learning_rate": 1.6748103314078795e-05,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15576958656311035,
"step": 4275,
"valid_targets_mean": 2550.9,
"valid_targets_min": 830
},
{
"epoch": 4.18377321603128,
"grad_norm": 0.7790069715413338,
"learning_rate": 1.6700009558838034e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1859605610370636,
"step": 4280,
"valid_targets_mean": 2325.7,
"valid_targets_min": 765
},
{
"epoch": 4.188660801564027,
"grad_norm": 0.7059772286515155,
"learning_rate": 1.6651935411952117e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18116068840026855,
"step": 4285,
"valid_targets_mean": 2637.1,
"valid_targets_min": 981
},
{
"epoch": 4.193548387096774,
"grad_norm": 0.8478026456180225,
"learning_rate": 1.6603881159074864e-05,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1635878086090088,
"step": 4290,
"valid_targets_mean": 2021.2,
"valid_targets_min": 728
},
{
"epoch": 4.198435972629521,
"grad_norm": 0.7892671310342947,
"learning_rate": 1.655584708574192e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16756808757781982,
"step": 4295,
"valid_targets_mean": 2019.6,
"valid_targets_min": 694
},
{
"epoch": 4.203323558162268,
"grad_norm": 0.7866619457000387,
"learning_rate": 1.6507833477368994e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1662808358669281,
"step": 4300,
"valid_targets_mean": 2019.4,
"valid_targets_min": 824
},
{
"epoch": 4.2082111436950145,
"grad_norm": 0.8459519999111245,
"learning_rate": 1.6459840619250217e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1930123269557953,
"step": 4305,
"valid_targets_mean": 2161.1,
"valid_targets_min": 817
},
{
"epoch": 4.213098729227761,
"grad_norm": 0.8021367267841367,
"learning_rate": 1.6411868796556408e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18006908893585205,
"step": 4310,
"valid_targets_mean": 2118.6,
"valid_targets_min": 572
},
{
"epoch": 4.217986314760508,
"grad_norm": 0.8090359446901784,
"learning_rate": 1.6363918294333395e-05,
"loss": 0.162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15488529205322266,
"step": 4315,
"valid_targets_mean": 1977.8,
"valid_targets_min": 727
},
{
"epoch": 4.222873900293255,
"grad_norm": 0.6855591904703289,
"learning_rate": 1.6315989397500332e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16280516982078552,
"step": 4320,
"valid_targets_mean": 3256.6,
"valid_targets_min": 958
},
{
"epoch": 4.227761485826002,
"grad_norm": 0.809105744787128,
"learning_rate": 1.6268082390847983e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15723910927772522,
"step": 4325,
"valid_targets_mean": 1953.2,
"valid_targets_min": 746
},
{
"epoch": 4.232649071358749,
"grad_norm": 0.7131155432880343,
"learning_rate": 1.6220197559037045e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18179753422737122,
"step": 4330,
"valid_targets_mean": 2626.1,
"valid_targets_min": 1086
},
{
"epoch": 4.237536656891495,
"grad_norm": 0.7455797655769655,
"learning_rate": 1.617233518659647e-05,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16530537605285645,
"step": 4335,
"valid_targets_mean": 2392.8,
"valid_targets_min": 770
},
{
"epoch": 4.242424242424242,
"grad_norm": 0.7439354451578698,
"learning_rate": 1.6124495557921725e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.173561230301857,
"step": 4340,
"valid_targets_mean": 2214.4,
"valid_targets_min": 671
},
{
"epoch": 4.247311827956989,
"grad_norm": 0.7373073806467637,
"learning_rate": 1.6076678957273162e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17753678560256958,
"step": 4345,
"valid_targets_mean": 2657.6,
"valid_targets_min": 734
},
{
"epoch": 4.252199413489736,
"grad_norm": 0.7000837897806548,
"learning_rate": 1.602888566877429e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17242294549942017,
"step": 4350,
"valid_targets_mean": 2792.0,
"valid_targets_min": 770
},
{
"epoch": 4.257086999022483,
"grad_norm": 0.7271682426991912,
"learning_rate": 1.59811159764101e-05,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16193613409996033,
"step": 4355,
"valid_targets_mean": 2416.5,
"valid_targets_min": 907
},
{
"epoch": 4.2619745845552295,
"grad_norm": 0.7944206346753406,
"learning_rate": 1.593337016402539e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17991730570793152,
"step": 4360,
"valid_targets_mean": 2064.8,
"valid_targets_min": 655
},
{
"epoch": 4.266862170087976,
"grad_norm": 0.7010001037382477,
"learning_rate": 1.5885648515323028e-05,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16409370303153992,
"step": 4365,
"valid_targets_mean": 2635.2,
"valid_targets_min": 930
},
{
"epoch": 4.271749755620723,
"grad_norm": 0.6568280133407176,
"learning_rate": 1.5837951313862352e-05,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18202292919158936,
"step": 4370,
"valid_targets_mean": 3231.6,
"valid_targets_min": 671
},
{
"epoch": 4.27663734115347,
"grad_norm": 0.8085208993831905,
"learning_rate": 1.5790278843057395e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18638502061367035,
"step": 4375,
"valid_targets_mean": 2588.2,
"valid_targets_min": 665
},
{
"epoch": 4.281524926686217,
"grad_norm": 0.8087448136164485,
"learning_rate": 1.5742631386175255e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17984755337238312,
"step": 4380,
"valid_targets_mean": 2140.7,
"valid_targets_min": 701
},
{
"epoch": 4.286412512218964,
"grad_norm": 0.7073051473557163,
"learning_rate": 1.569500922633442e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16911262273788452,
"step": 4385,
"valid_targets_mean": 2626.2,
"valid_targets_min": 694
},
{
"epoch": 4.29130009775171,
"grad_norm": 0.7422208850214889,
"learning_rate": 1.5647412646503025e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17553281784057617,
"step": 4390,
"valid_targets_mean": 2183.2,
"valid_targets_min": 1272
},
{
"epoch": 4.296187683284457,
"grad_norm": 0.7592007757916336,
"learning_rate": 1.5599841929497234e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17773813009262085,
"step": 4395,
"valid_targets_mean": 2256.4,
"valid_targets_min": 771
},
{
"epoch": 4.301075268817204,
"grad_norm": 0.7553316641615674,
"learning_rate": 1.555229735797954e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18115384876728058,
"step": 4400,
"valid_targets_mean": 2220.1,
"valid_targets_min": 733
},
{
"epoch": 4.305962854349951,
"grad_norm": 0.7811092431468514,
"learning_rate": 1.5504779214457064e-05,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17034941911697388,
"step": 4405,
"valid_targets_mean": 1985.4,
"valid_targets_min": 872
},
{
"epoch": 4.310850439882698,
"grad_norm": 0.6751967572463863,
"learning_rate": 1.5457287781279914e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1524028480052948,
"step": 4410,
"valid_targets_mean": 2459.4,
"valid_targets_min": 768
},
{
"epoch": 4.3157380254154445,
"grad_norm": 0.7006365562513612,
"learning_rate": 1.5409823340639472e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1530303657054901,
"step": 4415,
"valid_targets_mean": 2240.3,
"valid_targets_min": 809
},
{
"epoch": 4.320625610948191,
"grad_norm": 0.8127996699553531,
"learning_rate": 1.5362386174566727e-05,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1497165858745575,
"step": 4420,
"valid_targets_mean": 1762.8,
"valid_targets_min": 672
},
{
"epoch": 4.325513196480938,
"grad_norm": 0.7509544790056238,
"learning_rate": 1.5314976564930616e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.215011328458786,
"step": 4425,
"valid_targets_mean": 2781.2,
"valid_targets_min": 870
},
{
"epoch": 4.330400782013685,
"grad_norm": 0.7344537959086179,
"learning_rate": 1.526759479343634e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1870063692331314,
"step": 4430,
"valid_targets_mean": 2725.8,
"valid_targets_min": 1240
},
{
"epoch": 4.335288367546432,
"grad_norm": 0.672200316438301,
"learning_rate": 1.5220241141623666e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1690032184123993,
"step": 4435,
"valid_targets_mean": 3031.5,
"valid_targets_min": 1266
},
{
"epoch": 4.340175953079179,
"grad_norm": 0.6666959910156269,
"learning_rate": 1.517291589086531e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15352541208267212,
"step": 4440,
"valid_targets_mean": 2541.2,
"valid_targets_min": 749
},
{
"epoch": 4.345063538611925,
"grad_norm": 0.7100554914799727,
"learning_rate": 1.512561932236519e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16762804985046387,
"step": 4445,
"valid_targets_mean": 2549.6,
"valid_targets_min": 978
},
{
"epoch": 4.349951124144672,
"grad_norm": 0.7579351582413887,
"learning_rate": 1.507835171715683e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19213947653770447,
"step": 4450,
"valid_targets_mean": 2302.4,
"valid_targets_min": 893
},
{
"epoch": 4.354838709677419,
"grad_norm": 0.7076551024584983,
"learning_rate": 1.503111335610164e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16405513882637024,
"step": 4455,
"valid_targets_mean": 2656.4,
"valid_targets_min": 662
},
{
"epoch": 4.359726295210166,
"grad_norm": 0.6577102500804493,
"learning_rate": 1.4983904519887257e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18623942136764526,
"step": 4460,
"valid_targets_mean": 3397.5,
"valid_targets_min": 869
},
{
"epoch": 4.364613880742913,
"grad_norm": 0.8364738050383415,
"learning_rate": 1.4936725489025907e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18252325057983398,
"step": 4465,
"valid_targets_mean": 2765.1,
"valid_targets_min": 740
},
{
"epoch": 4.3695014662756595,
"grad_norm": 0.7332207981929358,
"learning_rate": 1.4889576543852679e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18655236065387726,
"step": 4470,
"valid_targets_mean": 2426.7,
"valid_targets_min": 759
},
{
"epoch": 4.374389051808406,
"grad_norm": 0.7291042324534501,
"learning_rate": 1.4842457964523932e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1768685281276703,
"step": 4475,
"valid_targets_mean": 2585.4,
"valid_targets_min": 776
},
{
"epoch": 4.379276637341153,
"grad_norm": 0.7241032428052671,
"learning_rate": 1.4795370031015562e-05,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15364965796470642,
"step": 4480,
"valid_targets_mean": 2301.1,
"valid_targets_min": 968
},
{
"epoch": 4.3841642228739,
"grad_norm": 0.8029472975208416,
"learning_rate": 1.4748313023121385e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17943759262561798,
"step": 4485,
"valid_targets_mean": 2096.1,
"valid_targets_min": 698
},
{
"epoch": 4.389051808406647,
"grad_norm": 0.7738811474250595,
"learning_rate": 1.4701287220451463e-05,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18864920735359192,
"step": 4490,
"valid_targets_mean": 2364.0,
"valid_targets_min": 761
},
{
"epoch": 4.393939393939394,
"grad_norm": 0.8073103577600892,
"learning_rate": 1.4654292902430424e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1911054402589798,
"step": 4495,
"valid_targets_mean": 2996.8,
"valid_targets_min": 912
},
{
"epoch": 4.39882697947214,
"grad_norm": 0.7781332848101631,
"learning_rate": 1.4607330348295821e-05,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20065414905548096,
"step": 4500,
"valid_targets_mean": 2334.9,
"valid_targets_min": 620
},
{
"epoch": 4.403714565004887,
"grad_norm": 0.8238449326675337,
"learning_rate": 1.4560399837096478e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1719534993171692,
"step": 4505,
"valid_targets_mean": 1942.7,
"valid_targets_min": 1107
},
{
"epoch": 4.408602150537634,
"grad_norm": 0.7909535037694309,
"learning_rate": 1.4513501647690804e-05,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15581440925598145,
"step": 4510,
"valid_targets_mean": 2048.7,
"valid_targets_min": 680
},
{
"epoch": 4.413489736070381,
"grad_norm": 0.667844663877056,
"learning_rate": 1.4466636058745179e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16047389805316925,
"step": 4515,
"valid_targets_mean": 2790.1,
"valid_targets_min": 697
},
{
"epoch": 4.418377321603128,
"grad_norm": 0.7179178500193523,
"learning_rate": 1.4419803348732245e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16572578251361847,
"step": 4520,
"valid_targets_mean": 2572.5,
"valid_targets_min": 923
},
{
"epoch": 4.4232649071358745,
"grad_norm": 0.7482497307829565,
"learning_rate": 1.4373003795929287e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17924658954143524,
"step": 4525,
"valid_targets_mean": 2537.1,
"valid_targets_min": 1124
},
{
"epoch": 4.428152492668621,
"grad_norm": 0.7983711495940576,
"learning_rate": 1.4326237678416588e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15910127758979797,
"step": 4530,
"valid_targets_mean": 2120.4,
"valid_targets_min": 865
},
{
"epoch": 4.433040078201368,
"grad_norm": 0.7219070798034924,
"learning_rate": 1.4279505274075743e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17049354314804077,
"step": 4535,
"valid_targets_mean": 2468.0,
"valid_targets_min": 1040
},
{
"epoch": 4.437927663734115,
"grad_norm": 0.6820006015545326,
"learning_rate": 1.423280686058804e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17498445510864258,
"step": 4540,
"valid_targets_mean": 2878.1,
"valid_targets_min": 814
},
{
"epoch": 4.442815249266862,
"grad_norm": 0.7956975533298152,
"learning_rate": 1.4186142715432775e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15380510687828064,
"step": 4545,
"valid_targets_mean": 1974.9,
"valid_targets_min": 788
},
{
"epoch": 4.447702834799609,
"grad_norm": 0.6688865610533883,
"learning_rate": 1.4139513115885635e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18294396996498108,
"step": 4550,
"valid_targets_mean": 3151.7,
"valid_targets_min": 1199
},
{
"epoch": 4.452590420332355,
"grad_norm": 0.7510655980124383,
"learning_rate": 1.4092918339017046e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17913363873958588,
"step": 4555,
"valid_targets_mean": 2332.2,
"valid_targets_min": 875
},
{
"epoch": 4.457478005865102,
"grad_norm": 0.7147653866732739,
"learning_rate": 1.4046358661690515e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15671703219413757,
"step": 4560,
"valid_targets_mean": 2355.0,
"valid_targets_min": 648
},
{
"epoch": 4.462365591397849,
"grad_norm": 0.8146269315094486,
"learning_rate": 1.3999834360560969e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18449649214744568,
"step": 4565,
"valid_targets_mean": 2228.4,
"valid_targets_min": 798
},
{
"epoch": 4.467253176930596,
"grad_norm": 0.8549012646003764,
"learning_rate": 1.3953345712073172e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20259252190589905,
"step": 4570,
"valid_targets_mean": 1910.8,
"valid_targets_min": 698
},
{
"epoch": 4.472140762463344,
"grad_norm": 0.6930221111338045,
"learning_rate": 1.3906892992460004e-05,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19013884663581848,
"step": 4575,
"valid_targets_mean": 2861.4,
"valid_targets_min": 1011
},
{
"epoch": 4.4770283479960895,
"grad_norm": 0.8136412327729154,
"learning_rate": 1.3860476477740883e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1534624695777893,
"step": 4580,
"valid_targets_mean": 1744.6,
"valid_targets_min": 650
},
{
"epoch": 4.481915933528837,
"grad_norm": 0.7069363998150793,
"learning_rate": 1.3814096443720091e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16891230642795563,
"step": 4585,
"valid_targets_mean": 2515.7,
"valid_targets_min": 696
},
{
"epoch": 4.486803519061583,
"grad_norm": 0.801344597413106,
"learning_rate": 1.3767753165985126e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14025087654590607,
"step": 4590,
"valid_targets_mean": 1840.0,
"valid_targets_min": 818
},
{
"epoch": 4.491691104594331,
"grad_norm": 0.7759235567696053,
"learning_rate": 1.3721446919905121e-05,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16802477836608887,
"step": 4595,
"valid_targets_mean": 2318.0,
"valid_targets_min": 698
},
{
"epoch": 4.496578690127077,
"grad_norm": 0.7746563734745292,
"learning_rate": 1.3675177980629135e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17537719011306763,
"step": 4600,
"valid_targets_mean": 2127.3,
"valid_targets_min": 625
},
{
"epoch": 4.5014662756598245,
"grad_norm": 0.692029862169816,
"learning_rate": 1.3628946623084563e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1666170358657837,
"step": 4605,
"valid_targets_mean": 2804.1,
"valid_targets_min": 1352
},
{
"epoch": 4.50635386119257,
"grad_norm": 0.7747220358157921,
"learning_rate": 1.3582753121975502e-05,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16754350066184998,
"step": 4610,
"valid_targets_mean": 2106.8,
"valid_targets_min": 1041
},
{
"epoch": 4.511241446725318,
"grad_norm": 0.794400474753371,
"learning_rate": 1.3536597751781082e-05,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15418118238449097,
"step": 4615,
"valid_targets_mean": 2122.1,
"valid_targets_min": 623
},
{
"epoch": 4.516129032258064,
"grad_norm": 0.8630490069683876,
"learning_rate": 1.3490480786753901e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1692330241203308,
"step": 4620,
"valid_targets_mean": 1878.2,
"valid_targets_min": 864
},
{
"epoch": 4.521016617790812,
"grad_norm": 0.6949929703480787,
"learning_rate": 1.3444402500918314e-05,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19203145802021027,
"step": 4625,
"valid_targets_mean": 2929.6,
"valid_targets_min": 1109
},
{
"epoch": 4.525904203323558,
"grad_norm": 0.7212230561742061,
"learning_rate": 1.3398363168068871e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1773679554462433,
"step": 4630,
"valid_targets_mean": 3018.6,
"valid_targets_min": 852
},
{
"epoch": 4.530791788856305,
"grad_norm": 0.7491901926461985,
"learning_rate": 1.3352363061768668e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19477087259292603,
"step": 4635,
"valid_targets_mean": 2341.3,
"valid_targets_min": 548
},
{
"epoch": 4.535679374389051,
"grad_norm": 0.7218327291631365,
"learning_rate": 1.3306402455347693e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15920904278755188,
"step": 4640,
"valid_targets_mean": 2138.7,
"valid_targets_min": 749
},
{
"epoch": 4.540566959921799,
"grad_norm": 0.7886843070822219,
"learning_rate": 1.3260481621901269e-05,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20281338691711426,
"step": 4645,
"valid_targets_mean": 2345.5,
"valid_targets_min": 700
},
{
"epoch": 4.545454545454545,
"grad_norm": 0.7254460885818595,
"learning_rate": 1.3214600834288351e-05,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18300187587738037,
"step": 4650,
"valid_targets_mean": 2600.0,
"valid_targets_min": 818
},
{
"epoch": 4.550342130987293,
"grad_norm": 0.7303419088042947,
"learning_rate": 1.3168760365129958e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1488429307937622,
"step": 4655,
"valid_targets_mean": 2088.1,
"valid_targets_min": 957
},
{
"epoch": 4.555229716520039,
"grad_norm": 0.8187576278617511,
"learning_rate": 1.3122960486807551e-05,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1666831523180008,
"step": 4660,
"valid_targets_mean": 2028.4,
"valid_targets_min": 734
},
{
"epoch": 4.560117302052786,
"grad_norm": 0.7689970727875466,
"learning_rate": 1.3077201471461396e-05,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19278375804424286,
"step": 4665,
"valid_targets_mean": 2721.1,
"valid_targets_min": 1050
},
{
"epoch": 4.565004887585533,
"grad_norm": 0.7136026943772088,
"learning_rate": 1.3031483590988932e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18920962512493134,
"step": 4670,
"valid_targets_mean": 3069.2,
"valid_targets_min": 703
},
{
"epoch": 4.56989247311828,
"grad_norm": 0.6768328311866438,
"learning_rate": 1.2985807117043212e-05,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.170124351978302,
"step": 4675,
"valid_targets_mean": 3036.4,
"valid_targets_min": 750
},
{
"epoch": 4.574780058651027,
"grad_norm": 0.7065627099385119,
"learning_rate": 1.2940172321031228e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17484335601329803,
"step": 4680,
"valid_targets_mean": 2361.8,
"valid_targets_min": 985
},
{
"epoch": 4.579667644183774,
"grad_norm": 0.7870866877498359,
"learning_rate": 1.2894579474112336e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17841269075870514,
"step": 4685,
"valid_targets_mean": 2178.9,
"valid_targets_min": 673
},
{
"epoch": 4.58455522971652,
"grad_norm": 0.7992856974999708,
"learning_rate": 1.2849028847196642e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18455563485622406,
"step": 4690,
"valid_targets_mean": 2120.1,
"valid_targets_min": 522
},
{
"epoch": 4.589442815249267,
"grad_norm": 0.7236365680919709,
"learning_rate": 1.2803520710943345e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1834551990032196,
"step": 4695,
"valid_targets_mean": 2806.9,
"valid_targets_min": 683
},
{
"epoch": 4.594330400782014,
"grad_norm": 0.7328506697251148,
"learning_rate": 1.2758055335759214e-05,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16841992735862732,
"step": 4700,
"valid_targets_mean": 2405.8,
"valid_targets_min": 830
},
{
"epoch": 4.599217986314761,
"grad_norm": 0.7488482580131285,
"learning_rate": 1.27126329917969e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20795467495918274,
"step": 4705,
"valid_targets_mean": 2736.6,
"valid_targets_min": 740
},
{
"epoch": 4.604105571847508,
"grad_norm": 0.701924815848274,
"learning_rate": 1.2667253948953392e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16952826082706451,
"step": 4710,
"valid_targets_mean": 2894.4,
"valid_targets_min": 805
},
{
"epoch": 4.6089931573802545,
"grad_norm": 0.7638018479267547,
"learning_rate": 1.262191847686837e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17446717619895935,
"step": 4715,
"valid_targets_mean": 2210.6,
"valid_targets_min": 1220
},
{
"epoch": 4.613880742913001,
"grad_norm": 0.9146808729960212,
"learning_rate": 1.2576626844922602e-05,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19167935848236084,
"step": 4720,
"valid_targets_mean": 2399.1,
"valid_targets_min": 743
},
{
"epoch": 4.618768328445748,
"grad_norm": 0.7745900925140338,
"learning_rate": 1.2531379322236403e-05,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17140185832977295,
"step": 4725,
"valid_targets_mean": 2393.5,
"valid_targets_min": 850
},
{
"epoch": 4.623655913978495,
"grad_norm": 0.776866808386388,
"learning_rate": 1.2486176177667963e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1710333526134491,
"step": 4730,
"valid_targets_mean": 2295.1,
"valid_targets_min": 635
},
{
"epoch": 4.628543499511242,
"grad_norm": 0.9138199933637996,
"learning_rate": 1.2441017679811777e-05,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17593233287334442,
"step": 4735,
"valid_targets_mean": 1879.2,
"valid_targets_min": 661
},
{
"epoch": 4.633431085043989,
"grad_norm": 0.7080266048721636,
"learning_rate": 1.2395904096997082e-05,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17759348452091217,
"step": 4740,
"valid_targets_mean": 2714.9,
"valid_targets_min": 715
},
{
"epoch": 4.638318670576735,
"grad_norm": 0.7107351831118239,
"learning_rate": 1.2350835697286185e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1701585203409195,
"step": 4745,
"valid_targets_mean": 2465.2,
"valid_targets_min": 836
},
{
"epoch": 4.643206256109482,
"grad_norm": 0.7110148275686181,
"learning_rate": 1.2305812748472969e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16965368390083313,
"step": 4750,
"valid_targets_mean": 2887.4,
"valid_targets_min": 1056
},
{
"epoch": 4.648093841642229,
"grad_norm": 0.7808205504531988,
"learning_rate": 1.2260835518081216e-05,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1801660656929016,
"step": 4755,
"valid_targets_mean": 2264.4,
"valid_targets_min": 537
},
{
"epoch": 4.652981427174976,
"grad_norm": 0.6736174438322065,
"learning_rate": 1.2215904273363055e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16034579277038574,
"step": 4760,
"valid_targets_mean": 2747.2,
"valid_targets_min": 878
},
{
"epoch": 4.657869012707723,
"grad_norm": 0.8172833092442401,
"learning_rate": 1.2171019281297397e-05,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18934208154678345,
"step": 4765,
"valid_targets_mean": 2011.7,
"valid_targets_min": 689
},
{
"epoch": 4.6627565982404695,
"grad_norm": 0.7810540506761577,
"learning_rate": 1.2126180808588281e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19872036576271057,
"step": 4770,
"valid_targets_mean": 2411.7,
"valid_targets_min": 858
},
{
"epoch": 4.667644183773216,
"grad_norm": 0.7414123362578164,
"learning_rate": 1.2081389121663361e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19137006998062134,
"step": 4775,
"valid_targets_mean": 2429.5,
"valid_targets_min": 996
},
{
"epoch": 4.672531769305963,
"grad_norm": 0.7992138573951394,
"learning_rate": 1.2036644486672287e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18999941647052765,
"step": 4780,
"valid_targets_mean": 2264.3,
"valid_targets_min": 800
},
{
"epoch": 4.67741935483871,
"grad_norm": 0.7629820940559762,
"learning_rate": 1.199194716948512e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18513910472393036,
"step": 4785,
"valid_targets_mean": 2405.6,
"valid_targets_min": 548
},
{
"epoch": 4.682306940371457,
"grad_norm": 0.712753687411961,
"learning_rate": 1.1947297435690772e-05,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18980765342712402,
"step": 4790,
"valid_targets_mean": 2899.6,
"valid_targets_min": 916
},
{
"epoch": 4.687194525904204,
"grad_norm": 0.7285016261064938,
"learning_rate": 1.190269555059542e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17685630917549133,
"step": 4795,
"valid_targets_mean": 2543.8,
"valid_targets_min": 779
},
{
"epoch": 4.69208211143695,
"grad_norm": 0.7186549073765208,
"learning_rate": 1.1858141779220902e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17428386211395264,
"step": 4800,
"valid_targets_mean": 2633.2,
"valid_targets_min": 781
},
{
"epoch": 4.696969696969697,
"grad_norm": 0.7081619736005064,
"learning_rate": 1.1813636386303196e-05,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1797652244567871,
"step": 4805,
"valid_targets_mean": 2718.8,
"valid_targets_min": 776
},
{
"epoch": 4.701857282502444,
"grad_norm": 0.8451059412061002,
"learning_rate": 1.1769179636290801e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18409138917922974,
"step": 4810,
"valid_targets_mean": 2124.2,
"valid_targets_min": 847
},
{
"epoch": 4.706744868035191,
"grad_norm": 0.8202631061205068,
"learning_rate": 1.1724771793343192e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17531917989253998,
"step": 4815,
"valid_targets_mean": 2052.2,
"valid_targets_min": 700
},
{
"epoch": 4.711632453567938,
"grad_norm": 0.6836107410471749,
"learning_rate": 1.1680413121329243e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17793884873390198,
"step": 4820,
"valid_targets_mean": 3199.6,
"valid_targets_min": 1120
},
{
"epoch": 4.7165200391006845,
"grad_norm": 0.7484449202460228,
"learning_rate": 1.1636103883825636e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1955634206533432,
"step": 4825,
"valid_targets_mean": 2796.8,
"valid_targets_min": 1038
},
{
"epoch": 4.721407624633431,
"grad_norm": 0.8765114876948064,
"learning_rate": 1.1591844344115346e-05,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16911789774894714,
"step": 4830,
"valid_targets_mean": 1774.6,
"valid_targets_min": 637
},
{
"epoch": 4.726295210166178,
"grad_norm": 0.730247866586368,
"learning_rate": 1.1547634765186016e-05,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16497325897216797,
"step": 4835,
"valid_targets_mean": 2376.2,
"valid_targets_min": 818
},
{
"epoch": 4.731182795698925,
"grad_norm": 0.8018221641880683,
"learning_rate": 1.1503475409728448e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17386886477470398,
"step": 4840,
"valid_targets_mean": 2089.1,
"valid_targets_min": 1032
},
{
"epoch": 4.736070381231672,
"grad_norm": 0.7294276842415255,
"learning_rate": 1.1459366540135019e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1633351594209671,
"step": 4845,
"valid_targets_mean": 2460.2,
"valid_targets_min": 870
},
{
"epoch": 4.740957966764419,
"grad_norm": 0.7012095976697436,
"learning_rate": 1.1415308418498104e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1733730584383011,
"step": 4850,
"valid_targets_mean": 2616.0,
"valid_targets_min": 644
},
{
"epoch": 4.745845552297165,
"grad_norm": 0.6630187702111296,
"learning_rate": 1.137130130660855e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16590818762779236,
"step": 4855,
"valid_targets_mean": 3160.9,
"valid_targets_min": 1147
},
{
"epoch": 4.750733137829912,
"grad_norm": 0.9413915512130215,
"learning_rate": 1.1327345465954109e-05,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1672978401184082,
"step": 4860,
"valid_targets_mean": 1737.2,
"valid_targets_min": 744
},
{
"epoch": 4.755620723362659,
"grad_norm": 0.7740192526311673,
"learning_rate": 1.128344115771787e-05,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14710134267807007,
"step": 4865,
"valid_targets_mean": 2162.9,
"valid_targets_min": 612
},
{
"epoch": 4.760508308895406,
"grad_norm": 0.7042101370968502,
"learning_rate": 1.1239588642776736e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1820552498102188,
"step": 4870,
"valid_targets_mean": 2700.5,
"valid_targets_min": 856
},
{
"epoch": 4.765395894428153,
"grad_norm": 0.846516777206178,
"learning_rate": 1.1195788181699829e-05,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16076403856277466,
"step": 4875,
"valid_targets_mean": 1912.6,
"valid_targets_min": 607
},
{
"epoch": 4.7702834799608995,
"grad_norm": 0.8117401631836421,
"learning_rate": 1.1152040034747005e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19138172268867493,
"step": 4880,
"valid_targets_mean": 2053.1,
"valid_targets_min": 679
},
{
"epoch": 4.775171065493646,
"grad_norm": 0.8090125882585804,
"learning_rate": 1.1108344461867256e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18099914491176605,
"step": 4885,
"valid_targets_mean": 2086.2,
"valid_targets_min": 875
},
{
"epoch": 4.780058651026393,
"grad_norm": 0.7869706404872734,
"learning_rate": 1.1064701722697171e-05,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17875008285045624,
"step": 4890,
"valid_targets_mean": 2636.2,
"valid_targets_min": 789
},
{
"epoch": 4.78494623655914,
"grad_norm": 0.8338533349319971,
"learning_rate": 1.102111207655943e-05,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1614495813846588,
"step": 4895,
"valid_targets_mean": 2010.5,
"valid_targets_min": 1178
},
{
"epoch": 4.789833822091887,
"grad_norm": 0.8181674038081255,
"learning_rate": 1.0977575782461215e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16135358810424805,
"step": 4900,
"valid_targets_mean": 1836.6,
"valid_targets_min": 704
},
{
"epoch": 4.794721407624634,
"grad_norm": 0.7134765702982729,
"learning_rate": 1.0934093099092684e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18349812924861908,
"step": 4905,
"valid_targets_mean": 2678.9,
"valid_targets_min": 1270
},
{
"epoch": 4.79960899315738,
"grad_norm": 0.7321067232072485,
"learning_rate": 1.0890664284825488e-05,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1972254067659378,
"step": 4910,
"valid_targets_mean": 2744.4,
"valid_targets_min": 991
},
{
"epoch": 4.804496578690127,
"grad_norm": 0.7586910224470423,
"learning_rate": 1.0847289597711144e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1841929405927658,
"step": 4915,
"valid_targets_mean": 2455.1,
"valid_targets_min": 881
},
{
"epoch": 4.809384164222874,
"grad_norm": 0.7967660614928856,
"learning_rate": 1.0803969295479577e-05,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16611838340759277,
"step": 4920,
"valid_targets_mean": 1992.2,
"valid_targets_min": 699
},
{
"epoch": 4.814271749755621,
"grad_norm": 0.7051736092585311,
"learning_rate": 1.076070363553754e-05,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14659056067466736,
"step": 4925,
"valid_targets_mean": 2598.4,
"valid_targets_min": 904
},
{
"epoch": 4.819159335288368,
"grad_norm": 0.8074487953089629,
"learning_rate": 1.071749287496712e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18871314823627472,
"step": 4930,
"valid_targets_mean": 2446.9,
"valid_targets_min": 917
},
{
"epoch": 4.8240469208211145,
"grad_norm": 0.7358191683646678,
"learning_rate": 1.0674337270524195e-05,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15642912685871124,
"step": 4935,
"valid_targets_mean": 2261.7,
"valid_targets_min": 659
},
{
"epoch": 4.828934506353861,
"grad_norm": 0.7772322735086833,
"learning_rate": 1.06312370786369e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16359858214855194,
"step": 4940,
"valid_targets_mean": 2106.1,
"valid_targets_min": 706
},
{
"epoch": 4.833822091886608,
"grad_norm": 0.7984734484679462,
"learning_rate": 1.0588192555404106e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1786036491394043,
"step": 4945,
"valid_targets_mean": 1923.9,
"valid_targets_min": 1242
},
{
"epoch": 4.838709677419355,
"grad_norm": 0.7509801685683009,
"learning_rate": 1.0545203956593922e-05,
"loss": 0.1676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16603411734104156,
"step": 4950,
"valid_targets_mean": 2316.3,
"valid_targets_min": 917
},
{
"epoch": 4.843597262952102,
"grad_norm": 0.6961656843543814,
"learning_rate": 1.0502271537642144e-05,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17675796151161194,
"step": 4955,
"valid_targets_mean": 2698.9,
"valid_targets_min": 825
},
{
"epoch": 4.848484848484849,
"grad_norm": 0.8051523733028211,
"learning_rate": 1.0459395553650767e-05,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18461185693740845,
"step": 4960,
"valid_targets_mean": 1971.4,
"valid_targets_min": 727
},
{
"epoch": 4.853372434017595,
"grad_norm": 0.8334702591345402,
"learning_rate": 1.041657625938643e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19902193546295166,
"step": 4965,
"valid_targets_mean": 2607.7,
"valid_targets_min": 1300
},
{
"epoch": 4.858260019550342,
"grad_norm": 0.7868464417093073,
"learning_rate": 1.0373813909278926e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20459884405136108,
"step": 4970,
"valid_targets_mean": 2319.3,
"valid_targets_min": 861
},
{
"epoch": 4.863147605083089,
"grad_norm": 0.757600709591517,
"learning_rate": 1.0331108757419715e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1869640350341797,
"step": 4975,
"valid_targets_mean": 2491.2,
"valid_targets_min": 567
},
{
"epoch": 4.868035190615836,
"grad_norm": 0.7221664526957879,
"learning_rate": 1.0288461057560361e-05,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17515313625335693,
"step": 4980,
"valid_targets_mean": 2669.4,
"valid_targets_min": 1520
},
{
"epoch": 4.872922776148583,
"grad_norm": 0.7579422903647014,
"learning_rate": 1.0245871063111077e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1622183918952942,
"step": 4985,
"valid_targets_mean": 2357.6,
"valid_targets_min": 912
},
{
"epoch": 4.8778103616813295,
"grad_norm": 0.8067790989051661,
"learning_rate": 1.0203339027139167e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16633889079093933,
"step": 4990,
"valid_targets_mean": 1989.5,
"valid_targets_min": 632
},
{
"epoch": 4.882697947214076,
"grad_norm": 0.7758521837897394,
"learning_rate": 1.0160865202367556e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1709386706352234,
"step": 4995,
"valid_targets_mean": 2203.2,
"valid_targets_min": 829
},
{
"epoch": 4.887585532746823,
"grad_norm": 0.8248140895342541,
"learning_rate": 1.0118449841173294e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18402284383773804,
"step": 5000,
"valid_targets_mean": 2114.4,
"valid_targets_min": 720
},
{
"epoch": 4.89247311827957,
"grad_norm": 0.6897458976588339,
"learning_rate": 1.0076093195586043e-05,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16674119234085083,
"step": 5005,
"valid_targets_mean": 2625.1,
"valid_targets_min": 708
},
{
"epoch": 4.897360703812317,
"grad_norm": 0.6687153559969188,
"learning_rate": 1.0033795517286558e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17733493447303772,
"step": 5010,
"valid_targets_mean": 2868.8,
"valid_targets_min": 922
},
{
"epoch": 4.902248289345064,
"grad_norm": 0.8576695321729364,
"learning_rate": 9.991557057605244e-06,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18968823552131653,
"step": 5015,
"valid_targets_mean": 1945.0,
"valid_targets_min": 704
},
{
"epoch": 4.9071358748778104,
"grad_norm": 0.639640416335708,
"learning_rate": 9.949378067520601e-06,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14256887137889862,
"step": 5020,
"valid_targets_mean": 2694.2,
"valid_targets_min": 656
},
{
"epoch": 4.912023460410557,
"grad_norm": 0.6732914788931557,
"learning_rate": 9.90725879765779e-06,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1720367670059204,
"step": 5025,
"valid_targets_mean": 3006.6,
"valid_targets_min": 1307
},
{
"epoch": 4.916911045943304,
"grad_norm": 0.7100316647560853,
"learning_rate": 9.865199498287118e-06,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16838201880455017,
"step": 5030,
"valid_targets_mean": 2566.2,
"valid_targets_min": 826
},
{
"epoch": 4.921798631476051,
"grad_norm": 0.7460391948002998,
"learning_rate": 9.823200419322523e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16970403492450714,
"step": 5035,
"valid_targets_mean": 2189.6,
"valid_targets_min": 737
},
{
"epoch": 4.926686217008798,
"grad_norm": 0.7470863844930459,
"learning_rate": 9.781261810320151e-06,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17340749502182007,
"step": 5040,
"valid_targets_mean": 2428.0,
"valid_targets_min": 647
},
{
"epoch": 4.9315738025415445,
"grad_norm": 0.7125845379627102,
"learning_rate": 9.739383920476806e-06,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16167551279067993,
"step": 5045,
"valid_targets_mean": 2554.8,
"valid_targets_min": 544
},
{
"epoch": 4.936461388074291,
"grad_norm": 0.7572669890789546,
"learning_rate": 9.69756699862853e-06,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22088664770126343,
"step": 5050,
"valid_targets_mean": 2523.8,
"valid_targets_min": 944
},
{
"epoch": 4.941348973607038,
"grad_norm": 0.7472631938735368,
"learning_rate": 9.65581129324909e-06,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17298045754432678,
"step": 5055,
"valid_targets_mean": 2148.9,
"valid_targets_min": 591
},
{
"epoch": 4.946236559139785,
"grad_norm": 0.7406653369418025,
"learning_rate": 9.614117052448488e-06,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12865734100341797,
"step": 5060,
"valid_targets_mean": 2030.6,
"valid_targets_min": 842
},
{
"epoch": 4.951124144672532,
"grad_norm": 0.7621843768822362,
"learning_rate": 9.572484523971544e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17717863619327545,
"step": 5065,
"valid_targets_mean": 2430.3,
"valid_targets_min": 704
},
{
"epoch": 4.956011730205279,
"grad_norm": 0.7498657834356395,
"learning_rate": 9.530913955196344e-06,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18062527477741241,
"step": 5070,
"valid_targets_mean": 2419.0,
"valid_targets_min": 824
},
{
"epoch": 4.9608993157380255,
"grad_norm": 0.8141850556767372,
"learning_rate": 9.489405593132846e-06,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15304099023342133,
"step": 5075,
"valid_targets_mean": 2178.5,
"valid_targets_min": 780
},
{
"epoch": 4.965786901270772,
"grad_norm": 0.6380568455457596,
"learning_rate": 9.447959684421374e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16023944318294525,
"step": 5080,
"valid_targets_mean": 3038.6,
"valid_targets_min": 1137
},
{
"epoch": 4.970674486803519,
"grad_norm": 0.7983753521526253,
"learning_rate": 9.40657647533114e-06,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18773408234119415,
"step": 5085,
"valid_targets_mean": 2392.6,
"valid_targets_min": 753
},
{
"epoch": 4.975562072336266,
"grad_norm": 0.7019559841529516,
"learning_rate": 9.365256211758819e-06,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18119125068187714,
"step": 5090,
"valid_targets_mean": 2740.1,
"valid_targets_min": 797
},
{
"epoch": 4.980449657869013,
"grad_norm": 0.8008073853070248,
"learning_rate": 9.323999139227051e-06,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18562883138656616,
"step": 5095,
"valid_targets_mean": 2072.8,
"valid_targets_min": 764
},
{
"epoch": 4.9853372434017595,
"grad_norm": 0.7313841730070882,
"learning_rate": 9.282805502883007e-06,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1831430047750473,
"step": 5100,
"valid_targets_mean": 2517.4,
"valid_targets_min": 754
},
{
"epoch": 4.990224828934506,
"grad_norm": 0.8078162384967679,
"learning_rate": 9.241675547496938e-06,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17006579041481018,
"step": 5105,
"valid_targets_mean": 2003.2,
"valid_targets_min": 714
},
{
"epoch": 4.995112414467253,
"grad_norm": 0.8091777933799764,
"learning_rate": 9.200609517460675e-06,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18514806032180786,
"step": 5110,
"valid_targets_mean": 2168.2,
"valid_targets_min": 680
},
{
"epoch": 5.0,
"grad_norm": 0.7870915330741979,
"learning_rate": 9.159607656786222e-06,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16797024011611938,
"step": 5115,
"valid_targets_mean": 2128.8,
"valid_targets_min": 887
},
{
"epoch": 5.004887585532747,
"grad_norm": 0.7747894970742039,
"learning_rate": 9.1186702091043e-06,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16766156256198883,
"step": 5120,
"valid_targets_mean": 2120.5,
"valid_targets_min": 675
},
{
"epoch": 5.009775171065494,
"grad_norm": 0.6475219132787013,
"learning_rate": 9.077797417662888e-06,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16814623773097992,
"step": 5125,
"valid_targets_mean": 3438.9,
"valid_targets_min": 621
},
{
"epoch": 5.0146627565982405,
"grad_norm": 0.6877209083156904,
"learning_rate": 9.036989525325788e-06,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.151102676987648,
"step": 5130,
"valid_targets_mean": 3217.8,
"valid_targets_min": 768
},
{
"epoch": 5.019550342130987,
"grad_norm": 0.7324938421863219,
"learning_rate": 8.996246774571159e-06,
"loss": 0.1452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12554004788398743,
"step": 5135,
"valid_targets_mean": 2168.3,
"valid_targets_min": 1037
},
{
"epoch": 5.024437927663734,
"grad_norm": 0.7753610298141373,
"learning_rate": 8.95556940749009e-06,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14286714792251587,
"step": 5140,
"valid_targets_mean": 2078.7,
"valid_targets_min": 668
},
{
"epoch": 5.029325513196481,
"grad_norm": 0.7395423291733766,
"learning_rate": 8.914957665785184e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16619789600372314,
"step": 5145,
"valid_targets_mean": 2746.6,
"valid_targets_min": 986
},
{
"epoch": 5.034213098729228,
"grad_norm": 0.6439026975349222,
"learning_rate": 8.874411790769093e-06,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12593859434127808,
"step": 5150,
"valid_targets_mean": 2663.3,
"valid_targets_min": 1334
},
{
"epoch": 5.0391006842619745,
"grad_norm": 0.7324203667912003,
"learning_rate": 8.833932023363096e-06,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16145989298820496,
"step": 5155,
"valid_targets_mean": 2840.1,
"valid_targets_min": 1147
},
{
"epoch": 5.043988269794721,
"grad_norm": 1.2076159147090062,
"learning_rate": 8.793518604095659e-06,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16184774041175842,
"step": 5160,
"valid_targets_mean": 2118.9,
"valid_targets_min": 985
},
{
"epoch": 5.048875855327468,
"grad_norm": 0.8370647289954567,
"learning_rate": 8.753171773101e-06,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15503370761871338,
"step": 5165,
"valid_targets_mean": 2071.8,
"valid_targets_min": 741
},
{
"epoch": 5.053763440860215,
"grad_norm": 1.3707229780441046,
"learning_rate": 8.712891770117693e-06,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1608889102935791,
"step": 5170,
"valid_targets_mean": 2661.7,
"valid_targets_min": 807
},
{
"epoch": 5.058651026392962,
"grad_norm": 0.8818514323414521,
"learning_rate": 8.672678834487228e-06,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1271866112947464,
"step": 5175,
"valid_targets_mean": 1782.8,
"valid_targets_min": 933
},
{
"epoch": 5.063538611925709,
"grad_norm": 0.7996369140231598,
"learning_rate": 8.632533205152553e-06,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14621879160404205,
"step": 5180,
"valid_targets_mean": 2618.7,
"valid_targets_min": 771
},
{
"epoch": 5.0684261974584555,
"grad_norm": 0.7632406562623092,
"learning_rate": 8.592455120656726e-06,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15845827758312225,
"step": 5185,
"valid_targets_mean": 2956.1,
"valid_targets_min": 636
},
{
"epoch": 5.073313782991202,
"grad_norm": 0.8154709547280357,
"learning_rate": 8.552444819141413e-06,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15961962938308716,
"step": 5190,
"valid_targets_mean": 2535.6,
"valid_targets_min": 727
},
{
"epoch": 5.078201368523949,
"grad_norm": 0.7508882761061626,
"learning_rate": 8.512502538345568e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13347077369689941,
"step": 5195,
"valid_targets_mean": 2393.2,
"valid_targets_min": 625
},
{
"epoch": 5.083088954056696,
"grad_norm": 0.7503877902892744,
"learning_rate": 8.472628515603936e-06,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1839996576309204,
"step": 5200,
"valid_targets_mean": 3139.9,
"valid_targets_min": 1167
},
{
"epoch": 5.087976539589443,
"grad_norm": 0.814409890229622,
"learning_rate": 8.43282298784567e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16277194023132324,
"step": 5205,
"valid_targets_mean": 2501.2,
"valid_targets_min": 949
},
{
"epoch": 5.0928641251221896,
"grad_norm": 0.7086407404966241,
"learning_rate": 8.393086191592963e-06,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15189936757087708,
"step": 5210,
"valid_targets_mean": 3098.6,
"valid_targets_min": 1159
},
{
"epoch": 5.097751710654936,
"grad_norm": 0.8089395622560438,
"learning_rate": 8.353418362959564e-06,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1489260196685791,
"step": 5215,
"valid_targets_mean": 2491.1,
"valid_targets_min": 644
},
{
"epoch": 5.102639296187683,
"grad_norm": 0.8056121720254122,
"learning_rate": 8.313819737649483e-06,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15654730796813965,
"step": 5220,
"valid_targets_mean": 2591.2,
"valid_targets_min": 801
},
{
"epoch": 5.10752688172043,
"grad_norm": 0.8044880648557395,
"learning_rate": 8.274290550955468e-06,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13206225633621216,
"step": 5225,
"valid_targets_mean": 2005.5,
"valid_targets_min": 1094
},
{
"epoch": 5.112414467253177,
"grad_norm": 0.7613818292118435,
"learning_rate": 8.234831037757687e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17657440900802612,
"step": 5230,
"valid_targets_mean": 2638.0,
"valid_targets_min": 765
},
{
"epoch": 5.117302052785924,
"grad_norm": 0.6877071433658863,
"learning_rate": 8.195441432522324e-06,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1490596979856491,
"step": 5235,
"valid_targets_mean": 3027.0,
"valid_targets_min": 874
},
{
"epoch": 5.1221896383186705,
"grad_norm": 0.7403615217739022,
"learning_rate": 8.156121969300168e-06,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1425008326768875,
"step": 5240,
"valid_targets_mean": 2339.8,
"valid_targets_min": 659
},
{
"epoch": 5.127077223851417,
"grad_norm": 0.7526140740334464,
"learning_rate": 8.116872881725213e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1776733696460724,
"step": 5245,
"valid_targets_mean": 3384.4,
"valid_targets_min": 1031
},
{
"epoch": 5.131964809384164,
"grad_norm": 0.7793267157176477,
"learning_rate": 8.077694403013312e-06,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1542745679616928,
"step": 5250,
"valid_targets_mean": 2364.7,
"valid_targets_min": 712
},
{
"epoch": 5.136852394916911,
"grad_norm": 0.7971711756751064,
"learning_rate": 8.038586765960735e-06,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1412791758775711,
"step": 5255,
"valid_targets_mean": 1963.4,
"valid_targets_min": 641
},
{
"epoch": 5.141739980449658,
"grad_norm": 0.7033271354224208,
"learning_rate": 7.999550202942833e-06,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16525672376155853,
"step": 5260,
"valid_targets_mean": 3219.7,
"valid_targets_min": 809
},
{
"epoch": 5.146627565982405,
"grad_norm": 0.7247341620856336,
"learning_rate": 7.960584945912649e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16547167301177979,
"step": 5265,
"valid_targets_mean": 2777.9,
"valid_targets_min": 744
},
{
"epoch": 5.151515151515151,
"grad_norm": 0.8520459168069531,
"learning_rate": 7.921691226399492e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15888334810733795,
"step": 5270,
"valid_targets_mean": 2529.7,
"valid_targets_min": 816
},
{
"epoch": 5.156402737047898,
"grad_norm": 0.7059577585280569,
"learning_rate": 7.882869275507648e-06,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13361497223377228,
"step": 5275,
"valid_targets_mean": 2845.0,
"valid_targets_min": 704
},
{
"epoch": 5.161290322580645,
"grad_norm": 0.6859160374477156,
"learning_rate": 7.844119323914918e-06,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14880457520484924,
"step": 5280,
"valid_targets_mean": 3074.0,
"valid_targets_min": 764
},
{
"epoch": 5.166177908113392,
"grad_norm": 0.6951765797767238,
"learning_rate": 7.805441601871292e-06,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1490635871887207,
"step": 5285,
"valid_targets_mean": 3103.2,
"valid_targets_min": 1018
},
{
"epoch": 5.171065493646139,
"grad_norm": 0.7792674902926341,
"learning_rate": 7.766836339197617e-06,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1745825558900833,
"step": 5290,
"valid_targets_mean": 2414.8,
"valid_targets_min": 972
},
{
"epoch": 5.1759530791788855,
"grad_norm": 0.7243392727575753,
"learning_rate": 7.728303765284136e-06,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1535375863313675,
"step": 5295,
"valid_targets_mean": 2897.2,
"valid_targets_min": 932
},
{
"epoch": 5.180840664711632,
"grad_norm": 0.7297677901128055,
"learning_rate": 7.689844109089217e-06,
"loss": 0.1495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14912715554237366,
"step": 5300,
"valid_targets_mean": 2656.3,
"valid_targets_min": 1004
},
{
"epoch": 5.185728250244379,
"grad_norm": 0.7467264254993835,
"learning_rate": 7.651457599137929e-06,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14847451448440552,
"step": 5305,
"valid_targets_mean": 2904.3,
"valid_targets_min": 638
},
{
"epoch": 5.190615835777126,
"grad_norm": 0.8720410023528405,
"learning_rate": 7.613144463520732e-06,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1656719148159027,
"step": 5310,
"valid_targets_mean": 2167.3,
"valid_targets_min": 734
},
{
"epoch": 5.195503421309873,
"grad_norm": 0.7908689871901836,
"learning_rate": 7.574904929892093e-06,
"loss": 0.1513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16172878444194794,
"step": 5315,
"valid_targets_mean": 2394.0,
"valid_targets_min": 898
},
{
"epoch": 5.20039100684262,
"grad_norm": 0.755139638023909,
"learning_rate": 7.53673922546913e-06,
"loss": 0.1367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14658725261688232,
"step": 5320,
"valid_targets_mean": 2478.6,
"valid_targets_min": 810
},
{
"epoch": 5.205278592375366,
"grad_norm": 0.8778718952166356,
"learning_rate": 7.498647577030291e-06,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14963701367378235,
"step": 5325,
"valid_targets_mean": 2121.1,
"valid_targets_min": 635
},
{
"epoch": 5.210166177908113,
"grad_norm": 0.8376481931091295,
"learning_rate": 7.460630210913964e-06,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14989005029201508,
"step": 5330,
"valid_targets_mean": 1952.4,
"valid_targets_min": 648
},
{
"epoch": 5.21505376344086,
"grad_norm": 0.8652589359238804,
"learning_rate": 7.422687353017173e-06,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15695667266845703,
"step": 5335,
"valid_targets_mean": 1941.1,
"valid_targets_min": 795
},
{
"epoch": 5.219941348973607,
"grad_norm": 0.8041415349342634,
"learning_rate": 7.384819228794222e-06,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1654549539089203,
"step": 5340,
"valid_targets_mean": 2202.2,
"valid_targets_min": 1217
},
{
"epoch": 5.224828934506354,
"grad_norm": 0.7245646950191174,
"learning_rate": 7.347026063255338e-06,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14550118148326874,
"step": 5345,
"valid_targets_mean": 2840.0,
"valid_targets_min": 1225
},
{
"epoch": 5.2297165200391005,
"grad_norm": 0.761083682415506,
"learning_rate": 7.309308080965345e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15238893032073975,
"step": 5350,
"valid_targets_mean": 2448.1,
"valid_targets_min": 953
},
{
"epoch": 5.234604105571847,
"grad_norm": 0.8141359878753163,
"learning_rate": 7.271665506042349e-06,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1655212789773941,
"step": 5355,
"valid_targets_mean": 2414.3,
"valid_targets_min": 750
},
{
"epoch": 5.239491691104594,
"grad_norm": 0.7925319949059126,
"learning_rate": 7.234098562156382e-06,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14529694616794586,
"step": 5360,
"valid_targets_mean": 2259.9,
"valid_targets_min": 796
},
{
"epoch": 5.244379276637341,
"grad_norm": 0.8281189537598208,
"learning_rate": 7.196607472528083e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15511846542358398,
"step": 5365,
"valid_targets_mean": 2057.9,
"valid_targets_min": 696
},
{
"epoch": 5.249266862170088,
"grad_norm": 0.9202487657550533,
"learning_rate": 7.1591924599273646e-06,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16870905458927155,
"step": 5370,
"valid_targets_mean": 2043.6,
"valid_targets_min": 806
},
{
"epoch": 5.254154447702835,
"grad_norm": 0.7490177593952363,
"learning_rate": 7.121853746672087e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1420806646347046,
"step": 5375,
"valid_targets_mean": 2500.4,
"valid_targets_min": 1353
},
{
"epoch": 5.259042033235581,
"grad_norm": 0.7953194730901839,
"learning_rate": 7.084591554626761e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15275171399116516,
"step": 5380,
"valid_targets_mean": 2575.5,
"valid_targets_min": 920
},
{
"epoch": 5.263929618768328,
"grad_norm": 0.8052676980006547,
"learning_rate": 7.047406105201202e-06,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14699678122997284,
"step": 5385,
"valid_targets_mean": 2143.2,
"valid_targets_min": 514
},
{
"epoch": 5.268817204301075,
"grad_norm": 0.8178962169352656,
"learning_rate": 7.010297619349238e-06,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14148107171058655,
"step": 5390,
"valid_targets_mean": 1963.5,
"valid_targets_min": 642
},
{
"epoch": 5.273704789833822,
"grad_norm": 0.7553088050684637,
"learning_rate": 6.973266317567364e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1751079261302948,
"step": 5395,
"valid_targets_mean": 2179.1,
"valid_targets_min": 829
},
{
"epoch": 5.278592375366569,
"grad_norm": 0.7418479058847184,
"learning_rate": 6.936312419893458e-06,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1365339756011963,
"step": 5400,
"valid_targets_mean": 2537.8,
"valid_targets_min": 923
},
{
"epoch": 5.2834799608993155,
"grad_norm": 0.8557491666172627,
"learning_rate": 6.899436145905474e-06,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15646493434906006,
"step": 5405,
"valid_targets_mean": 2075.5,
"valid_targets_min": 648
},
{
"epoch": 5.288367546432062,
"grad_norm": 0.8021756331273079,
"learning_rate": 6.862637714720138e-06,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1329081803560257,
"step": 5410,
"valid_targets_mean": 1917.8,
"valid_targets_min": 682
},
{
"epoch": 5.293255131964809,
"grad_norm": 0.7229260402895247,
"learning_rate": 6.825917344991611e-06,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15381160378456116,
"step": 5415,
"valid_targets_mean": 2806.7,
"valid_targets_min": 994
},
{
"epoch": 5.298142717497556,
"grad_norm": 0.8535602266976685,
"learning_rate": 6.789275254910246e-06,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13848789036273956,
"step": 5420,
"valid_targets_mean": 1859.3,
"valid_targets_min": 713
},
{
"epoch": 5.303030303030303,
"grad_norm": 0.8074188447585233,
"learning_rate": 6.752711662201241e-06,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15609613060951233,
"step": 5425,
"valid_targets_mean": 2341.6,
"valid_targets_min": 806
},
{
"epoch": 5.30791788856305,
"grad_norm": 0.877202839044622,
"learning_rate": 6.716226784123383e-06,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16460809111595154,
"step": 5430,
"valid_targets_mean": 2276.0,
"valid_targets_min": 662
},
{
"epoch": 5.312805474095796,
"grad_norm": 0.7588859531837344,
"learning_rate": 6.6798208374677384e-06,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16514082252979279,
"step": 5435,
"valid_targets_mean": 2550.6,
"valid_targets_min": 761
},
{
"epoch": 5.317693059628543,
"grad_norm": 0.7981982898217473,
"learning_rate": 6.643494038556355e-06,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17266137897968292,
"step": 5440,
"valid_targets_mean": 2877.4,
"valid_targets_min": 1372
},
{
"epoch": 5.32258064516129,
"grad_norm": 0.7362910731569113,
"learning_rate": 6.607246603241009e-06,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15483227372169495,
"step": 5445,
"valid_targets_mean": 2524.4,
"valid_targets_min": 884
},
{
"epoch": 5.327468230694037,
"grad_norm": 0.7656377794863742,
"learning_rate": 6.571078746901878e-06,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14594011008739471,
"step": 5450,
"valid_targets_mean": 2367.2,
"valid_targets_min": 768
},
{
"epoch": 5.332355816226784,
"grad_norm": 0.6850050225914522,
"learning_rate": 6.53499068444631e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1416652500629425,
"step": 5455,
"valid_targets_mean": 2953.6,
"valid_targets_min": 704
},
{
"epoch": 5.3372434017595305,
"grad_norm": 0.7391512591400116,
"learning_rate": 6.498982630307518e-06,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1710202693939209,
"step": 5460,
"valid_targets_mean": 2936.5,
"valid_targets_min": 863
},
{
"epoch": 5.342130987292277,
"grad_norm": 0.7660416451265245,
"learning_rate": 6.463054798443287e-06,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16152888536453247,
"step": 5465,
"valid_targets_mean": 2735.8,
"valid_targets_min": 1110
},
{
"epoch": 5.347018572825024,
"grad_norm": 0.8252295444761306,
"learning_rate": 6.4272074023347606e-06,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15773028135299683,
"step": 5470,
"valid_targets_mean": 2095.6,
"valid_targets_min": 893
},
{
"epoch": 5.351906158357771,
"grad_norm": 0.9055114549440841,
"learning_rate": 6.391440654985106e-06,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17055881023406982,
"step": 5475,
"valid_targets_mean": 1950.2,
"valid_targets_min": 684
},
{
"epoch": 5.356793743890518,
"grad_norm": 0.6588127218396698,
"learning_rate": 6.355754768918301e-06,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13662315905094147,
"step": 5480,
"valid_targets_mean": 3307.9,
"valid_targets_min": 747
},
{
"epoch": 5.361681329423265,
"grad_norm": 0.7472617276476732,
"learning_rate": 6.32014995617785e-06,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15279489755630493,
"step": 5485,
"valid_targets_mean": 2531.1,
"valid_targets_min": 645
},
{
"epoch": 5.366568914956011,
"grad_norm": 0.7945430057967098,
"learning_rate": 6.284626428325504e-06,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13775640726089478,
"step": 5490,
"valid_targets_mean": 2237.1,
"valid_targets_min": 793
},
{
"epoch": 5.371456500488758,
"grad_norm": 1.1165361040355197,
"learning_rate": 6.249184396440053e-06,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15144461393356323,
"step": 5495,
"valid_targets_mean": 2468.8,
"valid_targets_min": 615
},
{
"epoch": 5.376344086021505,
"grad_norm": 0.7782637843895414,
"learning_rate": 6.2138240711160125e-06,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1696222573518753,
"step": 5500,
"valid_targets_mean": 2696.6,
"valid_targets_min": 699
},
{
"epoch": 5.381231671554252,
"grad_norm": 0.7825515135644441,
"learning_rate": 6.178545662462425e-06,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16258756816387177,
"step": 5505,
"valid_targets_mean": 2587.4,
"valid_targets_min": 754
},
{
"epoch": 5.386119257086999,
"grad_norm": 0.8421569052905954,
"learning_rate": 6.1433493801015865e-06,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13311320543289185,
"step": 5510,
"valid_targets_mean": 1930.4,
"valid_targets_min": 617
},
{
"epoch": 5.3910068426197455,
"grad_norm": 0.8261937566397005,
"learning_rate": 6.108235433167791e-06,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16040858626365662,
"step": 5515,
"valid_targets_mean": 2021.9,
"valid_targets_min": 684
},
{
"epoch": 5.395894428152492,
"grad_norm": 0.7936724009453671,
"learning_rate": 6.073204030306101e-06,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14740975201129913,
"step": 5520,
"valid_targets_mean": 2411.1,
"valid_targets_min": 636
},
{
"epoch": 5.400782013685239,
"grad_norm": 0.8088963586124284,
"learning_rate": 6.038255379671121e-06,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15532401204109192,
"step": 5525,
"valid_targets_mean": 2203.5,
"valid_targets_min": 678
},
{
"epoch": 5.405669599217986,
"grad_norm": 0.8249172911213923,
"learning_rate": 6.003389688925736e-06,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13733899593353271,
"step": 5530,
"valid_targets_mean": 2478.9,
"valid_targets_min": 738
},
{
"epoch": 5.410557184750733,
"grad_norm": 0.6793605880624324,
"learning_rate": 5.968607165239897e-06,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14237245917320251,
"step": 5535,
"valid_targets_mean": 3130.7,
"valid_targets_min": 1230
},
{
"epoch": 5.41544477028348,
"grad_norm": 0.9530584429559311,
"learning_rate": 5.933908015289367e-06,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17519810795783997,
"step": 5540,
"valid_targets_mean": 1629.4,
"valid_targets_min": 512
},
{
"epoch": 5.420332355816226,
"grad_norm": 0.7526914536401272,
"learning_rate": 5.89929244525451e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16908365488052368,
"step": 5545,
"valid_targets_mean": 2734.1,
"valid_targets_min": 1191
},
{
"epoch": 5.425219941348973,
"grad_norm": 0.7626748112290224,
"learning_rate": 5.864760660819073e-06,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16685664653778076,
"step": 5550,
"valid_targets_mean": 2915.1,
"valid_targets_min": 1098
},
{
"epoch": 5.43010752688172,
"grad_norm": 0.8034530660024547,
"learning_rate": 5.830312867168948e-06,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14739468693733215,
"step": 5555,
"valid_targets_mean": 2265.8,
"valid_targets_min": 692
},
{
"epoch": 5.434995112414467,
"grad_norm": 0.7652321619302118,
"learning_rate": 5.795949268990964e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14698611199855804,
"step": 5560,
"valid_targets_mean": 2454.2,
"valid_targets_min": 717
},
{
"epoch": 5.439882697947214,
"grad_norm": 0.8333089448649366,
"learning_rate": 5.7616700704716545e-06,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15633103251457214,
"step": 5565,
"valid_targets_mean": 2116.5,
"valid_targets_min": 848
},
{
"epoch": 5.4447702834799605,
"grad_norm": 0.8009884901164667,
"learning_rate": 5.727475475296047e-06,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15122680366039276,
"step": 5570,
"valid_targets_mean": 2134.5,
"valid_targets_min": 900
},
{
"epoch": 5.449657869012707,
"grad_norm": 0.8124584053736166,
"learning_rate": 5.693365686646501e-06,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16159634292125702,
"step": 5575,
"valid_targets_mean": 2173.5,
"valid_targets_min": 809
},
{
"epoch": 5.454545454545454,
"grad_norm": 0.7935256921202335,
"learning_rate": 5.659340907201418e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16111275553703308,
"step": 5580,
"valid_targets_mean": 2267.2,
"valid_targets_min": 701
},
{
"epoch": 5.459433040078201,
"grad_norm": 0.6835989696344518,
"learning_rate": 5.625401339134093e-06,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14738526940345764,
"step": 5585,
"valid_targets_mean": 3000.6,
"valid_targets_min": 879
},
{
"epoch": 5.464320625610948,
"grad_norm": 0.7930964833671504,
"learning_rate": 5.591547184111514e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1674892157316208,
"step": 5590,
"valid_targets_mean": 2696.9,
"valid_targets_min": 687
},
{
"epoch": 5.469208211143695,
"grad_norm": 0.744501626898747,
"learning_rate": 5.557778643293117e-06,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16441041231155396,
"step": 5595,
"valid_targets_mean": 2941.3,
"valid_targets_min": 1195
},
{
"epoch": 5.474095796676442,
"grad_norm": 0.7910032892994638,
"learning_rate": 5.524095917329668e-06,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16341263055801392,
"step": 5600,
"valid_targets_mean": 2293.9,
"valid_targets_min": 1001
},
{
"epoch": 5.478983382209188,
"grad_norm": 0.8189803335488413,
"learning_rate": 5.490499206361992e-06,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1621970534324646,
"step": 5605,
"valid_targets_mean": 2192.6,
"valid_targets_min": 1044
},
{
"epoch": 5.483870967741936,
"grad_norm": 0.8435168373600971,
"learning_rate": 5.456988710019822e-06,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1423211395740509,
"step": 5610,
"valid_targets_mean": 1718.4,
"valid_targets_min": 756
},
{
"epoch": 5.488758553274682,
"grad_norm": 0.8432435824638052,
"learning_rate": 5.4235646274206185e-06,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15067586302757263,
"step": 5615,
"valid_targets_mean": 2142.1,
"valid_targets_min": 632
},
{
"epoch": 5.49364613880743,
"grad_norm": 0.8434772077306247,
"learning_rate": 5.3902271571683815e-06,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15619194507598877,
"step": 5620,
"valid_targets_mean": 2239.2,
"valid_targets_min": 719
},
{
"epoch": 5.4985337243401755,
"grad_norm": 0.7932516543133425,
"learning_rate": 5.356976497352442e-06,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14296786487102509,
"step": 5625,
"valid_targets_mean": 2430.8,
"valid_targets_min": 878
},
{
"epoch": 5.503421309872923,
"grad_norm": 0.7340907560380051,
"learning_rate": 5.323812845546334e-06,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15341924130916595,
"step": 5630,
"valid_targets_mean": 2661.9,
"valid_targets_min": 889
},
{
"epoch": 5.508308895405669,
"grad_norm": 0.9584349909909398,
"learning_rate": 5.290736398806575e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17308732867240906,
"step": 5635,
"valid_targets_mean": 1577.6,
"valid_targets_min": 848
},
{
"epoch": 5.513196480938417,
"grad_norm": 0.8019713328945052,
"learning_rate": 5.2577473536715275e-06,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16516554355621338,
"step": 5640,
"valid_targets_mean": 2460.1,
"valid_targets_min": 1066
},
{
"epoch": 5.518084066471163,
"grad_norm": 0.8191884705772617,
"learning_rate": 5.224845906160219e-06,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15267640352249146,
"step": 5645,
"valid_targets_mean": 2165.6,
"valid_targets_min": 752
},
{
"epoch": 5.5229716520039105,
"grad_norm": 0.8330339846872703,
"learning_rate": 5.1920322517711615e-06,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15274596214294434,
"step": 5650,
"valid_targets_mean": 2050.2,
"valid_targets_min": 591
},
{
"epoch": 5.527859237536656,
"grad_norm": 0.7824632706097082,
"learning_rate": 5.1593065854812294e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1320272833108902,
"step": 5655,
"valid_targets_mean": 2084.6,
"valid_targets_min": 789
},
{
"epoch": 5.532746823069404,
"grad_norm": 0.8015604744159438,
"learning_rate": 5.1266691017444505e-06,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1577574610710144,
"step": 5660,
"valid_targets_mean": 2387.2,
"valid_targets_min": 800
},
{
"epoch": 5.53763440860215,
"grad_norm": 0.7592693450999322,
"learning_rate": 5.094119994490898e-06,
"loss": 0.1595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16440163552761078,
"step": 5665,
"valid_targets_mean": 2866.8,
"valid_targets_min": 772
},
{
"epoch": 5.542521994134898,
"grad_norm": 0.7921173779072441,
"learning_rate": 5.061659457125514e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15453504025936127,
"step": 5670,
"valid_targets_mean": 2380.8,
"valid_targets_min": 1188
},
{
"epoch": 5.547409579667644,
"grad_norm": 0.8120586505606648,
"learning_rate": 5.029287682526949e-06,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16854724287986755,
"step": 5675,
"valid_targets_mean": 2460.8,
"valid_targets_min": 742
},
{
"epoch": 5.552297165200391,
"grad_norm": 0.8499742573768506,
"learning_rate": 4.997004863046446e-06,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1677948236465454,
"step": 5680,
"valid_targets_mean": 2218.1,
"valid_targets_min": 1013
},
{
"epoch": 5.557184750733137,
"grad_norm": 0.8783081648919876,
"learning_rate": 4.964811190506671e-06,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18013803660869598,
"step": 5685,
"valid_targets_mean": 2322.4,
"valid_targets_min": 692
},
{
"epoch": 5.562072336265885,
"grad_norm": 0.7709090075615438,
"learning_rate": 4.932706856200589e-06,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14455710351467133,
"step": 5690,
"valid_targets_mean": 2390.8,
"valid_targets_min": 626
},
{
"epoch": 5.566959921798632,
"grad_norm": 0.8439698983111165,
"learning_rate": 4.90069205089033e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16360528767108917,
"step": 5695,
"valid_targets_mean": 2045.9,
"valid_targets_min": 708
},
{
"epoch": 5.571847507331379,
"grad_norm": 0.8445073532119768,
"learning_rate": 4.868766964806029e-06,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16692796349525452,
"step": 5700,
"valid_targets_mean": 2184.8,
"valid_targets_min": 970
},
{
"epoch": 5.5767350928641255,
"grad_norm": 0.7247679212006615,
"learning_rate": 4.8369317876447365e-06,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15431565046310425,
"step": 5705,
"valid_targets_mean": 3089.9,
"valid_targets_min": 1388
},
{
"epoch": 5.581622678396872,
"grad_norm": 0.7600528639537043,
"learning_rate": 4.805186708569245e-06,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17368043959140778,
"step": 5710,
"valid_targets_mean": 2844.1,
"valid_targets_min": 958
},
{
"epoch": 5.586510263929619,
"grad_norm": 0.7391855729545126,
"learning_rate": 4.773531916207008e-06,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13605889678001404,
"step": 5715,
"valid_targets_mean": 2471.4,
"valid_targets_min": 992
},
{
"epoch": 5.591397849462366,
"grad_norm": 0.769129841502073,
"learning_rate": 4.741967598649002e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15731492638587952,
"step": 5720,
"valid_targets_mean": 2548.4,
"valid_targets_min": 711
},
{
"epoch": 5.596285434995113,
"grad_norm": 1.1287691604840524,
"learning_rate": 4.7104939434485884e-06,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1409187912940979,
"step": 5725,
"valid_targets_mean": 2582.1,
"valid_targets_min": 892
},
{
"epoch": 5.60117302052786,
"grad_norm": 0.9156130590977292,
"learning_rate": 4.679111137620442e-06,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1329200565814972,
"step": 5730,
"valid_targets_mean": 1692.3,
"valid_targets_min": 591
},
{
"epoch": 5.606060606060606,
"grad_norm": 0.8263554263382872,
"learning_rate": 4.64781936763939e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14420738816261292,
"step": 5735,
"valid_targets_mean": 2274.1,
"valid_targets_min": 830
},
{
"epoch": 5.610948191593353,
"grad_norm": 0.7412321177836615,
"learning_rate": 4.616618819439353e-06,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1455959975719452,
"step": 5740,
"valid_targets_mean": 2443.1,
"valid_targets_min": 875
},
{
"epoch": 5.6158357771261,
"grad_norm": 0.7056612270287848,
"learning_rate": 4.585509678412208e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15663772821426392,
"step": 5745,
"valid_targets_mean": 3141.4,
"valid_targets_min": 1052
},
{
"epoch": 5.620723362658847,
"grad_norm": 0.8069910406282396,
"learning_rate": 4.5544921294066935e-06,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14563411474227905,
"step": 5750,
"valid_targets_mean": 2318.9,
"valid_targets_min": 1035
},
{
"epoch": 5.625610948191594,
"grad_norm": 0.8114201491577269,
"learning_rate": 4.523566356727309e-06,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1693604439496994,
"step": 5755,
"valid_targets_mean": 2370.1,
"valid_targets_min": 869
},
{
"epoch": 5.6304985337243405,
"grad_norm": 0.8443036168376865,
"learning_rate": 4.492732544133236e-06,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15634265542030334,
"step": 5760,
"valid_targets_mean": 1911.4,
"valid_targets_min": 700
},
{
"epoch": 5.635386119257087,
"grad_norm": 0.787586816101732,
"learning_rate": 4.461990874837227e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15353325009346008,
"step": 5765,
"valid_targets_mean": 2510.8,
"valid_targets_min": 762
},
{
"epoch": 5.640273704789834,
"grad_norm": 0.8265538830295129,
"learning_rate": 4.431341531504536e-06,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17224039137363434,
"step": 5770,
"valid_targets_mean": 2606.2,
"valid_targets_min": 897
},
{
"epoch": 5.645161290322581,
"grad_norm": 0.9987858614241965,
"learning_rate": 4.400784696251801e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1915130913257599,
"step": 5775,
"valid_targets_mean": 2068.2,
"valid_targets_min": 1206
},
{
"epoch": 5.650048875855328,
"grad_norm": 0.8197168076239274,
"learning_rate": 4.37032055064599e-06,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1514715850353241,
"step": 5780,
"valid_targets_mean": 2108.2,
"valid_targets_min": 629
},
{
"epoch": 5.654936461388075,
"grad_norm": 0.7371445886865936,
"learning_rate": 4.3399492757033235e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20320241153240204,
"step": 5785,
"valid_targets_mean": 2937.3,
"valid_targets_min": 720
},
{
"epoch": 5.659824046920821,
"grad_norm": 0.860820707417868,
"learning_rate": 4.309671051888187e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14680787920951843,
"step": 5790,
"valid_targets_mean": 1897.9,
"valid_targets_min": 534
},
{
"epoch": 5.664711632453568,
"grad_norm": 0.7425530568167907,
"learning_rate": 4.27948605911205e-06,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18525880575180054,
"step": 5795,
"valid_targets_mean": 2515.6,
"valid_targets_min": 752
},
{
"epoch": 5.669599217986315,
"grad_norm": 0.7672403302530817,
"learning_rate": 4.2493944767324245e-06,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17380796372890472,
"step": 5800,
"valid_targets_mean": 2673.0,
"valid_targets_min": 701
},
{
"epoch": 5.674486803519062,
"grad_norm": 0.8190685848445297,
"learning_rate": 4.2193964835517656e-06,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1683279573917389,
"step": 5805,
"valid_targets_mean": 2120.9,
"valid_targets_min": 965
},
{
"epoch": 5.679374389051809,
"grad_norm": 1.002164296776056,
"learning_rate": 4.189492257816443e-06,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14651206135749817,
"step": 5810,
"valid_targets_mean": 2480.2,
"valid_targets_min": 740
},
{
"epoch": 5.6842619745845555,
"grad_norm": 0.8097394342502438,
"learning_rate": 4.159681977215663e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17866715788841248,
"step": 5815,
"valid_targets_mean": 2452.8,
"valid_targets_min": 867
},
{
"epoch": 5.689149560117302,
"grad_norm": 0.8423732358599466,
"learning_rate": 4.1299658188804015e-06,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1501942276954651,
"step": 5820,
"valid_targets_mean": 2100.3,
"valid_targets_min": 741
},
{
"epoch": 5.694037145650049,
"grad_norm": 0.7237945688434769,
"learning_rate": 4.1003439593823865e-06,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15869738161563873,
"step": 5825,
"valid_targets_mean": 2729.0,
"valid_targets_min": 986
},
{
"epoch": 5.698924731182796,
"grad_norm": 0.7467148363318494,
"learning_rate": 4.070816574733003e-06,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14755885303020477,
"step": 5830,
"valid_targets_mean": 2749.3,
"valid_targets_min": 980
},
{
"epoch": 5.703812316715543,
"grad_norm": 0.7867120070266118,
"learning_rate": 4.041383840382294e-06,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.161052405834198,
"step": 5835,
"valid_targets_mean": 2601.4,
"valid_targets_min": 1062
},
{
"epoch": 5.70869990224829,
"grad_norm": 0.9049628718004302,
"learning_rate": 4.01204593121789e-06,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15240147709846497,
"step": 5840,
"valid_targets_mean": 1931.8,
"valid_targets_min": 722
},
{
"epoch": 5.713587487781036,
"grad_norm": 0.8698769453803369,
"learning_rate": 3.982803021563961e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14392434060573578,
"step": 5845,
"valid_targets_mean": 2359.8,
"valid_targets_min": 790
},
{
"epoch": 5.718475073313783,
"grad_norm": 0.7228885339388987,
"learning_rate": 3.953655285180223e-06,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14013831317424774,
"step": 5850,
"valid_targets_mean": 2797.0,
"valid_targets_min": 640
},
{
"epoch": 5.72336265884653,
"grad_norm": 0.7537686797769533,
"learning_rate": 3.924602895260843e-06,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12795598804950714,
"step": 5855,
"valid_targets_mean": 2317.8,
"valid_targets_min": 715
},
{
"epoch": 5.728250244379277,
"grad_norm": 0.7471691429860486,
"learning_rate": 3.895646024433475e-06,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15418082475662231,
"step": 5860,
"valid_targets_mean": 2598.8,
"valid_targets_min": 734
},
{
"epoch": 5.733137829912024,
"grad_norm": 0.7549943500132472,
"learning_rate": 3.866784844758196e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1698361039161682,
"step": 5865,
"valid_targets_mean": 2571.3,
"valid_targets_min": 1006
},
{
"epoch": 5.7380254154447705,
"grad_norm": 0.7902697956389423,
"learning_rate": 3.838019527726478e-06,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15650413930416107,
"step": 5870,
"valid_targets_mean": 2332.9,
"valid_targets_min": 748
},
{
"epoch": 5.742913000977517,
"grad_norm": 0.7626167489885958,
"learning_rate": 3.8093502442602037e-06,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1520456075668335,
"step": 5875,
"valid_targets_mean": 2732.3,
"valid_targets_min": 851
},
{
"epoch": 5.747800586510264,
"grad_norm": 0.890203614110944,
"learning_rate": 3.7807771647106073e-06,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16833049058914185,
"step": 5880,
"valid_targets_mean": 2514.6,
"valid_targets_min": 1051
},
{
"epoch": 5.752688172043011,
"grad_norm": 0.7072501670025816,
"learning_rate": 3.752300458857303e-06,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15029340982437134,
"step": 5885,
"valid_targets_mean": 3031.2,
"valid_targets_min": 837
},
{
"epoch": 5.757575757575758,
"grad_norm": 0.7640980023033417,
"learning_rate": 3.723920295907255e-06,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1618524044752121,
"step": 5890,
"valid_targets_mean": 2569.4,
"valid_targets_min": 728
},
{
"epoch": 5.762463343108505,
"grad_norm": 0.7319035255044318,
"learning_rate": 3.695636844493764e-06,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16255182027816772,
"step": 5895,
"valid_targets_mean": 3114.8,
"valid_targets_min": 951
},
{
"epoch": 5.767350928641251,
"grad_norm": 0.8063750882434633,
"learning_rate": 3.66745027267549e-06,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1666271686553955,
"step": 5900,
"valid_targets_mean": 2507.8,
"valid_targets_min": 986
},
{
"epoch": 5.772238514173998,
"grad_norm": 0.8345912032783375,
"learning_rate": 3.6393607479354275e-06,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15384799242019653,
"step": 5905,
"valid_targets_mean": 1862.2,
"valid_targets_min": 635
},
{
"epoch": 5.777126099706745,
"grad_norm": 0.7061819113437781,
"learning_rate": 3.611368437179934e-06,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18276137113571167,
"step": 5910,
"valid_targets_mean": 3247.3,
"valid_targets_min": 1489
},
{
"epoch": 5.782013685239492,
"grad_norm": 0.8167005148421289,
"learning_rate": 3.583473506737727e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1597469002008438,
"step": 5915,
"valid_targets_mean": 2362.9,
"valid_targets_min": 759
},
{
"epoch": 5.786901270772239,
"grad_norm": 0.7711204073304082,
"learning_rate": 3.555676122358884e-06,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1491527557373047,
"step": 5920,
"valid_targets_mean": 2585.6,
"valid_targets_min": 1306
},
{
"epoch": 5.7917888563049855,
"grad_norm": 0.7283811601045469,
"learning_rate": 3.5279764492138724e-06,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17027896642684937,
"step": 5925,
"valid_targets_mean": 3067.6,
"valid_targets_min": 522
},
{
"epoch": 5.796676441837732,
"grad_norm": 0.7011679340720517,
"learning_rate": 3.500374651892573e-06,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1561456024646759,
"step": 5930,
"valid_targets_mean": 2874.4,
"valid_targets_min": 851
},
{
"epoch": 5.801564027370479,
"grad_norm": 0.9979178900846251,
"learning_rate": 3.472870894403291e-06,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1694871187210083,
"step": 5935,
"valid_targets_mean": 2362.9,
"valid_targets_min": 513
},
{
"epoch": 5.806451612903226,
"grad_norm": 0.8639990166797461,
"learning_rate": 3.4454653401717896e-06,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12851397693157196,
"step": 5940,
"valid_targets_mean": 1915.4,
"valid_targets_min": 746
},
{
"epoch": 5.811339198435973,
"grad_norm": 0.6986837988916482,
"learning_rate": 3.4181581520403005e-06,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15324917435646057,
"step": 5945,
"valid_targets_mean": 3119.9,
"valid_targets_min": 1011
},
{
"epoch": 5.81622678396872,
"grad_norm": 0.8313260438961377,
"learning_rate": 3.390949492266569e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1447916030883789,
"step": 5950,
"valid_targets_mean": 2159.3,
"valid_targets_min": 800
},
{
"epoch": 5.821114369501466,
"grad_norm": 0.885127583979189,
"learning_rate": 3.363839522522916e-06,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15982311964035034,
"step": 5955,
"valid_targets_mean": 1842.9,
"valid_targets_min": 607
},
{
"epoch": 5.826001955034213,
"grad_norm": 0.7808780924503399,
"learning_rate": 3.336828403895227e-06,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1592644453048706,
"step": 5960,
"valid_targets_mean": 2727.3,
"valid_targets_min": 1050
},
{
"epoch": 5.83088954056696,
"grad_norm": 0.685353500101023,
"learning_rate": 3.309916296882021e-06,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1466306447982788,
"step": 5965,
"valid_targets_mean": 2775.5,
"valid_targets_min": 627
},
{
"epoch": 5.835777126099707,
"grad_norm": 1.2671880923497407,
"learning_rate": 3.2831033613935092e-06,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15228471159934998,
"step": 5970,
"valid_targets_mean": 2204.8,
"valid_targets_min": 1143
},
{
"epoch": 5.840664711632454,
"grad_norm": 0.7532578861942046,
"learning_rate": 3.256389756750613e-06,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13797354698181152,
"step": 5975,
"valid_targets_mean": 2369.1,
"valid_targets_min": 788
},
{
"epoch": 5.8455522971652005,
"grad_norm": 0.7743267560564064,
"learning_rate": 3.229775641684063e-06,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16579267382621765,
"step": 5980,
"valid_targets_mean": 2343.3,
"valid_targets_min": 888
},
{
"epoch": 5.850439882697947,
"grad_norm": 0.7015726455253567,
"learning_rate": 3.203261174333403e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14441198110580444,
"step": 5985,
"valid_targets_mean": 2980.8,
"valid_targets_min": 807
},
{
"epoch": 5.855327468230694,
"grad_norm": 0.7070459951461793,
"learning_rate": 3.1768465122460813e-06,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1486390233039856,
"step": 5990,
"valid_targets_mean": 2794.2,
"valid_targets_min": 824
},
{
"epoch": 5.860215053763441,
"grad_norm": 0.7969197667556421,
"learning_rate": 3.1505318123765137e-06,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16264227032661438,
"step": 5995,
"valid_targets_mean": 2405.8,
"valid_targets_min": 1005
},
{
"epoch": 5.865102639296188,
"grad_norm": 0.7190738114648545,
"learning_rate": 3.12431723108515e-06,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1532568335533142,
"step": 6000,
"valid_targets_mean": 2788.5,
"valid_targets_min": 903
},
{
"epoch": 5.869990224828935,
"grad_norm": 0.7936029883530649,
"learning_rate": 3.0982029241375343e-06,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16097313165664673,
"step": 6005,
"valid_targets_mean": 2423.9,
"valid_targets_min": 911
},
{
"epoch": 5.874877810361681,
"grad_norm": 0.7946199748419005,
"learning_rate": 3.0721890467033866e-06,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1583392471075058,
"step": 6010,
"valid_targets_mean": 2257.8,
"valid_targets_min": 654
},
{
"epoch": 5.879765395894428,
"grad_norm": 0.8074320913746822,
"learning_rate": 3.0462757533556784e-06,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13972869515419006,
"step": 6015,
"valid_targets_mean": 2338.6,
"valid_targets_min": 708
},
{
"epoch": 5.884652981427175,
"grad_norm": 0.8929139568223418,
"learning_rate": 3.020463198069721e-06,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16818490624427795,
"step": 6020,
"valid_targets_mean": 2117.4,
"valid_targets_min": 727
},
{
"epoch": 5.889540566959922,
"grad_norm": 0.6713747500739194,
"learning_rate": 2.994751534222251e-06,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1403338611125946,
"step": 6025,
"valid_targets_mean": 2784.2,
"valid_targets_min": 1212
},
{
"epoch": 5.894428152492669,
"grad_norm": 0.7757304779081556,
"learning_rate": 2.969140914590498e-06,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14841482043266296,
"step": 6030,
"valid_targets_mean": 2193.8,
"valid_targets_min": 790
},
{
"epoch": 5.8993157380254155,
"grad_norm": 0.8629820125294086,
"learning_rate": 2.943631491351311e-06,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15556024014949799,
"step": 6035,
"valid_targets_mean": 2002.3,
"valid_targets_min": 1163
},
{
"epoch": 5.904203323558162,
"grad_norm": 0.8188534807515834,
"learning_rate": 2.918223416080219e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16173824667930603,
"step": 6040,
"valid_targets_mean": 2232.9,
"valid_targets_min": 891
},
{
"epoch": 5.909090909090909,
"grad_norm": 0.8132660493437572,
"learning_rate": 2.892916839750557e-06,
"loss": 0.1405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1494334191083908,
"step": 6045,
"valid_targets_mean": 2253.3,
"valid_targets_min": 732
},
{
"epoch": 5.913978494623656,
"grad_norm": 0.654182287461871,
"learning_rate": 2.8677119127325625e-06,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15798476338386536,
"step": 6050,
"valid_targets_mean": 3594.9,
"valid_targets_min": 1150
},
{
"epoch": 5.918866080156403,
"grad_norm": 0.6693246221511635,
"learning_rate": 2.8426087847924643e-06,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13518929481506348,
"step": 6055,
"valid_targets_mean": 2902.4,
"valid_targets_min": 1123
},
{
"epoch": 5.92375366568915,
"grad_norm": 0.8107053745570154,
"learning_rate": 2.8176076050916255e-06,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15758317708969116,
"step": 6060,
"valid_targets_mean": 2398.6,
"valid_targets_min": 711
},
{
"epoch": 5.9286412512218964,
"grad_norm": 0.9021761140325874,
"learning_rate": 2.7927085221856185e-06,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15211939811706543,
"step": 6065,
"valid_targets_mean": 1915.1,
"valid_targets_min": 619
},
{
"epoch": 5.933528836754643,
"grad_norm": 0.7392044459110118,
"learning_rate": 2.7679116840233788e-06,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442590355873108,
"step": 6070,
"valid_targets_mean": 2682.1,
"valid_targets_min": 837
},
{
"epoch": 5.93841642228739,
"grad_norm": 0.7909706387505339,
"learning_rate": 2.7432172379463073e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1507616639137268,
"step": 6075,
"valid_targets_mean": 2728.3,
"valid_targets_min": 1133
},
{
"epoch": 5.943304007820137,
"grad_norm": 0.6858517709489104,
"learning_rate": 2.718625330687381e-06,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1569923758506775,
"step": 6080,
"valid_targets_mean": 3103.2,
"valid_targets_min": 698
},
{
"epoch": 5.948191593352884,
"grad_norm": 0.7282489397560563,
"learning_rate": 2.6941361083703244e-06,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15824103355407715,
"step": 6085,
"valid_targets_mean": 3084.2,
"valid_targets_min": 1098
},
{
"epoch": 5.9530791788856305,
"grad_norm": 0.8200856694692574,
"learning_rate": 2.6697497165086826e-06,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14971165359020233,
"step": 6090,
"valid_targets_mean": 1849.7,
"valid_targets_min": 690
},
{
"epoch": 5.957966764418377,
"grad_norm": 0.8145406485221162,
"learning_rate": 2.645466300005013e-06,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14848312735557556,
"step": 6095,
"valid_targets_mean": 2086.6,
"valid_targets_min": 765
},
{
"epoch": 5.962854349951124,
"grad_norm": 0.7660068981755783,
"learning_rate": 2.6212860031499942e-06,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14158686995506287,
"step": 6100,
"valid_targets_mean": 2279.2,
"valid_targets_min": 1033
},
{
"epoch": 5.967741935483871,
"grad_norm": 0.8064378082219088,
"learning_rate": 2.597208969621561e-06,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14924579858779907,
"step": 6105,
"valid_targets_mean": 2187.1,
"valid_targets_min": 777
},
{
"epoch": 5.972629521016618,
"grad_norm": 0.7501577303291025,
"learning_rate": 2.5732353424840817e-06,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14925900101661682,
"step": 6110,
"valid_targets_mean": 2335.9,
"valid_targets_min": 634
},
{
"epoch": 5.977517106549365,
"grad_norm": 0.7898048269613115,
"learning_rate": 2.549365264187469e-06,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15726542472839355,
"step": 6115,
"valid_targets_mean": 2276.5,
"valid_targets_min": 1190
},
{
"epoch": 5.9824046920821115,
"grad_norm": 0.7940500094930575,
"learning_rate": 2.525598876566371e-06,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1534472405910492,
"step": 6120,
"valid_targets_mean": 2346.0,
"valid_targets_min": 809
},
{
"epoch": 5.987292277614858,
"grad_norm": 0.882710433816707,
"learning_rate": 2.5019363208393133e-06,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18637877702713013,
"step": 6125,
"valid_targets_mean": 1959.3,
"valid_targets_min": 1010
},
{
"epoch": 5.992179863147605,
"grad_norm": 0.798333765699043,
"learning_rate": 2.4783777376078443e-06,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15766102075576782,
"step": 6130,
"valid_targets_mean": 2160.6,
"valid_targets_min": 1137
},
{
"epoch": 5.997067448680352,
"grad_norm": 0.8188870991896096,
"learning_rate": 2.4549232668557154e-06,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15294690430164337,
"step": 6135,
"valid_targets_mean": 2066.3,
"valid_targets_min": 733
},
{
"epoch": 6.001955034213099,
"grad_norm": 0.772371500976364,
"learning_rate": 2.4315730479480614e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14228251576423645,
"step": 6140,
"valid_targets_mean": 2113.5,
"valid_targets_min": 941
},
{
"epoch": 6.0068426197458455,
"grad_norm": 0.6951812269111425,
"learning_rate": 2.4083272196305483e-06,
"loss": 0.146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12359236180782318,
"step": 6145,
"valid_targets_mean": 2279.8,
"valid_targets_min": 901
},
{
"epoch": 6.011730205278592,
"grad_norm": 0.7341125048499366,
"learning_rate": 2.385185920028563e-06,
"loss": 0.1344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12021429091691971,
"step": 6150,
"valid_targets_mean": 2476.9,
"valid_targets_min": 834
},
{
"epoch": 6.016617790811339,
"grad_norm": 0.8580978920271629,
"learning_rate": 2.3621492866463845e-06,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14868280291557312,
"step": 6155,
"valid_targets_mean": 2026.8,
"valid_targets_min": 776
},
{
"epoch": 6.021505376344086,
"grad_norm": 0.8292027396293019,
"learning_rate": 2.3392174563663716e-06,
"loss": 0.1455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.154433935880661,
"step": 6160,
"valid_targets_mean": 2073.4,
"valid_targets_min": 610
},
{
"epoch": 6.026392961876833,
"grad_norm": 0.8083140379382482,
"learning_rate": 2.3163905654481524e-06,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15254239737987518,
"step": 6165,
"valid_targets_mean": 2362.4,
"valid_targets_min": 988
},
{
"epoch": 6.03128054740958,
"grad_norm": 0.711249329248669,
"learning_rate": 2.293668749527809e-06,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13382339477539062,
"step": 6170,
"valid_targets_mean": 2892.4,
"valid_targets_min": 761
},
{
"epoch": 6.0361681329423265,
"grad_norm": 0.7271334674837908,
"learning_rate": 2.2710521436170807e-06,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15734508633613586,
"step": 6175,
"valid_targets_mean": 3120.2,
"valid_targets_min": 1168
},
{
"epoch": 6.041055718475073,
"grad_norm": 0.8320574708134784,
"learning_rate": 2.2485408821025435e-06,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15673065185546875,
"step": 6180,
"valid_targets_mean": 2314.8,
"valid_targets_min": 676
},
{
"epoch": 6.04594330400782,
"grad_norm": 0.7618387380481915,
"learning_rate": 2.226135098744824e-06,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15294227004051208,
"step": 6185,
"valid_targets_mean": 2752.2,
"valid_targets_min": 1263
},
{
"epoch": 6.050830889540567,
"grad_norm": 0.7682499575279256,
"learning_rate": 2.2038349266778146e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16213871538639069,
"step": 6190,
"valid_targets_mean": 2590.8,
"valid_targets_min": 764
},
{
"epoch": 6.055718475073314,
"grad_norm": 0.835630554054457,
"learning_rate": 2.1816404984078664e-06,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14952757954597473,
"step": 6195,
"valid_targets_mean": 2388.6,
"valid_targets_min": 678
},
{
"epoch": 6.0606060606060606,
"grad_norm": 0.7123162200549785,
"learning_rate": 2.1595519458129967e-06,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13014379143714905,
"step": 6200,
"valid_targets_mean": 2729.5,
"valid_targets_min": 815
},
{
"epoch": 6.065493646138807,
"grad_norm": 0.8818566517853015,
"learning_rate": 2.1375694001421343e-06,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15553683042526245,
"step": 6205,
"valid_targets_mean": 1978.7,
"valid_targets_min": 761
},
{
"epoch": 6.070381231671554,
"grad_norm": 0.7715315446565182,
"learning_rate": 2.115692992014304e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15126900374889374,
"step": 6210,
"valid_targets_mean": 2411.3,
"valid_targets_min": 1339
},
{
"epoch": 6.075268817204301,
"grad_norm": 0.8184332591539848,
"learning_rate": 2.0939228514178735e-06,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.146785169839859,
"step": 6215,
"valid_targets_mean": 2621.6,
"valid_targets_min": 892
},
{
"epoch": 6.080156402737048,
"grad_norm": 0.8703651745159651,
"learning_rate": 2.0722591077097844e-06,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14825935661792755,
"step": 6220,
"valid_targets_mean": 1934.5,
"valid_targets_min": 621
},
{
"epoch": 6.085043988269795,
"grad_norm": 0.8574526478965231,
"learning_rate": 2.0507018896147525e-06,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1470494568347931,
"step": 6225,
"valid_targets_mean": 2009.9,
"valid_targets_min": 591
},
{
"epoch": 6.0899315738025415,
"grad_norm": 0.8481048091940785,
"learning_rate": 2.0292513252245507e-06,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15715302526950836,
"step": 6230,
"valid_targets_mean": 2249.1,
"valid_targets_min": 750
},
{
"epoch": 6.094819159335288,
"grad_norm": 0.8473826531669545,
"learning_rate": 2.0079075419971937e-06,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15390710532665253,
"step": 6235,
"valid_targets_mean": 2229.1,
"valid_targets_min": 659
},
{
"epoch": 6.099706744868035,
"grad_norm": 0.813390106542457,
"learning_rate": 1.986670666756234e-06,
"loss": 0.1407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1278359740972519,
"step": 6240,
"valid_targets_mean": 2046.5,
"valid_targets_min": 814
},
{
"epoch": 6.104594330400782,
"grad_norm": 0.8400309752046771,
"learning_rate": 1.9655408256899713e-06,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15281391143798828,
"step": 6245,
"valid_targets_mean": 2291.9,
"valid_targets_min": 733
},
{
"epoch": 6.109481915933529,
"grad_norm": 0.7250372273390747,
"learning_rate": 1.944518144350709e-06,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1458112895488739,
"step": 6250,
"valid_targets_mean": 2883.2,
"valid_targets_min": 804
},
{
"epoch": 6.114369501466276,
"grad_norm": 0.8632663254658965,
"learning_rate": 1.9236027476540276e-06,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14336003363132477,
"step": 6255,
"valid_targets_mean": 2101.6,
"valid_targets_min": 817
},
{
"epoch": 6.119257086999022,
"grad_norm": 0.7798497119811234,
"learning_rate": 1.9027947598780127e-06,
"loss": 0.127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14085283875465393,
"step": 6260,
"valid_targets_mean": 2175.4,
"valid_targets_min": 714
},
{
"epoch": 6.124144672531769,
"grad_norm": 0.8683686286891048,
"learning_rate": 1.8820943046625429e-06,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12134305387735367,
"step": 6265,
"valid_targets_mean": 1859.7,
"valid_targets_min": 776
},
{
"epoch": 6.129032258064516,
"grad_norm": 0.8639340556226129,
"learning_rate": 1.861501505008545e-06,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14260660111904144,
"step": 6270,
"valid_targets_mean": 2105.2,
"valid_targets_min": 905
},
{
"epoch": 6.133919843597263,
"grad_norm": 0.7652388086076658,
"learning_rate": 1.8410164832772536e-06,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1462109088897705,
"step": 6275,
"valid_targets_mean": 2521.6,
"valid_targets_min": 689
},
{
"epoch": 6.13880742913001,
"grad_norm": 0.8599010636007501,
"learning_rate": 1.8206393611895045e-06,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15619584918022156,
"step": 6280,
"valid_targets_mean": 2249.8,
"valid_targets_min": 1113
},
{
"epoch": 6.1436950146627565,
"grad_norm": 0.8398925161179197,
"learning_rate": 1.8003702598249861e-06,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14089694619178772,
"step": 6285,
"valid_targets_mean": 2057.7,
"valid_targets_min": 1225
},
{
"epoch": 6.148582600195503,
"grad_norm": 0.9006101111923522,
"learning_rate": 1.780209299621547e-06,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1570209264755249,
"step": 6290,
"valid_targets_mean": 2732.9,
"valid_targets_min": 922
},
{
"epoch": 6.15347018572825,
"grad_norm": 0.7691620511866091,
"learning_rate": 1.7601566003744631e-06,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1531471312046051,
"step": 6295,
"valid_targets_mean": 2870.6,
"valid_targets_min": 947
},
{
"epoch": 6.158357771260997,
"grad_norm": 0.6860071399944331,
"learning_rate": 1.740212281235727e-06,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13493847846984863,
"step": 6300,
"valid_targets_mean": 3376.0,
"valid_targets_min": 753
},
{
"epoch": 6.163245356793744,
"grad_norm": 0.7541769441863807,
"learning_rate": 1.7203764607133377e-06,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15232732892036438,
"step": 6305,
"valid_targets_mean": 2786.0,
"valid_targets_min": 671
},
{
"epoch": 6.168132942326491,
"grad_norm": 0.7651389425645014,
"learning_rate": 1.7006492566706233e-06,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13763144612312317,
"step": 6310,
"valid_targets_mean": 2695.4,
"valid_targets_min": 1083
},
{
"epoch": 6.173020527859237,
"grad_norm": 0.8366808292024842,
"learning_rate": 1.6810307863254927e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14807304739952087,
"step": 6315,
"valid_targets_mean": 2219.9,
"valid_targets_min": 827
},
{
"epoch": 6.177908113391984,
"grad_norm": 0.8457539648171782,
"learning_rate": 1.6615211662497822e-06,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1576795130968094,
"step": 6320,
"valid_targets_mean": 2348.2,
"valid_targets_min": 757
},
{
"epoch": 6.182795698924731,
"grad_norm": 0.80734473246753,
"learning_rate": 1.6421205123685392e-06,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13625971972942352,
"step": 6325,
"valid_targets_mean": 2120.9,
"valid_targets_min": 806
},
{
"epoch": 6.187683284457478,
"grad_norm": 0.9804288667902588,
"learning_rate": 1.6228289399593334e-06,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14446699619293213,
"step": 6330,
"valid_targets_mean": 1873.2,
"valid_targets_min": 888
},
{
"epoch": 6.192570869990225,
"grad_norm": 0.7529261993671538,
"learning_rate": 1.603646563651604e-06,
"loss": 0.1455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14811274409294128,
"step": 6335,
"valid_targets_mean": 2624.8,
"valid_targets_min": 796
},
{
"epoch": 6.1974584555229715,
"grad_norm": 0.7758608591461221,
"learning_rate": 1.5845734974259207e-06,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13113583624362946,
"step": 6340,
"valid_targets_mean": 2221.9,
"valid_targets_min": 900
},
{
"epoch": 6.202346041055718,
"grad_norm": 0.7977758438125597,
"learning_rate": 1.5656098546133658e-06,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15472404658794403,
"step": 6345,
"valid_targets_mean": 2333.7,
"valid_targets_min": 777
},
{
"epoch": 6.207233626588465,
"grad_norm": 0.7496625060594996,
"learning_rate": 1.5467557478948148e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15827788412570953,
"step": 6350,
"valid_targets_mean": 2944.5,
"valid_targets_min": 659
},
{
"epoch": 6.212121212121212,
"grad_norm": 0.7617727567525714,
"learning_rate": 1.5280112893002908e-06,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13309329748153687,
"step": 6355,
"valid_targets_mean": 2364.3,
"valid_targets_min": 988
},
{
"epoch": 6.217008797653959,
"grad_norm": 0.7687353152394582,
"learning_rate": 1.5093765902083069e-06,
"loss": 0.1404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15288090705871582,
"step": 6360,
"valid_targets_mean": 2643.9,
"valid_targets_min": 697
},
{
"epoch": 6.221896383186706,
"grad_norm": 0.8946465205196672,
"learning_rate": 1.4908517613451778e-06,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14633601903915405,
"step": 6365,
"valid_targets_mean": 2086.7,
"valid_targets_min": 607
},
{
"epoch": 6.226783968719452,
"grad_norm": 0.8280125163578745,
"learning_rate": 1.472436912784374e-06,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13586950302124023,
"step": 6370,
"valid_targets_mean": 2219.1,
"valid_targets_min": 1104
},
{
"epoch": 6.231671554252199,
"grad_norm": 0.9360214005794244,
"learning_rate": 1.4541321539458775e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14993751049041748,
"step": 6375,
"valid_targets_mean": 1659.2,
"valid_targets_min": 686
},
{
"epoch": 6.236559139784946,
"grad_norm": 0.762660547954432,
"learning_rate": 1.4359375935955222e-06,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1589202582836151,
"step": 6380,
"valid_targets_mean": 2716.4,
"valid_targets_min": 668
},
{
"epoch": 6.241446725317693,
"grad_norm": 0.8996541456011813,
"learning_rate": 1.4178533398443507e-06,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14994928240776062,
"step": 6385,
"valid_targets_mean": 1683.6,
"valid_targets_min": 731
},
{
"epoch": 6.24633431085044,
"grad_norm": 0.7402483966290739,
"learning_rate": 1.3998795001479605e-06,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15734237432479858,
"step": 6390,
"valid_targets_mean": 2690.1,
"valid_targets_min": 776
},
{
"epoch": 6.2512218963831865,
"grad_norm": 0.8314893917101926,
"learning_rate": 1.3820161813058786e-06,
"loss": 0.1452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1409616619348526,
"step": 6395,
"valid_targets_mean": 1984.4,
"valid_targets_min": 617
},
{
"epoch": 6.256109481915933,
"grad_norm": 0.7192255814903107,
"learning_rate": 1.3642634894609308e-06,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14671871066093445,
"step": 6400,
"valid_targets_mean": 2923.3,
"valid_targets_min": 567
},
{
"epoch": 6.26099706744868,
"grad_norm": 0.7999646416770593,
"learning_rate": 1.3466215300985996e-06,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13374221324920654,
"step": 6405,
"valid_targets_mean": 2253.6,
"valid_targets_min": 701
},
{
"epoch": 6.265884652981427,
"grad_norm": 0.7701307733257204,
"learning_rate": 1.3290904080464007e-06,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15439356863498688,
"step": 6410,
"valid_targets_mean": 2676.4,
"valid_targets_min": 869
},
{
"epoch": 6.270772238514174,
"grad_norm": 0.717925366016105,
"learning_rate": 1.3116702274732585e-06,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1328277885913849,
"step": 6415,
"valid_targets_mean": 2629.2,
"valid_targets_min": 888
},
{
"epoch": 6.275659824046921,
"grad_norm": 0.8180028485476835,
"learning_rate": 1.2943610918888893e-06,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15177467465400696,
"step": 6420,
"valid_targets_mean": 2332.1,
"valid_targets_min": 680
},
{
"epoch": 6.280547409579667,
"grad_norm": 0.8165966121783467,
"learning_rate": 1.277163104143191e-06,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14720627665519714,
"step": 6425,
"valid_targets_mean": 2315.4,
"valid_targets_min": 934
},
{
"epoch": 6.285434995112414,
"grad_norm": 0.8235251951027993,
"learning_rate": 1.2600763664256288e-06,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15732279419898987,
"step": 6430,
"valid_targets_mean": 2338.2,
"valid_targets_min": 719
},
{
"epoch": 6.290322580645161,
"grad_norm": 0.8537813636704863,
"learning_rate": 1.2431009802646177e-06,
"loss": 0.1495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15671692788600922,
"step": 6435,
"valid_targets_mean": 2427.2,
"valid_targets_min": 614
},
{
"epoch": 6.295210166177908,
"grad_norm": 0.7787776965511892,
"learning_rate": 1.2262370465269368e-06,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14795002341270447,
"step": 6440,
"valid_targets_mean": 2533.7,
"valid_targets_min": 867
},
{
"epoch": 6.300097751710655,
"grad_norm": 0.7466171619616006,
"learning_rate": 1.2094846654171133e-06,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1360429972410202,
"step": 6445,
"valid_targets_mean": 2684.0,
"valid_targets_min": 930
},
{
"epoch": 6.3049853372434015,
"grad_norm": 0.8453955068732553,
"learning_rate": 1.1928439364768418e-06,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1500052511692047,
"step": 6450,
"valid_targets_mean": 2271.9,
"valid_targets_min": 656
},
{
"epoch": 6.309872922776148,
"grad_norm": 0.7381224772665309,
"learning_rate": 1.176314958584388e-06,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1459953933954239,
"step": 6455,
"valid_targets_mean": 2728.8,
"valid_targets_min": 945
},
{
"epoch": 6.314760508308895,
"grad_norm": 0.7664923578206903,
"learning_rate": 1.1598978299539886e-06,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11979406327009201,
"step": 6460,
"valid_targets_mean": 2113.8,
"valid_targets_min": 740
},
{
"epoch": 6.319648093841642,
"grad_norm": 0.774864233400857,
"learning_rate": 1.143592648135292e-06,
"loss": 0.1475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13750594854354858,
"step": 6465,
"valid_targets_mean": 2761.6,
"valid_targets_min": 847
},
{
"epoch": 6.324535679374389,
"grad_norm": 0.887880805842084,
"learning_rate": 1.1273995100127478e-06,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1429017186164856,
"step": 6470,
"valid_targets_mean": 1817.9,
"valid_targets_min": 739
},
{
"epoch": 6.329423264907136,
"grad_norm": 0.7426599652356065,
"learning_rate": 1.1113185118050662e-06,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1407342255115509,
"step": 6475,
"valid_targets_mean": 2687.5,
"valid_targets_min": 830
},
{
"epoch": 6.334310850439882,
"grad_norm": 0.8069295804769829,
"learning_rate": 1.0953497490646204e-06,
"loss": 0.1356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1433069258928299,
"step": 6480,
"valid_targets_mean": 2190.9,
"valid_targets_min": 635
},
{
"epoch": 6.339198435972629,
"grad_norm": 0.7177391118014483,
"learning_rate": 1.0794933166768828e-06,
"loss": 0.1408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1430281698703766,
"step": 6485,
"valid_targets_mean": 3095.9,
"valid_targets_min": 770
},
{
"epoch": 6.344086021505376,
"grad_norm": 0.7687796424872444,
"learning_rate": 1.063749308859876e-06,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13334771990776062,
"step": 6490,
"valid_targets_mean": 2388.4,
"valid_targets_min": 966
},
{
"epoch": 6.348973607038123,
"grad_norm": 0.7612117876020217,
"learning_rate": 1.0481178191635876e-06,
"loss": 0.1404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1389297991991043,
"step": 6495,
"valid_targets_mean": 2652.2,
"valid_targets_min": 777
},
{
"epoch": 6.35386119257087,
"grad_norm": 0.7514521694555615,
"learning_rate": 1.0325989404694424e-06,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16383954882621765,
"step": 6500,
"valid_targets_mean": 2935.7,
"valid_targets_min": 1179
},
{
"epoch": 6.3587487781036165,
"grad_norm": 0.8203426377026969,
"learning_rate": 1.017192764989734e-06,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15453344583511353,
"step": 6505,
"valid_targets_mean": 2347.6,
"valid_targets_min": 721
},
{
"epoch": 6.363636363636363,
"grad_norm": 0.8292620788591387,
"learning_rate": 1.001899384267071e-06,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15466228127479553,
"step": 6510,
"valid_targets_mean": 2221.9,
"valid_targets_min": 750
},
{
"epoch": 6.36852394916911,
"grad_norm": 0.829931504832341,
"learning_rate": 9.867188891738544e-07,
"loss": 0.1325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13335032761096954,
"step": 6515,
"valid_targets_mean": 2455.7,
"valid_targets_min": 1143
},
{
"epoch": 6.373411534701857,
"grad_norm": 0.7012016461939861,
"learning_rate": 9.716513699117148e-07,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12033946067094803,
"step": 6520,
"valid_targets_mean": 2587.4,
"valid_targets_min": 1035
},
{
"epoch": 6.378299120234604,
"grad_norm": 0.7608167779950807,
"learning_rate": 9.56696916010995e-07,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15372420847415924,
"step": 6525,
"valid_targets_mean": 2700.6,
"valid_targets_min": 1255
},
{
"epoch": 6.383186705767351,
"grad_norm": 0.7875236266722555,
"learning_rate": 9.418556163302073e-07,
"loss": 0.1376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1496465802192688,
"step": 6530,
"valid_targets_mean": 2373.9,
"valid_targets_min": 950
},
{
"epoch": 6.388074291300097,
"grad_norm": 0.9345295844327403,
"learning_rate": 9.271275590555073e-07,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13679920136928558,
"step": 6535,
"valid_targets_mean": 2371.4,
"valid_targets_min": 744
},
{
"epoch": 6.392961876832844,
"grad_norm": 0.8165642457777276,
"learning_rate": 9.125128317001653e-07,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14877143502235413,
"step": 6540,
"valid_targets_mean": 2413.6,
"valid_targets_min": 692
},
{
"epoch": 6.397849462365591,
"grad_norm": 0.8293551530994266,
"learning_rate": 8.980115211040607e-07,
"loss": 0.1359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12983205914497375,
"step": 6545,
"valid_targets_mean": 1852.1,
"valid_targets_min": 635
},
{
"epoch": 6.402737047898338,
"grad_norm": 0.8185584829200172,
"learning_rate": 8.836237134331527e-07,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1399831473827362,
"step": 6550,
"valid_targets_mean": 2156.9,
"valid_targets_min": 878
},
{
"epoch": 6.407624633431085,
"grad_norm": 0.8752733032904388,
"learning_rate": 8.693494941789748e-07,
"loss": 0.1352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14943121373653412,
"step": 6555,
"valid_targets_mean": 2125.4,
"valid_targets_min": 791
},
{
"epoch": 6.4125122189638315,
"grad_norm": 0.771428128135249,
"learning_rate": 8.551889481581255e-07,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13312771916389465,
"step": 6560,
"valid_targets_mean": 2736.9,
"valid_targets_min": 1206
},
{
"epoch": 6.417399804496578,
"grad_norm": 0.8363887006600691,
"learning_rate": 8.411421595117519e-07,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1484169363975525,
"step": 6565,
"valid_targets_mean": 2258.8,
"valid_targets_min": 612
},
{
"epoch": 6.422287390029325,
"grad_norm": 0.841896164198332,
"learning_rate": 8.272092117050778e-07,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14031308889389038,
"step": 6570,
"valid_targets_mean": 2081.2,
"valid_targets_min": 741
},
{
"epoch": 6.427174975562072,
"grad_norm": 0.8344208378276725,
"learning_rate": 8.133901875268813e-07,
"loss": 0.142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16051240265369415,
"step": 6575,
"valid_targets_mean": 2340.0,
"valid_targets_min": 793
},
{
"epoch": 6.432062561094819,
"grad_norm": 0.739011240056262,
"learning_rate": 7.996851690890195e-07,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1327826976776123,
"step": 6580,
"valid_targets_mean": 2467.3,
"valid_targets_min": 1040
},
{
"epoch": 6.436950146627566,
"grad_norm": 0.8388926850354799,
"learning_rate": 7.860942378259251e-07,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13930006325244904,
"step": 6585,
"valid_targets_mean": 2314.1,
"valid_targets_min": 687
},
{
"epoch": 6.441837732160312,
"grad_norm": 0.736849529441786,
"learning_rate": 7.726174744941351e-07,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1561793088912964,
"step": 6590,
"valid_targets_mean": 3114.3,
"valid_targets_min": 1144
},
{
"epoch": 6.446725317693059,
"grad_norm": 0.7374996366190613,
"learning_rate": 7.592549591718091e-07,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14413076639175415,
"step": 6595,
"valid_targets_mean": 3133.8,
"valid_targets_min": 1182
},
{
"epoch": 6.451612903225806,
"grad_norm": 0.8220802356280166,
"learning_rate": 7.460067712582519e-07,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1294611543416977,
"step": 6600,
"valid_targets_mean": 2196.5,
"valid_targets_min": 712
},
{
"epoch": 6.456500488758553,
"grad_norm": 0.7893984126724283,
"learning_rate": 7.328729894734388e-07,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1567493975162506,
"step": 6605,
"valid_targets_mean": 2438.6,
"valid_targets_min": 703
},
{
"epoch": 6.4613880742913,
"grad_norm": 0.8117586298458785,
"learning_rate": 7.198536918575527e-07,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1428253948688507,
"step": 6610,
"valid_targets_mean": 2303.7,
"valid_targets_min": 632
},
{
"epoch": 6.4662756598240465,
"grad_norm": 0.7826755426811578,
"learning_rate": 7.069489557705145e-07,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15663695335388184,
"step": 6615,
"valid_targets_mean": 2520.6,
"valid_targets_min": 655
},
{
"epoch": 6.471163245356793,
"grad_norm": 0.8284462615884153,
"learning_rate": 6.941588578915315e-07,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1673087477684021,
"step": 6620,
"valid_targets_mean": 2560.1,
"valid_targets_min": 1093
},
{
"epoch": 6.476050830889541,
"grad_norm": 0.6413200188770708,
"learning_rate": 6.814834742186361e-07,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14878563582897186,
"step": 6625,
"valid_targets_mean": 4005.8,
"valid_targets_min": 696
},
{
"epoch": 6.480938416422287,
"grad_norm": 0.7615467726204301,
"learning_rate": 6.689228800682301e-07,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14344452321529388,
"step": 6630,
"valid_targets_mean": 2507.8,
"valid_targets_min": 899
},
{
"epoch": 6.485826001955035,
"grad_norm": 0.7837667879512825,
"learning_rate": 6.564771500746525e-07,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13829047977924347,
"step": 6635,
"valid_targets_mean": 2337.0,
"valid_targets_min": 800
},
{
"epoch": 6.490713587487781,
"grad_norm": 0.7681966736659308,
"learning_rate": 6.441463581897167e-07,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1388791799545288,
"step": 6640,
"valid_targets_mean": 2536.2,
"valid_targets_min": 960
},
{
"epoch": 6.495601173020528,
"grad_norm": 0.7657991833749364,
"learning_rate": 6.319305776822848e-07,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13757102191448212,
"step": 6645,
"valid_targets_mean": 2367.8,
"valid_targets_min": 720
},
{
"epoch": 6.500488758553274,
"grad_norm": 0.8617641880740021,
"learning_rate": 6.198298811378278e-07,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1516299545764923,
"step": 6650,
"valid_targets_mean": 2099.6,
"valid_targets_min": 627
},
{
"epoch": 6.505376344086022,
"grad_norm": 0.8509825074669289,
"learning_rate": 6.078443404579948e-07,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.160349503159523,
"step": 6655,
"valid_targets_mean": 2118.5,
"valid_targets_min": 764
},
{
"epoch": 6.510263929618768,
"grad_norm": 0.7385237771877197,
"learning_rate": 5.959740268601843e-07,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14553092420101166,
"step": 6660,
"valid_targets_mean": 2765.1,
"valid_targets_min": 799
},
{
"epoch": 6.515151515151516,
"grad_norm": 0.7414225190431922,
"learning_rate": 5.842190108771206e-07,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.158996120095253,
"step": 6665,
"valid_targets_mean": 2852.4,
"valid_targets_min": 1218
},
{
"epoch": 6.5200391006842615,
"grad_norm": 0.9920100082894623,
"learning_rate": 5.725793623564379e-07,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.143795907497406,
"step": 6670,
"valid_targets_mean": 2288.8,
"valid_targets_min": 981
},
{
"epoch": 6.524926686217009,
"grad_norm": 0.7440670427532977,
"learning_rate": 5.610551504602657e-07,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1507560908794403,
"step": 6675,
"valid_targets_mean": 2652.2,
"valid_targets_min": 921
},
{
"epoch": 6.529814271749755,
"grad_norm": 0.8286332715981629,
"learning_rate": 5.496464436648108e-07,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13288316130638123,
"step": 6680,
"valid_targets_mean": 1858.8,
"valid_targets_min": 777
},
{
"epoch": 6.534701857282503,
"grad_norm": 0.8232783710376684,
"learning_rate": 5.383533097599558e-07,
"loss": 0.1412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13944336771965027,
"step": 6685,
"valid_targets_mean": 2516.9,
"valid_targets_min": 925
},
{
"epoch": 6.539589442815249,
"grad_norm": 0.7654399610127802,
"learning_rate": 5.271758158488638e-07,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13826604187488556,
"step": 6690,
"valid_targets_mean": 2636.9,
"valid_targets_min": 902
},
{
"epoch": 6.5444770283479965,
"grad_norm": 0.8184911988154895,
"learning_rate": 5.161140283475608e-07,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1462034285068512,
"step": 6695,
"valid_targets_mean": 2207.8,
"valid_targets_min": 710
},
{
"epoch": 6.549364613880742,
"grad_norm": 0.7337833239715681,
"learning_rate": 5.051680129845605e-07,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12600910663604736,
"step": 6700,
"valid_targets_mean": 2454.8,
"valid_targets_min": 864
},
{
"epoch": 6.55425219941349,
"grad_norm": 0.8445779401373558,
"learning_rate": 4.94337834800458e-07,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1528075784444809,
"step": 6705,
"valid_targets_mean": 2297.4,
"valid_targets_min": 716
},
{
"epoch": 6.559139784946236,
"grad_norm": 0.7101947557300763,
"learning_rate": 4.836235581475523e-07,
"loss": 0.1381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12695491313934326,
"step": 6710,
"valid_targets_mean": 2736.0,
"valid_targets_min": 801
},
{
"epoch": 6.564027370478984,
"grad_norm": 0.8639233831130482,
"learning_rate": 4.7302524668946916e-07,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14430125057697296,
"step": 6715,
"valid_targets_mean": 2032.4,
"valid_targets_min": 846
},
{
"epoch": 6.568914956011731,
"grad_norm": 0.7461099525991259,
"learning_rate": 4.6254296340076497e-07,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13411906361579895,
"step": 6720,
"valid_targets_mean": 2808.7,
"valid_targets_min": 648
},
{
"epoch": 6.573802541544477,
"grad_norm": 0.7989702744987931,
"learning_rate": 4.521767705665747e-07,
"loss": 0.1408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15190516412258148,
"step": 6725,
"valid_targets_mean": 2514.4,
"valid_targets_min": 740
},
{
"epoch": 6.578690127077224,
"grad_norm": 0.8220944285398598,
"learning_rate": 4.419267297822205e-07,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1572040170431137,
"step": 6730,
"valid_targets_mean": 2357.9,
"valid_targets_min": 790
},
{
"epoch": 6.583577712609971,
"grad_norm": 0.6585139462243008,
"learning_rate": 4.317929019528566e-07,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13705238699913025,
"step": 6735,
"valid_targets_mean": 3228.4,
"valid_targets_min": 752
},
{
"epoch": 6.588465298142718,
"grad_norm": 0.8169152817627165,
"learning_rate": 4.217753472931141e-07,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.139057457447052,
"step": 6740,
"valid_targets_mean": 2172.5,
"valid_targets_min": 640
},
{
"epoch": 6.593352883675465,
"grad_norm": 0.7809355920094504,
"learning_rate": 4.118741253267322e-07,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14593061804771423,
"step": 6745,
"valid_targets_mean": 2661.4,
"valid_targets_min": 780
},
{
"epoch": 6.5982404692082115,
"grad_norm": 0.7768920952770774,
"learning_rate": 4.020892948862032e-07,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13564547896385193,
"step": 6750,
"valid_targets_mean": 2473.9,
"valid_targets_min": 537
},
{
"epoch": 6.603128054740958,
"grad_norm": 0.7722557323473561,
"learning_rate": 3.9242091411243245e-07,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1392875760793686,
"step": 6755,
"valid_targets_mean": 2471.2,
"valid_targets_min": 790
},
{
"epoch": 6.608015640273705,
"grad_norm": 0.7539682369302184,
"learning_rate": 3.8286904045438553e-07,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1369071751832962,
"step": 6760,
"valid_targets_mean": 2399.9,
"valid_targets_min": 610
},
{
"epoch": 6.612903225806452,
"grad_norm": 0.6424299073579681,
"learning_rate": 3.73433730668753e-07,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13768397271633148,
"step": 6765,
"valid_targets_mean": 3869.8,
"valid_targets_min": 1204
},
{
"epoch": 6.617790811339199,
"grad_norm": 0.6880284888599075,
"learning_rate": 3.641150408196037e-07,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12130261957645416,
"step": 6770,
"valid_targets_mean": 2982.4,
"valid_targets_min": 815
},
{
"epoch": 6.622678396871946,
"grad_norm": 0.8219148218793978,
"learning_rate": 3.5491302627806314e-07,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15362417697906494,
"step": 6775,
"valid_targets_mean": 2819.4,
"valid_targets_min": 919
},
{
"epoch": 6.627565982404692,
"grad_norm": 0.7921515154766982,
"learning_rate": 3.4582774172197576e-07,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13740390539169312,
"step": 6780,
"valid_targets_mean": 2345.8,
"valid_targets_min": 790
},
{
"epoch": 6.632453567937439,
"grad_norm": 0.7739946089387783,
"learning_rate": 3.368592411355831e-07,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1267765611410141,
"step": 6785,
"valid_targets_mean": 2384.4,
"valid_targets_min": 771
},
{
"epoch": 6.637341153470186,
"grad_norm": 0.7562090861343093,
"learning_rate": 3.2800757780920846e-07,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1409822702407837,
"step": 6790,
"valid_targets_mean": 2635.0,
"valid_targets_min": 594
},
{
"epoch": 6.642228739002933,
"grad_norm": 0.8014153886361279,
"learning_rate": 3.192728043389237e-07,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15787863731384277,
"step": 6795,
"valid_targets_mean": 2474.6,
"valid_targets_min": 1065
},
{
"epoch": 6.64711632453568,
"grad_norm": 0.8105759791663855,
"learning_rate": 3.106549726262542e-07,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15971817076206207,
"step": 6800,
"valid_targets_mean": 2614.4,
"valid_targets_min": 1129
},
{
"epoch": 6.6520039100684265,
"grad_norm": 0.7732426818990713,
"learning_rate": 3.0215413387787e-07,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1353302150964737,
"step": 6805,
"valid_targets_mean": 2363.2,
"valid_targets_min": 725
},
{
"epoch": 6.656891495601173,
"grad_norm": 0.6933846730883887,
"learning_rate": 2.937703386052637e-07,
"loss": 0.1379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12826628983020782,
"step": 6810,
"valid_targets_mean": 3215.6,
"valid_targets_min": 821
},
{
"epoch": 6.66177908113392,
"grad_norm": 0.8557865157908506,
"learning_rate": 2.8550363662447347e-07,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1560901701450348,
"step": 6815,
"valid_targets_mean": 2224.4,
"valid_targets_min": 803
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.8732910114888374,
"learning_rate": 2.77354077055767e-07,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.145709827542305,
"step": 6820,
"valid_targets_mean": 2143.8,
"valid_targets_min": 729
},
{
"epoch": 6.671554252199414,
"grad_norm": 0.780368314719552,
"learning_rate": 2.6932170832336016e-07,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14553119242191315,
"step": 6825,
"valid_targets_mean": 2521.6,
"valid_targets_min": 934
},
{
"epoch": 6.676441837732161,
"grad_norm": 0.7148221396324418,
"learning_rate": 2.614065781551345e-07,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1638277769088745,
"step": 6830,
"valid_targets_mean": 3283.7,
"valid_targets_min": 1090
},
{
"epoch": 6.681329423264907,
"grad_norm": 0.7948993329236099,
"learning_rate": 2.5360873358234004e-07,
"loss": 0.1419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14200204610824585,
"step": 6835,
"valid_targets_mean": 2449.1,
"valid_targets_min": 738
},
{
"epoch": 6.686217008797654,
"grad_norm": 0.7070697581069597,
"learning_rate": 2.459282209393243e-07,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1273440271615982,
"step": 6840,
"valid_targets_mean": 2714.1,
"valid_targets_min": 793
},
{
"epoch": 6.691104594330401,
"grad_norm": 0.804428556746242,
"learning_rate": 2.3836508586325246e-07,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13834835588932037,
"step": 6845,
"valid_targets_mean": 2142.0,
"valid_targets_min": 684
},
{
"epoch": 6.695992179863148,
"grad_norm": 0.8003383717639464,
"learning_rate": 2.309193732938453e-07,
"loss": 0.135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15829630196094513,
"step": 6850,
"valid_targets_mean": 2366.2,
"valid_targets_min": 744
},
{
"epoch": 6.700879765395895,
"grad_norm": 0.8634766410996613,
"learning_rate": 2.235911274730973e-07,
"loss": 0.1436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16072383522987366,
"step": 6855,
"valid_targets_mean": 2273.4,
"valid_targets_min": 680
},
{
"epoch": 6.7057673509286415,
"grad_norm": 0.8555538490006295,
"learning_rate": 2.1638039194503246e-07,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15848436951637268,
"step": 6860,
"valid_targets_mean": 2117.4,
"valid_targets_min": 718
},
{
"epoch": 6.710654936461388,
"grad_norm": 0.8279297269051833,
"learning_rate": 2.0928720955542436e-07,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14095677435398102,
"step": 6865,
"valid_targets_mean": 2048.8,
"valid_targets_min": 754
},
{
"epoch": 6.715542521994135,
"grad_norm": 0.7949216593255324,
"learning_rate": 2.0231162245156088e-07,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15973398089408875,
"step": 6870,
"valid_targets_mean": 2616.4,
"valid_targets_min": 898
},
{
"epoch": 6.720430107526882,
"grad_norm": 0.7776529385814106,
"learning_rate": 1.9545367208197995e-07,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13128122687339783,
"step": 6875,
"valid_targets_mean": 2468.4,
"valid_targets_min": 773
},
{
"epoch": 6.725317693059629,
"grad_norm": 0.7470593281900991,
"learning_rate": 1.887133991962342e-07,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13984917104244232,
"step": 6880,
"valid_targets_mean": 2672.4,
"valid_targets_min": 918
},
{
"epoch": 6.730205278592376,
"grad_norm": 0.8327481491216713,
"learning_rate": 1.8209084384464005e-07,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14572235941886902,
"step": 6885,
"valid_targets_mean": 2151.9,
"valid_targets_min": 812
},
{
"epoch": 6.735092864125122,
"grad_norm": 0.7666404720709251,
"learning_rate": 1.7558604537804224e-07,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1454159915447235,
"step": 6890,
"valid_targets_mean": 2545.7,
"valid_targets_min": 759
},
{
"epoch": 6.739980449657869,
"grad_norm": 0.7742410628801816,
"learning_rate": 1.6919904244758311e-07,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15060219168663025,
"step": 6895,
"valid_targets_mean": 2724.8,
"valid_targets_min": 826
},
{
"epoch": 6.744868035190616,
"grad_norm": 0.8696550747312377,
"learning_rate": 1.6292987300446705e-07,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14360955357551575,
"step": 6900,
"valid_targets_mean": 1997.2,
"valid_targets_min": 688
},
{
"epoch": 6.749755620723363,
"grad_norm": 0.669193884708062,
"learning_rate": 1.5677857429974296e-07,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12194126844406128,
"step": 6905,
"valid_targets_mean": 2778.8,
"valid_targets_min": 753
},
{
"epoch": 6.75464320625611,
"grad_norm": 0.8129272991005836,
"learning_rate": 1.507451828840756e-07,
"loss": 0.1381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12596674263477325,
"step": 6910,
"valid_targets_mean": 2184.9,
"valid_targets_min": 533
},
{
"epoch": 6.7595307917888565,
"grad_norm": 0.8272536163498828,
"learning_rate": 1.4482973460753446e-07,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16095013916492462,
"step": 6915,
"valid_targets_mean": 2635.4,
"valid_targets_min": 1072
},
{
"epoch": 6.764418377321603,
"grad_norm": 0.8546760713602463,
"learning_rate": 1.3903226461937424e-07,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1363896131515503,
"step": 6920,
"valid_targets_mean": 2176.2,
"valid_targets_min": 663
},
{
"epoch": 6.76930596285435,
"grad_norm": 0.7403266010437409,
"learning_rate": 1.3335280736783028e-07,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15206800401210785,
"step": 6925,
"valid_targets_mean": 2854.7,
"valid_targets_min": 1169
},
{
"epoch": 6.774193548387097,
"grad_norm": 0.7772690818458694,
"learning_rate": 1.2779139659991224e-07,
"loss": 0.135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1384185254573822,
"step": 6930,
"valid_targets_mean": 2430.2,
"valid_targets_min": 708
},
{
"epoch": 6.779081133919844,
"grad_norm": 0.8678197977791959,
"learning_rate": 1.2234806536120857e-07,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1501295566558838,
"step": 6935,
"valid_targets_mean": 1968.8,
"valid_targets_min": 832
},
{
"epoch": 6.783968719452591,
"grad_norm": 1.006053072526263,
"learning_rate": 1.1702284599568014e-07,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15837866067886353,
"step": 6940,
"valid_targets_mean": 1922.8,
"valid_targets_min": 692
},
{
"epoch": 6.788856304985337,
"grad_norm": 0.7781597084300925,
"learning_rate": 1.1181577014547807e-07,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14804880321025848,
"step": 6945,
"valid_targets_mean": 2636.6,
"valid_targets_min": 874
},
{
"epoch": 6.793743890518084,
"grad_norm": 0.7361777760679318,
"learning_rate": 1.0672686875074834e-07,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12848952412605286,
"step": 6950,
"valid_targets_mean": 2487.4,
"valid_targets_min": 880
},
{
"epoch": 6.798631476050831,
"grad_norm": 0.9048873371832021,
"learning_rate": 1.0175617204945421e-07,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1462620347738266,
"step": 6955,
"valid_targets_mean": 1957.2,
"valid_targets_min": 802
},
{
"epoch": 6.803519061583578,
"grad_norm": 0.8115943754772563,
"learning_rate": 9.690370957718965e-08,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14204561710357666,
"step": 6960,
"valid_targets_mean": 2568.1,
"valid_targets_min": 692
},
{
"epoch": 6.808406647116325,
"grad_norm": 0.7847252093602829,
"learning_rate": 9.216951016701281e-08,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1391274333000183,
"step": 6965,
"valid_targets_mean": 2426.6,
"valid_targets_min": 820
},
{
"epoch": 6.8132942326490715,
"grad_norm": 0.7599174927993604,
"learning_rate": 8.755360194926399e-08,
"loss": 0.1344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15206477046012878,
"step": 6970,
"valid_targets_mean": 2830.7,
"valid_targets_min": 847
},
{
"epoch": 6.818181818181818,
"grad_norm": 0.7366744359812574,
"learning_rate": 8.30560123514057e-08,
"loss": 0.1405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14298483729362488,
"step": 6975,
"valid_targets_mean": 2676.4,
"valid_targets_min": 1298
},
{
"epoch": 6.823069403714565,
"grad_norm": 0.7873925943117703,
"learning_rate": 7.867676809786284e-08,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14373791217803955,
"step": 6980,
"valid_targets_mean": 2348.8,
"valid_targets_min": 737
},
{
"epoch": 6.827956989247312,
"grad_norm": 0.7786043991826431,
"learning_rate": 7.441589520984726e-08,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1594143807888031,
"step": 6985,
"valid_targets_mean": 2935.5,
"valid_targets_min": 921
},
{
"epoch": 6.832844574780059,
"grad_norm": 0.7362339661403121,
"learning_rate": 7.027341900523122e-08,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1562596559524536,
"step": 6990,
"valid_targets_mean": 3039.9,
"valid_targets_min": 1045
},
{
"epoch": 6.837732160312806,
"grad_norm": 0.8183556025387007,
"learning_rate": 6.624936409836524e-08,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15503844618797302,
"step": 6995,
"valid_targets_mean": 2337.7,
"valid_targets_min": 727
},
{
"epoch": 6.842619745845552,
"grad_norm": 0.7856265162452774,
"learning_rate": 6.23437543999561e-08,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1516461968421936,
"step": 7000,
"valid_targets_mean": 2516.7,
"valid_targets_min": 1013
},
{
"epoch": 6.847507331378299,
"grad_norm": 0.7797885305733583,
"learning_rate": 5.855661311691574e-08,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16110171377658844,
"step": 7005,
"valid_targets_mean": 2726.2,
"valid_targets_min": 990
},
{
"epoch": 6.852394916911046,
"grad_norm": 0.8996911264100806,
"learning_rate": 5.4887962752216975e-08,
"loss": 0.1373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14116908609867096,
"step": 7010,
"valid_targets_mean": 2133.9,
"valid_targets_min": 967
},
{
"epoch": 6.857282502443793,
"grad_norm": 0.7855480605188909,
"learning_rate": 5.1337825104775805e-08,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13040246069431305,
"step": 7015,
"valid_targets_mean": 2354.3,
"valid_targets_min": 815
},
{
"epoch": 6.86217008797654,
"grad_norm": 0.778868414355739,
"learning_rate": 4.790622126930489e-08,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16201795637607574,
"step": 7020,
"valid_targets_mean": 2563.2,
"valid_targets_min": 1043
},
{
"epoch": 6.8670576735092865,
"grad_norm": 0.8949061085156262,
"learning_rate": 4.459317163619803e-08,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1284133791923523,
"step": 7025,
"valid_targets_mean": 1841.8,
"valid_targets_min": 958
},
{
"epoch": 6.871945259042033,
"grad_norm": 0.9097660526010823,
"learning_rate": 4.13986958914081e-08,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15148180723190308,
"step": 7030,
"valid_targets_mean": 1931.8,
"valid_targets_min": 679
},
{
"epoch": 6.87683284457478,
"grad_norm": 0.8079953101764225,
"learning_rate": 3.832281301632712e-08,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1472192108631134,
"step": 7035,
"valid_targets_mean": 2672.9,
"valid_targets_min": 670
},
{
"epoch": 6.881720430107527,
"grad_norm": 0.8377820814625377,
"learning_rate": 3.536554128767522e-08,
"loss": 0.1405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11620961874723434,
"step": 7040,
"valid_targets_mean": 1944.7,
"valid_targets_min": 917
},
{
"epoch": 6.886608015640274,
"grad_norm": 0.9780072356339135,
"learning_rate": 3.252689827739186e-08,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13305175304412842,
"step": 7045,
"valid_targets_mean": 1505.8,
"valid_targets_min": 921
},
{
"epoch": 6.891495601173021,
"grad_norm": 0.7630678184839079,
"learning_rate": 2.980690085253368e-08,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14864769577980042,
"step": 7050,
"valid_targets_mean": 2593.9,
"valid_targets_min": 625
},
{
"epoch": 6.896383186705767,
"grad_norm": 0.7665055215312272,
"learning_rate": 2.7205565175167925e-08,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14561477303504944,
"step": 7055,
"valid_targets_mean": 3042.3,
"valid_targets_min": 963
},
{
"epoch": 6.901270772238514,
"grad_norm": 0.7931423401009772,
"learning_rate": 2.472290670228361e-08,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14829900860786438,
"step": 7060,
"valid_targets_mean": 2566.6,
"valid_targets_min": 672
},
{
"epoch": 6.906158357771261,
"grad_norm": 0.7348681150492757,
"learning_rate": 2.2358940185698285e-08,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15821123123168945,
"step": 7065,
"valid_targets_mean": 3052.2,
"valid_targets_min": 1009
},
{
"epoch": 6.911045943304008,
"grad_norm": 0.7851239048108627,
"learning_rate": 2.0113679671960317e-08,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15088459849357605,
"step": 7070,
"valid_targets_mean": 2557.6,
"valid_targets_min": 514
},
{
"epoch": 6.915933528836755,
"grad_norm": 0.7257205703096241,
"learning_rate": 1.7987138502284508e-08,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14671635627746582,
"step": 7075,
"valid_targets_mean": 2951.8,
"valid_targets_min": 1216
},
{
"epoch": 6.9208211143695015,
"grad_norm": 0.7158651863598146,
"learning_rate": 1.5979329312456603e-08,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.156073197722435,
"step": 7080,
"valid_targets_mean": 3083.7,
"valid_targets_min": 987
},
{
"epoch": 6.925708699902248,
"grad_norm": 0.7570891695989537,
"learning_rate": 1.4090264032760037e-08,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.133244588971138,
"step": 7085,
"valid_targets_mean": 2580.4,
"valid_targets_min": 832
},
{
"epoch": 6.930596285434995,
"grad_norm": 0.8832686071227391,
"learning_rate": 1.2319953887918179e-08,
"loss": 0.142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13915324211120605,
"step": 7090,
"valid_targets_mean": 2498.4,
"valid_targets_min": 632
},
{
"epoch": 6.935483870967742,
"grad_norm": 0.7469142291910154,
"learning_rate": 1.0668409397009972e-08,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13527530431747437,
"step": 7095,
"valid_targets_mean": 3218.7,
"valid_targets_min": 794
},
{
"epoch": 6.940371456500489,
"grad_norm": 0.7764886081432477,
"learning_rate": 9.135640373418853e-09,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15149667859077454,
"step": 7100,
"valid_targets_mean": 2654.7,
"valid_targets_min": 1291
},
{
"epoch": 6.945259042033236,
"grad_norm": 0.792380332907017,
"learning_rate": 7.721655924770588e-09,
"loss": 0.142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14253517985343933,
"step": 7105,
"valid_targets_mean": 2680.3,
"valid_targets_min": 1109
},
{
"epoch": 6.9501466275659824,
"grad_norm": 0.8708382788168486,
"learning_rate": 6.426464452879977e-09,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15370717644691467,
"step": 7110,
"valid_targets_mean": 1872.2,
"valid_targets_min": 824
},
{
"epoch": 6.955034213098729,
"grad_norm": 0.7697531302927278,
"learning_rate": 5.250073653702004e-09,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14434030652046204,
"step": 7115,
"valid_targets_mean": 2634.2,
"valid_targets_min": 882
},
{
"epoch": 6.959921798631476,
"grad_norm": 0.909840589624624,
"learning_rate": 4.192490517285208e-09,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1433998942375183,
"step": 7120,
"valid_targets_mean": 1897.3,
"valid_targets_min": 721
},
{
"epoch": 6.964809384164223,
"grad_norm": 0.880665464777133,
"learning_rate": 3.2537213277228364e-09,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15554025769233704,
"step": 7125,
"valid_targets_mean": 2096.7,
"valid_targets_min": 754
},
{
"epoch": 6.96969696969697,
"grad_norm": 0.7411591407393181,
"learning_rate": 2.4337716631328555e-09,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13086152076721191,
"step": 7130,
"valid_targets_mean": 2635.5,
"valid_targets_min": 826
},
{
"epoch": 6.9745845552297165,
"grad_norm": 0.8057506293460369,
"learning_rate": 1.732646395606885e-09,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14949795603752136,
"step": 7135,
"valid_targets_mean": 2405.2,
"valid_targets_min": 748
},
{
"epoch": 6.979472140762463,
"grad_norm": 0.8097660910794996,
"learning_rate": 1.1503496911924316e-09,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.134006530046463,
"step": 7140,
"valid_targets_mean": 2312.4,
"valid_targets_min": 997
},
{
"epoch": 6.98435972629521,
"grad_norm": 0.7666411016932615,
"learning_rate": 6.868850098618041e-10,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1432676464319229,
"step": 7145,
"valid_targets_mean": 2855.9,
"valid_targets_min": 763
},
{
"epoch": 6.989247311827957,
"grad_norm": 0.8085737681168628,
"learning_rate": 3.4225510549656947e-10,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13285693526268005,
"step": 7150,
"valid_targets_mean": 2373.7,
"valid_targets_min": 684
},
{
"epoch": 6.994134897360704,
"grad_norm": 0.6798769668315741,
"learning_rate": 1.1646202586756973e-10,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15072640776634216,
"step": 7155,
"valid_targets_mean": 3628.1,
"valid_targets_min": 1272
},
{
"epoch": 6.999022482893451,
"grad_norm": 0.8430786453318077,
"learning_rate": 9.507112626039316e-12,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11695080995559692,
"step": 7160,
"valid_targets_mean": 2002.8,
"valid_targets_min": 715
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1567835956811905,
"step": 7161,
"total_flos": 1242507420499968.0,
"train_loss": 0.2217263549632857,
"train_runtime": 30173.9773,
"train_samples_per_second": 3.796,
"train_steps_per_second": 0.237,
"valid_targets_mean": 1853.1,
"valid_targets_min": 622
}
],
"logging_steps": 5,
"max_steps": 7161,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1242507420499968.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}