a1-code_feedback / trainer_state.json
EtashGuha's picture
Upload folder using huggingface_hub
2edac2a verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4249,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008237232289950576,
"grad_norm": 18.041129986855786,
"learning_rate": 3.764705882352941e-07,
"loss": 0.7519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8261098861694336,
"step": 5,
"valid_targets_mean": 2174.1,
"valid_targets_min": 693
},
{
"epoch": 0.016474464579901153,
"grad_norm": 14.34905148121762,
"learning_rate": 8.470588235294118e-07,
"loss": 0.7712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7180605530738831,
"step": 10,
"valid_targets_mean": 2644.4,
"valid_targets_min": 287
},
{
"epoch": 0.02471169686985173,
"grad_norm": 15.970319180575778,
"learning_rate": 1.3176470588235296e-06,
"loss": 0.7464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7657804489135742,
"step": 15,
"valid_targets_mean": 2121.8,
"valid_targets_min": 1030
},
{
"epoch": 0.032948929159802305,
"grad_norm": 10.573979142790474,
"learning_rate": 1.7882352941176474e-06,
"loss": 0.6642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5902353525161743,
"step": 20,
"valid_targets_mean": 3019.1,
"valid_targets_min": 388
},
{
"epoch": 0.04118616144975288,
"grad_norm": 6.5189844283078076,
"learning_rate": 2.258823529411765e-06,
"loss": 0.676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6557721495628357,
"step": 25,
"valid_targets_mean": 3073.6,
"valid_targets_min": 1036
},
{
"epoch": 0.04942339373970346,
"grad_norm": 4.427343793861997,
"learning_rate": 2.7294117647058825e-06,
"loss": 0.6411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6275306344032288,
"step": 30,
"valid_targets_mean": 3181.9,
"valid_targets_min": 797
},
{
"epoch": 0.057660626029654036,
"grad_norm": 3.0263978789805233,
"learning_rate": 3.2000000000000003e-06,
"loss": 0.5953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5235786437988281,
"step": 35,
"valid_targets_mean": 2863.2,
"valid_targets_min": 849
},
{
"epoch": 0.06589785831960461,
"grad_norm": 1.8462361669327314,
"learning_rate": 3.670588235294118e-06,
"loss": 0.5154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5156185030937195,
"step": 40,
"valid_targets_mean": 2872.0,
"valid_targets_min": 748
},
{
"epoch": 0.07413509060955518,
"grad_norm": 1.4886243049823848,
"learning_rate": 4.141176470588235e-06,
"loss": 0.4722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4820077419281006,
"step": 45,
"valid_targets_mean": 3115.6,
"valid_targets_min": 1525
},
{
"epoch": 0.08237232289950576,
"grad_norm": 1.0186916863672602,
"learning_rate": 4.611764705882353e-06,
"loss": 0.4663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44742530584335327,
"step": 50,
"valid_targets_mean": 2791.6,
"valid_targets_min": 323
},
{
"epoch": 0.09060955518945635,
"grad_norm": 1.0555979955301744,
"learning_rate": 5.08235294117647e-06,
"loss": 0.5045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5457557439804077,
"step": 55,
"valid_targets_mean": 2666.8,
"valid_targets_min": 636
},
{
"epoch": 0.09884678747940692,
"grad_norm": 0.9431942413892103,
"learning_rate": 5.552941176470589e-06,
"loss": 0.4561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45544564723968506,
"step": 60,
"valid_targets_mean": 2670.2,
"valid_targets_min": 248
},
{
"epoch": 0.1070840197693575,
"grad_norm": 0.9827011262758822,
"learning_rate": 6.023529411764706e-06,
"loss": 0.5112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4421389400959015,
"step": 65,
"valid_targets_mean": 2145.6,
"valid_targets_min": 763
},
{
"epoch": 0.11532125205930807,
"grad_norm": 0.864994814301313,
"learning_rate": 6.494117647058824e-06,
"loss": 0.4383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44878387451171875,
"step": 70,
"valid_targets_mean": 2175.3,
"valid_targets_min": 251
},
{
"epoch": 0.12355848434925865,
"grad_norm": 0.8853263389472636,
"learning_rate": 6.964705882352941e-06,
"loss": 0.497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5232568383216858,
"step": 75,
"valid_targets_mean": 2546.2,
"valid_targets_min": 265
},
{
"epoch": 0.13179571663920922,
"grad_norm": 0.8051192678757433,
"learning_rate": 7.43529411764706e-06,
"loss": 0.4507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45036208629608154,
"step": 80,
"valid_targets_mean": 2913.5,
"valid_targets_min": 735
},
{
"epoch": 0.1400329489291598,
"grad_norm": 0.7677204251168979,
"learning_rate": 7.905882352941176e-06,
"loss": 0.4379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40930110216140747,
"step": 85,
"valid_targets_mean": 2679.2,
"valid_targets_min": 768
},
{
"epoch": 0.14827018121911037,
"grad_norm": 0.7800094242006477,
"learning_rate": 8.376470588235295e-06,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44566720724105835,
"step": 90,
"valid_targets_mean": 3371.6,
"valid_targets_min": 1439
},
{
"epoch": 0.15650741350906094,
"grad_norm": 0.6767591438862864,
"learning_rate": 8.847058823529413e-06,
"loss": 0.4233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38728904724121094,
"step": 95,
"valid_targets_mean": 2819.8,
"valid_targets_min": 585
},
{
"epoch": 0.16474464579901152,
"grad_norm": 0.8131291107995611,
"learning_rate": 9.31764705882353e-06,
"loss": 0.4063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48519647121429443,
"step": 100,
"valid_targets_mean": 2543.0,
"valid_targets_min": 1046
},
{
"epoch": 0.17298187808896212,
"grad_norm": 0.516958608307116,
"learning_rate": 9.788235294117649e-06,
"loss": 0.3894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3352322280406952,
"step": 105,
"valid_targets_mean": 3974.6,
"valid_targets_min": 1106
},
{
"epoch": 0.1812191103789127,
"grad_norm": 0.7099200398129607,
"learning_rate": 1.0258823529411766e-05,
"loss": 0.3724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34124284982681274,
"step": 110,
"valid_targets_mean": 2296.8,
"valid_targets_min": 311
},
{
"epoch": 0.18945634266886327,
"grad_norm": 1.3084249200454359,
"learning_rate": 1.0729411764705884e-05,
"loss": 0.3945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3974684476852417,
"step": 115,
"valid_targets_mean": 2726.6,
"valid_targets_min": 841
},
{
"epoch": 0.19769357495881384,
"grad_norm": 0.7452807970704501,
"learning_rate": 1.1200000000000001e-05,
"loss": 0.4309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42342647910118103,
"step": 120,
"valid_targets_mean": 2717.6,
"valid_targets_min": 955
},
{
"epoch": 0.20593080724876442,
"grad_norm": 0.6071220337631781,
"learning_rate": 1.1670588235294118e-05,
"loss": 0.4154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44350916147232056,
"step": 125,
"valid_targets_mean": 3765.1,
"valid_targets_min": 287
},
{
"epoch": 0.214168039538715,
"grad_norm": 0.6810266168182173,
"learning_rate": 1.2141176470588237e-05,
"loss": 0.423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3277353048324585,
"step": 130,
"valid_targets_mean": 2465.6,
"valid_targets_min": 321
},
{
"epoch": 0.22240527182866557,
"grad_norm": 0.6694184649708005,
"learning_rate": 1.2611764705882354e-05,
"loss": 0.4057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4071721136569977,
"step": 135,
"valid_targets_mean": 3101.9,
"valid_targets_min": 742
},
{
"epoch": 0.23064250411861614,
"grad_norm": 0.6133654529819055,
"learning_rate": 1.3082352941176472e-05,
"loss": 0.4067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32720082998275757,
"step": 140,
"valid_targets_mean": 3069.0,
"valid_targets_min": 1035
},
{
"epoch": 0.23887973640856672,
"grad_norm": 0.7161672984877867,
"learning_rate": 1.355294117647059e-05,
"loss": 0.3678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4013705849647522,
"step": 145,
"valid_targets_mean": 2725.5,
"valid_targets_min": 319
},
{
"epoch": 0.2471169686985173,
"grad_norm": 0.6969489545726383,
"learning_rate": 1.4023529411764706e-05,
"loss": 0.3994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38001126050949097,
"step": 150,
"valid_targets_mean": 3276.0,
"valid_targets_min": 1031
},
{
"epoch": 0.2553542009884679,
"grad_norm": 0.6463131347430592,
"learning_rate": 1.4494117647058825e-05,
"loss": 0.3694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4384726583957672,
"step": 155,
"valid_targets_mean": 3591.8,
"valid_targets_min": 912
},
{
"epoch": 0.26359143327841844,
"grad_norm": 0.6590571572375514,
"learning_rate": 1.4964705882352943e-05,
"loss": 0.3424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31954580545425415,
"step": 160,
"valid_targets_mean": 2965.2,
"valid_targets_min": 839
},
{
"epoch": 0.27182866556836904,
"grad_norm": 0.6582067773489519,
"learning_rate": 1.543529411764706e-05,
"loss": 0.4073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3766615390777588,
"step": 165,
"valid_targets_mean": 3487.7,
"valid_targets_min": 869
},
{
"epoch": 0.2800658978583196,
"grad_norm": 0.6816959560863262,
"learning_rate": 1.5905882352941177e-05,
"loss": 0.3678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38047826290130615,
"step": 170,
"valid_targets_mean": 2549.7,
"valid_targets_min": 821
},
{
"epoch": 0.2883031301482702,
"grad_norm": 0.7251450154291886,
"learning_rate": 1.6376470588235298e-05,
"loss": 0.3865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4638799726963043,
"step": 175,
"valid_targets_mean": 2832.6,
"valid_targets_min": 382
},
{
"epoch": 0.29654036243822074,
"grad_norm": 0.6299448981935337,
"learning_rate": 1.6847058823529414e-05,
"loss": 0.3631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3318817913532257,
"step": 180,
"valid_targets_mean": 2848.6,
"valid_targets_min": 944
},
{
"epoch": 0.30477759472817134,
"grad_norm": 0.6977606582667799,
"learning_rate": 1.731764705882353e-05,
"loss": 0.3772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3715594410896301,
"step": 185,
"valid_targets_mean": 2431.6,
"valid_targets_min": 391
},
{
"epoch": 0.3130148270181219,
"grad_norm": 0.7061245411260707,
"learning_rate": 1.778823529411765e-05,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33297649025917053,
"step": 190,
"valid_targets_mean": 2197.2,
"valid_targets_min": 685
},
{
"epoch": 0.3212520593080725,
"grad_norm": 0.6859289408630844,
"learning_rate": 1.8258823529411765e-05,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3794998824596405,
"step": 195,
"valid_targets_mean": 2878.8,
"valid_targets_min": 304
},
{
"epoch": 0.32948929159802304,
"grad_norm": 0.6130651983492513,
"learning_rate": 1.8729411764705886e-05,
"loss": 0.3828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38770943880081177,
"step": 200,
"valid_targets_mean": 3607.1,
"valid_targets_min": 230
},
{
"epoch": 0.33772652388797364,
"grad_norm": 0.7234411187513314,
"learning_rate": 1.9200000000000003e-05,
"loss": 0.3789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4269868731498718,
"step": 205,
"valid_targets_mean": 2572.0,
"valid_targets_min": 246
},
{
"epoch": 0.34596375617792424,
"grad_norm": 0.5735815243504443,
"learning_rate": 1.967058823529412e-05,
"loss": 0.3501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31644099950790405,
"step": 210,
"valid_targets_mean": 3513.8,
"valid_targets_min": 876
},
{
"epoch": 0.3542009884678748,
"grad_norm": 0.8651887451217208,
"learning_rate": 2.0141176470588236e-05,
"loss": 0.3411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3497444987297058,
"step": 215,
"valid_targets_mean": 1987.6,
"valid_targets_min": 297
},
{
"epoch": 0.3624382207578254,
"grad_norm": 0.6522031387177083,
"learning_rate": 2.0611764705882353e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38645434379577637,
"step": 220,
"valid_targets_mean": 3107.1,
"valid_targets_min": 1099
},
{
"epoch": 0.37067545304777594,
"grad_norm": 0.7920489560748225,
"learning_rate": 2.1082352941176474e-05,
"loss": 0.3672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36695098876953125,
"step": 225,
"valid_targets_mean": 1991.4,
"valid_targets_min": 295
},
{
"epoch": 0.37891268533772654,
"grad_norm": 0.6409036862164285,
"learning_rate": 2.155294117647059e-05,
"loss": 0.3494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2995736598968506,
"step": 230,
"valid_targets_mean": 2558.9,
"valid_targets_min": 1074
},
{
"epoch": 0.3871499176276771,
"grad_norm": 0.6032322601598289,
"learning_rate": 2.2023529411764707e-05,
"loss": 0.3675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39067399501800537,
"step": 235,
"valid_targets_mean": 3427.1,
"valid_targets_min": 1229
},
{
"epoch": 0.3953871499176277,
"grad_norm": 0.640108850824614,
"learning_rate": 2.2494117647058828e-05,
"loss": 0.3517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3539199233055115,
"step": 240,
"valid_targets_mean": 3306.6,
"valid_targets_min": 219
},
{
"epoch": 0.40362438220757824,
"grad_norm": 0.6923591104747878,
"learning_rate": 2.296470588235294e-05,
"loss": 0.3339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25825247168540955,
"step": 245,
"valid_targets_mean": 2549.9,
"valid_targets_min": 271
},
{
"epoch": 0.41186161449752884,
"grad_norm": 0.8803432349351571,
"learning_rate": 2.343529411764706e-05,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40536123514175415,
"step": 250,
"valid_targets_mean": 1919.9,
"valid_targets_min": 226
},
{
"epoch": 0.4200988467874794,
"grad_norm": 0.641574096444431,
"learning_rate": 2.390588235294118e-05,
"loss": 0.3585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35488161444664,
"step": 255,
"valid_targets_mean": 3300.2,
"valid_targets_min": 568
},
{
"epoch": 0.42833607907743,
"grad_norm": 0.6648054089698943,
"learning_rate": 2.4376470588235296e-05,
"loss": 0.3572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3950795531272888,
"step": 260,
"valid_targets_mean": 3831.9,
"valid_targets_min": 563
},
{
"epoch": 0.43657331136738053,
"grad_norm": 0.7333690453284659,
"learning_rate": 2.4847058823529416e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32087090611457825,
"step": 265,
"valid_targets_mean": 2422.1,
"valid_targets_min": 334
},
{
"epoch": 0.44481054365733114,
"grad_norm": 1.0576342544488297,
"learning_rate": 2.5317647058823533e-05,
"loss": 0.356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4411831200122833,
"step": 270,
"valid_targets_mean": 3020.0,
"valid_targets_min": 1122
},
{
"epoch": 0.45304777594728174,
"grad_norm": 0.5404063898551336,
"learning_rate": 2.5788235294117646e-05,
"loss": 0.349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2559725344181061,
"step": 275,
"valid_targets_mean": 3452.1,
"valid_targets_min": 287
},
{
"epoch": 0.4612850082372323,
"grad_norm": 0.6680784878314109,
"learning_rate": 2.6258823529411767e-05,
"loss": 0.3369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3715960383415222,
"step": 280,
"valid_targets_mean": 3149.2,
"valid_targets_min": 1060
},
{
"epoch": 0.4695222405271829,
"grad_norm": 0.6163910100110204,
"learning_rate": 2.6729411764705884e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3177059292793274,
"step": 285,
"valid_targets_mean": 3021.4,
"valid_targets_min": 857
},
{
"epoch": 0.47775947281713343,
"grad_norm": 0.8667382342453931,
"learning_rate": 2.7200000000000004e-05,
"loss": 0.3793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3662949502468109,
"step": 290,
"valid_targets_mean": 2007.4,
"valid_targets_min": 699
},
{
"epoch": 0.48599670510708404,
"grad_norm": 0.7018849627415584,
"learning_rate": 2.767058823529412e-05,
"loss": 0.3619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3931698501110077,
"step": 295,
"valid_targets_mean": 2677.9,
"valid_targets_min": 968
},
{
"epoch": 0.4942339373970346,
"grad_norm": 0.6995387214546374,
"learning_rate": 2.8141176470588238e-05,
"loss": 0.3566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3696545362472534,
"step": 300,
"valid_targets_mean": 2607.9,
"valid_targets_min": 270
},
{
"epoch": 0.5024711696869851,
"grad_norm": 0.6715688200029435,
"learning_rate": 2.8611764705882358e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27885138988494873,
"step": 305,
"valid_targets_mean": 2609.4,
"valid_targets_min": 785
},
{
"epoch": 0.5107084019769358,
"grad_norm": 0.7737861344674672,
"learning_rate": 2.908235294117647e-05,
"loss": 0.3742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4706699550151825,
"step": 310,
"valid_targets_mean": 2705.9,
"valid_targets_min": 162
},
{
"epoch": 0.5189456342668863,
"grad_norm": 0.6334586406962706,
"learning_rate": 2.955294117647059e-05,
"loss": 0.3376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3143928647041321,
"step": 315,
"valid_targets_mean": 3639.9,
"valid_targets_min": 1132
},
{
"epoch": 0.5271828665568369,
"grad_norm": 0.7026900238535507,
"learning_rate": 3.002352941176471e-05,
"loss": 0.3393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3668755292892456,
"step": 320,
"valid_targets_mean": 3119.6,
"valid_targets_min": 896
},
{
"epoch": 0.5354200988467874,
"grad_norm": 0.70858594506907,
"learning_rate": 3.0494117647058826e-05,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42341750860214233,
"step": 325,
"valid_targets_mean": 2856.9,
"valid_targets_min": 716
},
{
"epoch": 0.5436573311367381,
"grad_norm": 0.9050380182770631,
"learning_rate": 3.0964705882352946e-05,
"loss": 0.3229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28868210315704346,
"step": 330,
"valid_targets_mean": 2783.8,
"valid_targets_min": 1080
},
{
"epoch": 0.5518945634266886,
"grad_norm": 0.6793783253890467,
"learning_rate": 3.143529411764706e-05,
"loss": 0.358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3081079125404358,
"step": 335,
"valid_targets_mean": 2909.4,
"valid_targets_min": 905
},
{
"epoch": 0.5601317957166392,
"grad_norm": 0.6531063772093401,
"learning_rate": 3.190588235294118e-05,
"loss": 0.3301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3191760182380676,
"step": 340,
"valid_targets_mean": 2809.9,
"valid_targets_min": 829
},
{
"epoch": 0.5683690280065898,
"grad_norm": 0.8336208889400938,
"learning_rate": 3.23764705882353e-05,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3880823254585266,
"step": 345,
"valid_targets_mean": 2561.3,
"valid_targets_min": 626
},
{
"epoch": 0.5766062602965404,
"grad_norm": 1.1368953862481592,
"learning_rate": 3.2847058823529414e-05,
"loss": 0.3541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27717214822769165,
"step": 350,
"valid_targets_mean": 2409.9,
"valid_targets_min": 831
},
{
"epoch": 0.5848434925864909,
"grad_norm": 0.7026717555920957,
"learning_rate": 3.331764705882353e-05,
"loss": 0.3622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3906007409095764,
"step": 355,
"valid_targets_mean": 2896.1,
"valid_targets_min": 385
},
{
"epoch": 0.5930807248764415,
"grad_norm": 0.6023606367373995,
"learning_rate": 3.378823529411765e-05,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37305983901023865,
"step": 360,
"valid_targets_mean": 3621.6,
"valid_targets_min": 1150
},
{
"epoch": 0.6013179571663921,
"grad_norm": 0.6514047229400881,
"learning_rate": 3.425882352941177e-05,
"loss": 0.3581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29843461513519287,
"step": 365,
"valid_targets_mean": 3057.4,
"valid_targets_min": 1271
},
{
"epoch": 0.6095551894563427,
"grad_norm": 0.5626045279089444,
"learning_rate": 3.472941176470589e-05,
"loss": 0.3145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27968597412109375,
"step": 370,
"valid_targets_mean": 3222.4,
"valid_targets_min": 374
},
{
"epoch": 0.6177924217462932,
"grad_norm": 0.5421510206663698,
"learning_rate": 3.52e-05,
"loss": 0.3319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32853734493255615,
"step": 375,
"valid_targets_mean": 3641.3,
"valid_targets_min": 569
},
{
"epoch": 0.6260296540362438,
"grad_norm": 0.6144302274176291,
"learning_rate": 3.567058823529412e-05,
"loss": 0.3285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33135101199150085,
"step": 380,
"valid_targets_mean": 3392.9,
"valid_targets_min": 1176
},
{
"epoch": 0.6342668863261944,
"grad_norm": 0.5893086168232592,
"learning_rate": 3.614117647058824e-05,
"loss": 0.3337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32672643661499023,
"step": 385,
"valid_targets_mean": 2965.9,
"valid_targets_min": 654
},
{
"epoch": 0.642504118616145,
"grad_norm": 0.6559702753858812,
"learning_rate": 3.6611764705882356e-05,
"loss": 0.3469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30627205967903137,
"step": 390,
"valid_targets_mean": 2923.8,
"valid_targets_min": 737
},
{
"epoch": 0.6507413509060955,
"grad_norm": 0.7743858147760204,
"learning_rate": 3.708235294117647e-05,
"loss": 0.359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4699430465698242,
"step": 395,
"valid_targets_mean": 2655.4,
"valid_targets_min": 857
},
{
"epoch": 0.6589785831960461,
"grad_norm": 0.6333244399993251,
"learning_rate": 3.755294117647059e-05,
"loss": 0.3314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38278141617774963,
"step": 400,
"valid_targets_mean": 2962.8,
"valid_targets_min": 256
},
{
"epoch": 0.6672158154859967,
"grad_norm": 0.6290385348921544,
"learning_rate": 3.802352941176471e-05,
"loss": 0.3252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128456175327301,
"step": 405,
"valid_targets_mean": 2868.9,
"valid_targets_min": 814
},
{
"epoch": 0.6754530477759473,
"grad_norm": 0.9556660046777031,
"learning_rate": 3.849411764705883e-05,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23495997488498688,
"step": 410,
"valid_targets_mean": 3069.1,
"valid_targets_min": 719
},
{
"epoch": 0.6836902800658978,
"grad_norm": 0.6229890597206825,
"learning_rate": 3.8964705882352944e-05,
"loss": 0.385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3396230638027191,
"step": 415,
"valid_targets_mean": 2948.0,
"valid_targets_min": 910
},
{
"epoch": 0.6919275123558485,
"grad_norm": 0.7604982982401985,
"learning_rate": 3.943529411764706e-05,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36150163412094116,
"step": 420,
"valid_targets_mean": 2440.2,
"valid_targets_min": 279
},
{
"epoch": 0.700164744645799,
"grad_norm": 0.6483929715914343,
"learning_rate": 3.990588235294118e-05,
"loss": 0.3206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31857752799987793,
"step": 425,
"valid_targets_mean": 2489.6,
"valid_targets_min": 250
},
{
"epoch": 0.7084019769357496,
"grad_norm": 0.6077661449463507,
"learning_rate": 3.9999892009992835e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35132089257240295,
"step": 430,
"valid_targets_mean": 3160.6,
"valid_targets_min": 711
},
{
"epoch": 0.7166392092257001,
"grad_norm": 0.6568155761335552,
"learning_rate": 3.999945330258739e-05,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3767227828502655,
"step": 435,
"valid_targets_mean": 2791.2,
"valid_targets_min": 378
},
{
"epoch": 0.7248764415156508,
"grad_norm": 0.6549147402066008,
"learning_rate": 3.9998677135805034e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3399823307991028,
"step": 440,
"valid_targets_mean": 2741.8,
"valid_targets_min": 237
},
{
"epoch": 0.7331136738056013,
"grad_norm": 0.6266647101324666,
"learning_rate": 3.999756352274235e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2891290783882141,
"step": 445,
"valid_targets_mean": 2656.9,
"valid_targets_min": 766
},
{
"epoch": 0.7413509060955519,
"grad_norm": 0.7173443868039945,
"learning_rate": 3.9996112482189823e-05,
"loss": 0.3428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35799193382263184,
"step": 450,
"valid_targets_mean": 2232.7,
"valid_targets_min": 281
},
{
"epoch": 0.7495881383855024,
"grad_norm": 0.7475444722849752,
"learning_rate": 3.9994324038631475e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31564396619796753,
"step": 455,
"valid_targets_mean": 2473.4,
"valid_targets_min": 425
},
{
"epoch": 0.7578253706754531,
"grad_norm": 0.7565191294316428,
"learning_rate": 3.999219822224449e-05,
"loss": 0.3607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3808445930480957,
"step": 460,
"valid_targets_mean": 2174.1,
"valid_targets_min": 260
},
{
"epoch": 0.7660626029654036,
"grad_norm": 0.6005283358301972,
"learning_rate": 3.998973506889867e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31527596712112427,
"step": 465,
"valid_targets_mean": 2908.4,
"valid_targets_min": 714
},
{
"epoch": 0.7742998352553542,
"grad_norm": 0.6631763471679214,
"learning_rate": 3.998693462015588e-05,
"loss": 0.3188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2902739346027374,
"step": 470,
"valid_targets_mean": 2522.3,
"valid_targets_min": 440
},
{
"epoch": 0.7825370675453048,
"grad_norm": 0.7214500863472263,
"learning_rate": 3.9983796923269284e-05,
"loss": 0.3284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3250043988227844,
"step": 475,
"valid_targets_mean": 2207.5,
"valid_targets_min": 629
},
{
"epoch": 0.7907742998352554,
"grad_norm": 0.6204766994564088,
"learning_rate": 3.99803220311826e-05,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3031291365623474,
"step": 480,
"valid_targets_mean": 2860.6,
"valid_targets_min": 647
},
{
"epoch": 0.7990115321252059,
"grad_norm": 0.6251122638878225,
"learning_rate": 3.997651000252916e-05,
"loss": 0.3509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3469051718711853,
"step": 485,
"valid_targets_mean": 3213.5,
"valid_targets_min": 317
},
{
"epoch": 0.8072487644151565,
"grad_norm": 0.6183054272635903,
"learning_rate": 3.997236090163097e-05,
"loss": 0.3618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36611422896385193,
"step": 490,
"valid_targets_mean": 3578.0,
"valid_targets_min": 1081
},
{
"epoch": 0.8154859967051071,
"grad_norm": 0.7643699670266144,
"learning_rate": 3.99678747984976e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4362257122993469,
"step": 495,
"valid_targets_mean": 2453.6,
"valid_targets_min": 542
},
{
"epoch": 0.8237232289950577,
"grad_norm": 0.8341652264979282,
"learning_rate": 3.9963051768824996e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26549232006073,
"step": 500,
"valid_targets_mean": 2642.1,
"valid_targets_min": 1008
},
{
"epoch": 0.8319604612850082,
"grad_norm": 0.6792332627863412,
"learning_rate": 3.995789189399421e-05,
"loss": 0.3312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27049073576927185,
"step": 505,
"valid_targets_mean": 2643.8,
"valid_targets_min": 391
},
{
"epoch": 0.8401976935749588,
"grad_norm": 0.6315353366191043,
"learning_rate": 3.995239526107003e-05,
"loss": 0.3141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29464757442474365,
"step": 510,
"valid_targets_mean": 2849.6,
"valid_targets_min": 330
},
{
"epoch": 0.8484349258649094,
"grad_norm": 0.7540062474541283,
"learning_rate": 3.99465619627995e-05,
"loss": 0.3232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3380299508571625,
"step": 515,
"valid_targets_mean": 2119.2,
"valid_targets_min": 567
},
{
"epoch": 0.85667215815486,
"grad_norm": 0.613809876372666,
"learning_rate": 3.994039209761038e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2560957074165344,
"step": 520,
"valid_targets_mean": 3331.9,
"valid_targets_min": 748
},
{
"epoch": 0.8649093904448105,
"grad_norm": 0.6123292685393475,
"learning_rate": 3.993388576960947e-05,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33387625217437744,
"step": 525,
"valid_targets_mean": 3419.0,
"valid_targets_min": 326
},
{
"epoch": 0.8731466227347611,
"grad_norm": 0.5538651672396367,
"learning_rate": 3.9927043088580805e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37178099155426025,
"step": 530,
"valid_targets_mean": 4541.1,
"valid_targets_min": 701
},
{
"epoch": 0.8813838550247117,
"grad_norm": 0.5909393191732646,
"learning_rate": 3.991986416998391e-05,
"loss": 0.3159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3093166947364807,
"step": 535,
"valid_targets_mean": 2899.0,
"valid_targets_min": 397
},
{
"epoch": 0.8896210873146623,
"grad_norm": 0.6546363609842427,
"learning_rate": 3.991234913495177e-05,
"loss": 0.3403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.296301007270813,
"step": 540,
"valid_targets_mean": 2484.8,
"valid_targets_min": 1012
},
{
"epoch": 0.8978583196046128,
"grad_norm": 0.6157315771578695,
"learning_rate": 3.99044981102888e-05,
"loss": 0.3454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3564984202384949,
"step": 545,
"valid_targets_mean": 3432.4,
"valid_targets_min": 832
},
{
"epoch": 0.9060955518945635,
"grad_norm": 0.5853646079194815,
"learning_rate": 3.98963112284687e-05,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27953511476516724,
"step": 550,
"valid_targets_mean": 2949.4,
"valid_targets_min": 677
},
{
"epoch": 0.914332784184514,
"grad_norm": 0.6929994545262912,
"learning_rate": 3.9887788627632266e-05,
"loss": 0.3304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3079501986503601,
"step": 555,
"valid_targets_mean": 2296.4,
"valid_targets_min": 242
},
{
"epoch": 0.9225700164744646,
"grad_norm": 0.6175410466216474,
"learning_rate": 3.9878930451584995e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3442390561103821,
"step": 560,
"valid_targets_mean": 3016.9,
"valid_targets_min": 223
},
{
"epoch": 0.9308072487644151,
"grad_norm": 0.5759924285268283,
"learning_rate": 3.986973684979471e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3262675404548645,
"step": 565,
"valid_targets_mean": 3156.9,
"valid_targets_min": 223
},
{
"epoch": 0.9390444810543658,
"grad_norm": 0.6354650452462268,
"learning_rate": 3.9860207977389e-05,
"loss": 0.3647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4005314111709595,
"step": 570,
"valid_targets_mean": 3261.8,
"valid_targets_min": 718
},
{
"epoch": 0.9472817133443163,
"grad_norm": 0.816503500430313,
"learning_rate": 3.9850343995152634e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29235273599624634,
"step": 575,
"valid_targets_mean": 2347.9,
"valid_targets_min": 307
},
{
"epoch": 0.9555189456342669,
"grad_norm": 0.6708495614164758,
"learning_rate": 3.9840145069524825e-05,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32615166902542114,
"step": 580,
"valid_targets_mean": 2426.5,
"valid_targets_min": 1424
},
{
"epoch": 0.9637561779242174,
"grad_norm": 0.6448102084828288,
"learning_rate": 3.982961137259643e-05,
"loss": 0.3464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3473745882511139,
"step": 585,
"valid_targets_mean": 2862.9,
"valid_targets_min": 382
},
{
"epoch": 0.9719934102141681,
"grad_norm": 0.6252647889505737,
"learning_rate": 3.981874308210705e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31804078817367554,
"step": 590,
"valid_targets_mean": 2728.4,
"valid_targets_min": 647
},
{
"epoch": 0.9802306425041186,
"grad_norm": 0.5871449715572906,
"learning_rate": 3.980754038144202e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31086063385009766,
"step": 595,
"valid_targets_mean": 3214.8,
"valid_targets_min": 251
},
{
"epoch": 0.9884678747940692,
"grad_norm": 0.6461194424571096,
"learning_rate": 3.9796003459629335e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39187324047088623,
"step": 600,
"valid_targets_mean": 2897.5,
"valid_targets_min": 702
},
{
"epoch": 0.9967051070840197,
"grad_norm": 0.6731453411587777,
"learning_rate": 3.978413251133643e-05,
"loss": 0.3463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.304431676864624,
"step": 605,
"valid_targets_mean": 2816.6,
"valid_targets_min": 1209
},
{
"epoch": 1.0049423393739703,
"grad_norm": 0.6830394009205784,
"learning_rate": 3.9771927736866926e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29772090911865234,
"step": 610,
"valid_targets_mean": 2312.0,
"valid_targets_min": 847
},
{
"epoch": 1.013179571663921,
"grad_norm": 0.5982189648576913,
"learning_rate": 3.9759389342157225e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2953491508960724,
"step": 615,
"valid_targets_mean": 3731.6,
"valid_targets_min": 725
},
{
"epoch": 1.0214168039538716,
"grad_norm": 0.6464219651312553,
"learning_rate": 3.974651753877306e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32838666439056396,
"step": 620,
"valid_targets_mean": 2931.8,
"valid_targets_min": 212
},
{
"epoch": 1.029654036243822,
"grad_norm": 0.6819518166567332,
"learning_rate": 3.9733312543905904e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28917109966278076,
"step": 625,
"valid_targets_mean": 2779.7,
"valid_targets_min": 614
},
{
"epoch": 1.0378912685337727,
"grad_norm": 0.6274036687821978,
"learning_rate": 3.971977458036931e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930309772491455,
"step": 630,
"valid_targets_mean": 2777.7,
"valid_targets_min": 293
},
{
"epoch": 1.0461285008237233,
"grad_norm": 0.617268853064774,
"learning_rate": 3.9705903876595167e-05,
"loss": 0.333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34295734763145447,
"step": 635,
"valid_targets_mean": 3084.1,
"valid_targets_min": 938
},
{
"epoch": 1.0543657331136738,
"grad_norm": 0.6419145579444464,
"learning_rate": 3.969170066662982e-05,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29465362429618835,
"step": 640,
"valid_targets_mean": 2784.9,
"valid_targets_min": 1046
},
{
"epoch": 1.0626029654036244,
"grad_norm": 0.5589047587447845,
"learning_rate": 3.967716519013014e-05,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33022594451904297,
"step": 645,
"valid_targets_mean": 4427.2,
"valid_targets_min": 937
},
{
"epoch": 1.0708401976935749,
"grad_norm": 0.821250839806891,
"learning_rate": 3.9662297692359486e-05,
"loss": 0.3201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3356301188468933,
"step": 650,
"valid_targets_mean": 3180.2,
"valid_targets_min": 886
},
{
"epoch": 1.0790774299835255,
"grad_norm": 0.5563507731732716,
"learning_rate": 3.964709842418351e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2440907061100006,
"step": 655,
"valid_targets_mean": 3412.5,
"valid_targets_min": 780
},
{
"epoch": 1.0873146622734762,
"grad_norm": 0.6207510688705554,
"learning_rate": 3.9631567642066036e-05,
"loss": 0.3216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30460572242736816,
"step": 660,
"valid_targets_mean": 3038.8,
"valid_targets_min": 322
},
{
"epoch": 1.0955518945634266,
"grad_norm": 0.7017906174899363,
"learning_rate": 3.961570560806461e-05,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3034290075302124,
"step": 665,
"valid_targets_mean": 2448.2,
"valid_targets_min": 244
},
{
"epoch": 1.1037891268533773,
"grad_norm": 0.6601151517121949,
"learning_rate": 3.959951258982616e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31534379720687866,
"step": 670,
"valid_targets_mean": 2649.9,
"valid_targets_min": 790
},
{
"epoch": 1.112026359143328,
"grad_norm": 0.6564702714451534,
"learning_rate": 3.958298886058244e-05,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642975151538849,
"step": 675,
"valid_targets_mean": 2336.2,
"valid_targets_min": 915
},
{
"epoch": 1.1202635914332784,
"grad_norm": 0.7154383695421775,
"learning_rate": 3.956613469914546e-05,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3255589008331299,
"step": 680,
"valid_targets_mean": 2366.6,
"valid_targets_min": 862
},
{
"epoch": 1.128500823723229,
"grad_norm": 0.8969246671748706,
"learning_rate": 3.95489503899027e-05,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32357919216156006,
"step": 685,
"valid_targets_mean": 2685.2,
"valid_targets_min": 202
},
{
"epoch": 1.1367380560131797,
"grad_norm": 0.6519391757431306,
"learning_rate": 3.9531436222812434e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2531551718711853,
"step": 690,
"valid_targets_mean": 2837.1,
"valid_targets_min": 750
},
{
"epoch": 1.1449752883031301,
"grad_norm": 0.6259788308504319,
"learning_rate": 3.951359249339872e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27987170219421387,
"step": 695,
"valid_targets_mean": 2745.1,
"valid_targets_min": 866
},
{
"epoch": 1.1532125205930808,
"grad_norm": 0.6978771465302991,
"learning_rate": 3.9495419502746485e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3704025149345398,
"step": 700,
"valid_targets_mean": 2759.8,
"valid_targets_min": 846
},
{
"epoch": 1.1614497528830312,
"grad_norm": 0.5939150143068824,
"learning_rate": 3.9476917557496406e-05,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28111281991004944,
"step": 705,
"valid_targets_mean": 3140.9,
"valid_targets_min": 831
},
{
"epoch": 1.1696869851729819,
"grad_norm": 0.6245181056230996,
"learning_rate": 3.945808696983977e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27186596393585205,
"step": 710,
"valid_targets_mean": 3023.4,
"valid_targets_min": 1342
},
{
"epoch": 1.1779242174629325,
"grad_norm": 0.6803023490819639,
"learning_rate": 3.943892805751318e-05,
"loss": 0.2826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31058281660079956,
"step": 715,
"valid_targets_mean": 2626.4,
"valid_targets_min": 765
},
{
"epoch": 1.186161449752883,
"grad_norm": 0.6833347407466104,
"learning_rate": 3.941944114379321e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29879602789878845,
"step": 720,
"valid_targets_mean": 2617.1,
"valid_targets_min": 438
},
{
"epoch": 1.1943986820428336,
"grad_norm": 0.7184104527406685,
"learning_rate": 3.939962655749092e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28567400574684143,
"step": 725,
"valid_targets_mean": 3099.2,
"valid_targets_min": 817
},
{
"epoch": 1.2026359143327843,
"grad_norm": 0.5458746613899529,
"learning_rate": 3.937948463294636e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22731509804725647,
"step": 730,
"valid_targets_mean": 3388.2,
"valid_targets_min": 297
},
{
"epoch": 1.2108731466227347,
"grad_norm": 0.54504544091912,
"learning_rate": 3.935901571002288e-05,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33203086256980896,
"step": 735,
"valid_targets_mean": 4777.1,
"valid_targets_min": 1301
},
{
"epoch": 1.2191103789126854,
"grad_norm": 0.6106385198867497,
"learning_rate": 3.9338220134101426e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3434884548187256,
"step": 740,
"valid_targets_mean": 3176.8,
"valid_targets_min": 789
},
{
"epoch": 1.227347611202636,
"grad_norm": 0.632041382439529,
"learning_rate": 3.931709825607469e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28263598680496216,
"step": 745,
"valid_targets_mean": 2709.9,
"valid_targets_min": 749
},
{
"epoch": 1.2355848434925865,
"grad_norm": 0.6654709061054238,
"learning_rate": 3.9295650432341195e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2941563129425049,
"step": 750,
"valid_targets_mean": 2752.9,
"valid_targets_min": 569
},
{
"epoch": 1.2438220757825371,
"grad_norm": 0.5691752162475886,
"learning_rate": 3.927387702479931e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27349454164505005,
"step": 755,
"valid_targets_mean": 3335.9,
"valid_targets_min": 698
},
{
"epoch": 1.2520593080724876,
"grad_norm": 0.639705746497503,
"learning_rate": 3.925177840084109e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2904908061027527,
"step": 760,
"valid_targets_mean": 2948.4,
"valid_targets_min": 1389
},
{
"epoch": 1.2602965403624382,
"grad_norm": 0.6452781995342208,
"learning_rate": 3.922935493334614e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24950724840164185,
"step": 765,
"valid_targets_mean": 2633.5,
"valid_targets_min": 245
},
{
"epoch": 1.2685337726523889,
"grad_norm": 0.6556539492801983,
"learning_rate": 3.920660700067526e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3787687122821808,
"step": 770,
"valid_targets_mean": 3176.0,
"valid_targets_min": 1059
},
{
"epoch": 1.2767710049423393,
"grad_norm": 0.6614063472129723,
"learning_rate": 3.9183534986664094e-05,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30761298537254333,
"step": 775,
"valid_targets_mean": 2789.6,
"valid_targets_min": 607
},
{
"epoch": 1.28500823723229,
"grad_norm": 0.5321065467089631,
"learning_rate": 3.9160139280616674e-05,
"loss": 0.3002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3060571551322937,
"step": 780,
"valid_targets_mean": 4055.0,
"valid_targets_min": 1195
},
{
"epoch": 1.2932454695222404,
"grad_norm": 0.6354469805842081,
"learning_rate": 3.9136420277298795e-05,
"loss": 0.3141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.268049955368042,
"step": 785,
"valid_targets_mean": 2501.8,
"valid_targets_min": 1260
},
{
"epoch": 1.301482701812191,
"grad_norm": 0.743079520777049,
"learning_rate": 3.911237837693141e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2993124723434448,
"step": 790,
"valid_targets_mean": 2397.9,
"valid_targets_min": 702
},
{
"epoch": 1.3097199341021417,
"grad_norm": 0.6922482501855028,
"learning_rate": 3.9088013985183836e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3406824767589569,
"step": 795,
"valid_targets_mean": 2366.7,
"valid_targets_min": 334
},
{
"epoch": 1.3179571663920924,
"grad_norm": 0.6649210661228457,
"learning_rate": 3.9063327513166945e-05,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3096727430820465,
"step": 800,
"valid_targets_mean": 2671.3,
"valid_targets_min": 331
},
{
"epoch": 1.3261943986820428,
"grad_norm": 0.7476716763557605,
"learning_rate": 3.9038319377426186e-05,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2687912583351135,
"step": 805,
"valid_targets_mean": 2750.8,
"valid_targets_min": 1079
},
{
"epoch": 1.3344316309719935,
"grad_norm": 0.7202214301792093,
"learning_rate": 3.9012989999934595e-05,
"loss": 0.2848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25632429122924805,
"step": 810,
"valid_targets_mean": 2071.9,
"valid_targets_min": 336
},
{
"epoch": 1.342668863261944,
"grad_norm": 0.7285006052829752,
"learning_rate": 3.898733980808565e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2646828293800354,
"step": 815,
"valid_targets_mean": 1977.5,
"valid_targets_min": 685
},
{
"epoch": 1.3509060955518946,
"grad_norm": 0.5637166344318452,
"learning_rate": 3.896136923468607e-05,
"loss": 0.2982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26190030574798584,
"step": 820,
"valid_targets_mean": 3011.3,
"valid_targets_min": 321
},
{
"epoch": 1.3591433278418452,
"grad_norm": 0.6680895688573001,
"learning_rate": 3.8935078717948507e-05,
"loss": 0.3126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34075266122817993,
"step": 825,
"valid_targets_mean": 2643.4,
"valid_targets_min": 685
},
{
"epoch": 1.3673805601317957,
"grad_norm": 0.6343514611286315,
"learning_rate": 3.890846870148416e-05,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2886373698711395,
"step": 830,
"valid_targets_mean": 2637.9,
"valid_targets_min": 915
},
{
"epoch": 1.3756177924217463,
"grad_norm": 0.6380139244277822,
"learning_rate": 3.8881539634295287e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33058857917785645,
"step": 835,
"valid_targets_mean": 2910.9,
"valid_targets_min": 627
},
{
"epoch": 1.3838550247116967,
"grad_norm": 0.6309951441851109,
"learning_rate": 3.88542919707676e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25456634163856506,
"step": 840,
"valid_targets_mean": 3141.1,
"valid_targets_min": 1207
},
{
"epoch": 1.3920922570016474,
"grad_norm": 0.631875618821807,
"learning_rate": 3.882672617066266e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26138928532600403,
"step": 845,
"valid_targets_mean": 2551.6,
"valid_targets_min": 803
},
{
"epoch": 1.400329489291598,
"grad_norm": 0.6937940108661667,
"learning_rate": 3.8798842699110075e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2633447051048279,
"step": 850,
"valid_targets_mean": 2452.7,
"valid_targets_min": 858
},
{
"epoch": 1.4085667215815487,
"grad_norm": 0.550875012894034,
"learning_rate": 3.877064202659964e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30909478664398193,
"step": 855,
"valid_targets_mean": 3598.6,
"valid_targets_min": 867
},
{
"epoch": 1.4168039538714992,
"grad_norm": 0.7341957843695258,
"learning_rate": 3.874212462897343e-05,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32587555050849915,
"step": 860,
"valid_targets_mean": 2998.2,
"valid_targets_min": 187
},
{
"epoch": 1.4250411861614498,
"grad_norm": 0.564651910132328,
"learning_rate": 3.871329098741776e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27226191759109497,
"step": 865,
"valid_targets_mean": 2943.2,
"valid_targets_min": 1012
},
{
"epoch": 1.4332784184514002,
"grad_norm": 0.6486502156947155,
"learning_rate": 3.8684141588455076e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2052830308675766,
"step": 870,
"valid_targets_mean": 2074.1,
"valid_targets_min": 290
},
{
"epoch": 1.441515650741351,
"grad_norm": 0.6013453446093197,
"learning_rate": 3.865467692393571e-05,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24652577936649323,
"step": 875,
"valid_targets_mean": 2540.7,
"valid_targets_min": 746
},
{
"epoch": 1.4497528830313016,
"grad_norm": 0.5514571107088988,
"learning_rate": 3.862489749102963e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31356847286224365,
"step": 880,
"valid_targets_mean": 3385.4,
"valid_targets_min": 767
},
{
"epoch": 1.457990115321252,
"grad_norm": 0.7273008617384937,
"learning_rate": 3.8594803792218e-05,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32229501008987427,
"step": 885,
"valid_targets_mean": 2529.9,
"valid_targets_min": 245
},
{
"epoch": 1.4662273476112027,
"grad_norm": 0.6091081729268533,
"learning_rate": 3.856439633528476e-05,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31231796741485596,
"step": 890,
"valid_targets_mean": 2814.8,
"valid_targets_min": 1098
},
{
"epoch": 1.474464579901153,
"grad_norm": 0.5906549436799012,
"learning_rate": 3.853367563330799e-05,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24671581387519836,
"step": 895,
"valid_targets_mean": 3008.8,
"valid_targets_min": 768
},
{
"epoch": 1.4827018121911038,
"grad_norm": 0.6097661246585641,
"learning_rate": 3.850264220465134e-05,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2906344532966614,
"step": 900,
"valid_targets_mean": 2819.9,
"valid_targets_min": 857
},
{
"epoch": 1.4909390444810544,
"grad_norm": 0.6471614592146676,
"learning_rate": 3.847129657295516e-05,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26892954111099243,
"step": 905,
"valid_targets_mean": 3368.9,
"valid_targets_min": 806
},
{
"epoch": 1.499176276771005,
"grad_norm": 0.6035423144036351,
"learning_rate": 3.843963926712778e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25377434492111206,
"step": 910,
"valid_targets_mean": 2901.8,
"valid_targets_min": 633
},
{
"epoch": 1.5074135090609555,
"grad_norm": 0.7343329864064728,
"learning_rate": 3.840767082133656e-05,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28473225235939026,
"step": 915,
"valid_targets_mean": 2271.8,
"valid_targets_min": 845
},
{
"epoch": 1.515650741350906,
"grad_norm": 0.7136048929578265,
"learning_rate": 3.837539177499882e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3092586398124695,
"step": 920,
"valid_targets_mean": 3439.1,
"valid_targets_min": 811
},
{
"epoch": 1.5238879736408566,
"grad_norm": 0.5393319708825398,
"learning_rate": 3.834280267277279e-05,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33659571409225464,
"step": 925,
"valid_targets_mean": 3570.9,
"valid_targets_min": 1369
},
{
"epoch": 1.5321252059308073,
"grad_norm": 0.5596333567807844,
"learning_rate": 3.830990406454842e-05,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25617244839668274,
"step": 930,
"valid_targets_mean": 2960.6,
"valid_targets_min": 312
},
{
"epoch": 1.540362438220758,
"grad_norm": 0.5510656760962294,
"learning_rate": 3.827669650543805e-05,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.256226509809494,
"step": 935,
"valid_targets_mean": 2793.9,
"valid_targets_min": 248
},
{
"epoch": 1.5485996705107083,
"grad_norm": 0.6314296620321947,
"learning_rate": 3.8243180555767135e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26010096073150635,
"step": 940,
"valid_targets_mean": 2288.9,
"valid_targets_min": 626
},
{
"epoch": 1.556836902800659,
"grad_norm": 0.633916371794186,
"learning_rate": 3.8209356781064686e-05,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26327386498451233,
"step": 945,
"valid_targets_mean": 2440.3,
"valid_targets_min": 253
},
{
"epoch": 1.5650741350906094,
"grad_norm": 0.5989790640609941,
"learning_rate": 3.8175225752053816e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.305331826210022,
"step": 950,
"valid_targets_mean": 2859.9,
"valid_targets_min": 405
},
{
"epoch": 1.57331136738056,
"grad_norm": 0.5603727241833217,
"learning_rate": 3.814078804464205e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24717459082603455,
"step": 955,
"valid_targets_mean": 2985.9,
"valid_targets_min": 836
},
{
"epoch": 1.5815485996705108,
"grad_norm": 0.6330587421810094,
"learning_rate": 3.8106044239911645e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.293704628944397,
"step": 960,
"valid_targets_mean": 2647.1,
"valid_targets_min": 256
},
{
"epoch": 1.5897858319604614,
"grad_norm": 0.7241910589825704,
"learning_rate": 3.8070994924109746e-05,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26694560050964355,
"step": 965,
"valid_targets_mean": 3463.4,
"valid_targets_min": 799
},
{
"epoch": 1.5980230642504119,
"grad_norm": 0.6839216284178794,
"learning_rate": 3.803564068863854e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3023781180381775,
"step": 970,
"valid_targets_mean": 2531.4,
"valid_targets_min": 271
},
{
"epoch": 1.6062602965403623,
"grad_norm": 0.5965662328078362,
"learning_rate": 3.7999982130045246e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28980326652526855,
"step": 975,
"valid_targets_mean": 3020.4,
"valid_targets_min": 869
},
{
"epoch": 1.614497528830313,
"grad_norm": 0.6306332846050356,
"learning_rate": 3.796401985001206e-05,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018638491630554,
"step": 980,
"valid_targets_mean": 2907.6,
"valid_targets_min": 1108
},
{
"epoch": 1.6227347611202636,
"grad_norm": 0.6196308352831952,
"learning_rate": 3.792775445534601e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28585222363471985,
"step": 985,
"valid_targets_mean": 2755.2,
"valid_targets_min": 1110
},
{
"epoch": 1.6309719934102143,
"grad_norm": 0.5061334101918796,
"learning_rate": 3.7891186557968665e-05,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2653998136520386,
"step": 990,
"valid_targets_mean": 3828.8,
"valid_targets_min": 380
},
{
"epoch": 1.6392092257001647,
"grad_norm": 0.5548171900791329,
"learning_rate": 3.785431677490592e-05,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25885725021362305,
"step": 995,
"valid_targets_mean": 3003.2,
"valid_targets_min": 716
},
{
"epoch": 1.6474464579901154,
"grad_norm": 0.544647990594083,
"learning_rate": 3.781714572827746e-05,
"loss": 0.3231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3178400993347168,
"step": 1000,
"valid_targets_mean": 3262.6,
"valid_targets_min": 575
},
{
"epoch": 1.6556836902800658,
"grad_norm": 0.5957620379095658,
"learning_rate": 3.777967404528636e-05,
"loss": 0.315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3391578793525696,
"step": 1005,
"valid_targets_mean": 3305.6,
"valid_targets_min": 224
},
{
"epoch": 1.6639209225700164,
"grad_norm": 0.5831365067144099,
"learning_rate": 3.774190235820843e-05,
"loss": 0.2871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27633339166641235,
"step": 1010,
"valid_targets_mean": 3138.8,
"valid_targets_min": 1102
},
{
"epoch": 1.672158154859967,
"grad_norm": 0.5866526617411725,
"learning_rate": 3.770383130438159e-05,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2521780729293823,
"step": 1015,
"valid_targets_mean": 2772.1,
"valid_targets_min": 899
},
{
"epoch": 1.6803953871499178,
"grad_norm": 0.6617850729419059,
"learning_rate": 3.76654615261951e-05,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2704291045665741,
"step": 1020,
"valid_targets_mean": 2489.5,
"valid_targets_min": 800
},
{
"epoch": 1.6886326194398682,
"grad_norm": 0.6758228599415805,
"learning_rate": 3.7626793671078743e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29394012689590454,
"step": 1025,
"valid_targets_mean": 2479.1,
"valid_targets_min": 475
},
{
"epoch": 1.6968698517298186,
"grad_norm": 0.6302344983972948,
"learning_rate": 3.758782839149187e-05,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2621959447860718,
"step": 1030,
"valid_targets_mean": 2202.9,
"valid_targets_min": 841
},
{
"epoch": 1.7051070840197693,
"grad_norm": 0.7505883002451076,
"learning_rate": 3.754856634491238e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3061571717262268,
"step": 1035,
"valid_targets_mean": 2011.4,
"valid_targets_min": 552
},
{
"epoch": 1.71334431630972,
"grad_norm": 0.6982098895422223,
"learning_rate": 3.75090081938257e-05,
"loss": 0.3261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32887348532676697,
"step": 1040,
"valid_targets_mean": 2548.1,
"valid_targets_min": 264
},
{
"epoch": 1.7215815485996706,
"grad_norm": 0.6826562094159441,
"learning_rate": 3.7469154605713496e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2549431622028351,
"step": 1045,
"valid_targets_mean": 2234.9,
"valid_targets_min": 311
},
{
"epoch": 1.729818780889621,
"grad_norm": 0.6436168602201539,
"learning_rate": 3.742900625304252e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26707977056503296,
"step": 1050,
"valid_targets_mean": 2868.2,
"valid_targets_min": 730
},
{
"epoch": 1.7380560131795717,
"grad_norm": 0.6004930059899968,
"learning_rate": 3.7388563813253194e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33015143871307373,
"step": 1055,
"valid_targets_mean": 3110.4,
"valid_targets_min": 728
},
{
"epoch": 1.7462932454695221,
"grad_norm": 0.5441236234486593,
"learning_rate": 3.7347827968748196e-05,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2715633511543274,
"step": 1060,
"valid_targets_mean": 3396.2,
"valid_targets_min": 935
},
{
"epoch": 1.7545304777594728,
"grad_norm": 0.6675223889236319,
"learning_rate": 3.730679940688094e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3189924657344818,
"step": 1065,
"valid_targets_mean": 2620.6,
"valid_targets_min": 308
},
{
"epoch": 1.7627677100494235,
"grad_norm": 0.6168969110960196,
"learning_rate": 3.7265478819944004e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3395520746707916,
"step": 1070,
"valid_targets_mean": 2912.7,
"valid_targets_min": 985
},
{
"epoch": 1.771004942339374,
"grad_norm": 0.6046464594479612,
"learning_rate": 3.722386690515742e-05,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24619776010513306,
"step": 1075,
"valid_targets_mean": 2565.3,
"valid_targets_min": 936
},
{
"epoch": 1.7792421746293245,
"grad_norm": 0.5733766197797237,
"learning_rate": 3.718196436465693e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24001248180866241,
"step": 1080,
"valid_targets_mean": 3276.8,
"valid_targets_min": 1391
},
{
"epoch": 1.787479406919275,
"grad_norm": 0.5359416776650924,
"learning_rate": 3.713977190548211e-05,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31075796484947205,
"step": 1085,
"valid_targets_mean": 3900.6,
"valid_targets_min": 1288
},
{
"epoch": 1.7957166392092256,
"grad_norm": 0.7891318947723374,
"learning_rate": 3.709729023956448e-05,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24248431622982025,
"step": 1090,
"valid_targets_mean": 2105.8,
"valid_targets_min": 525
},
{
"epoch": 1.8039538714991763,
"grad_norm": 0.4963674547261414,
"learning_rate": 3.705452008371545e-05,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2084948718547821,
"step": 1095,
"valid_targets_mean": 3216.0,
"valid_targets_min": 539
},
{
"epoch": 1.812191103789127,
"grad_norm": 0.6700038145214892,
"learning_rate": 3.701146215961426e-05,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2652949392795563,
"step": 1100,
"valid_targets_mean": 2111.5,
"valid_targets_min": 832
},
{
"epoch": 1.8204283360790774,
"grad_norm": 0.5716232564162521,
"learning_rate": 3.696811719379578e-05,
"loss": 0.27,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3448944389820099,
"step": 1105,
"valid_targets_mean": 3898.4,
"valid_targets_min": 287
},
{
"epoch": 1.828665568369028,
"grad_norm": 0.5998885452948804,
"learning_rate": 3.692448591763827e-05,
"loss": 0.266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2568257451057434,
"step": 1110,
"valid_targets_mean": 2799.3,
"valid_targets_min": 751
},
{
"epoch": 1.8369028006589785,
"grad_norm": 0.7726688835753368,
"learning_rate": 3.6880569067350994e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2870601415634155,
"step": 1115,
"valid_targets_mean": 2597.6,
"valid_targets_min": 275
},
{
"epoch": 1.8451400329489291,
"grad_norm": 0.6739523370370597,
"learning_rate": 3.683636738396187e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.295218288898468,
"step": 1120,
"valid_targets_mean": 2633.4,
"valid_targets_min": 323
},
{
"epoch": 1.8533772652388798,
"grad_norm": 0.5074395074268739,
"learning_rate": 3.6791881613304916e-05,
"loss": 0.2703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2503700256347656,
"step": 1125,
"valid_targets_mean": 3885.8,
"valid_targets_min": 861
},
{
"epoch": 1.8616144975288305,
"grad_norm": 0.6419133897350886,
"learning_rate": 3.674711250600766e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30119603872299194,
"step": 1130,
"valid_targets_mean": 2609.1,
"valid_targets_min": 1010
},
{
"epoch": 1.869851729818781,
"grad_norm": 0.6074389296511881,
"learning_rate": 3.6702060817478524e-05,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2686932682991028,
"step": 1135,
"valid_targets_mean": 2378.4,
"valid_targets_min": 776
},
{
"epoch": 1.8780889621087313,
"grad_norm": 0.6457310520573254,
"learning_rate": 3.6656727307894e-05,
"loss": 0.3014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615449130535126,
"step": 1140,
"valid_targets_mean": 2275.4,
"valid_targets_min": 792
},
{
"epoch": 1.886326194398682,
"grad_norm": 0.6191056984207056,
"learning_rate": 3.6611112742185913e-05,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25483569502830505,
"step": 1145,
"valid_targets_mean": 2271.7,
"valid_targets_min": 352
},
{
"epoch": 1.8945634266886326,
"grad_norm": 0.6246965459645147,
"learning_rate": 3.6565217890028435e-05,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788812816143036,
"step": 1150,
"valid_targets_mean": 2767.0,
"valid_targets_min": 679
},
{
"epoch": 1.9028006589785833,
"grad_norm": 0.656487573533247,
"learning_rate": 3.651904352582514e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3155135214328766,
"step": 1155,
"valid_targets_mean": 2277.2,
"valid_targets_min": 216
},
{
"epoch": 1.9110378912685337,
"grad_norm": 0.6272798767220624,
"learning_rate": 3.647259042869595e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3550041615962982,
"step": 1160,
"valid_targets_mean": 2828.5,
"valid_targets_min": 356
},
{
"epoch": 1.9192751235584844,
"grad_norm": 0.6089019795513212,
"learning_rate": 3.642585938246394e-05,
"loss": 0.2961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3001123070716858,
"step": 1165,
"valid_targets_mean": 2918.1,
"valid_targets_min": 1368
},
{
"epoch": 1.9275123558484348,
"grad_norm": 0.7155478877487227,
"learning_rate": 3.6378851175642166e-05,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31469109654426575,
"step": 1170,
"valid_targets_mean": 2766.4,
"valid_targets_min": 764
},
{
"epoch": 1.9357495881383855,
"grad_norm": 0.5900071227360756,
"learning_rate": 3.63315666014203e-05,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28159189224243164,
"step": 1175,
"valid_targets_mean": 2722.8,
"valid_targets_min": 1564
},
{
"epoch": 1.9439868204283361,
"grad_norm": 0.5720042983430078,
"learning_rate": 3.6284006457651295e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.306449294090271,
"step": 1180,
"valid_targets_mean": 3149.6,
"valid_targets_min": 821
},
{
"epoch": 1.9522240527182868,
"grad_norm": 0.6518952324340549,
"learning_rate": 3.6236171546837936e-05,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28307563066482544,
"step": 1185,
"valid_targets_mean": 2688.5,
"valid_targets_min": 654
},
{
"epoch": 1.9604612850082372,
"grad_norm": 0.5643073151697097,
"learning_rate": 3.618806267611923e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32395491003990173,
"step": 1190,
"valid_targets_mean": 3477.4,
"valid_targets_min": 600
},
{
"epoch": 1.9686985172981877,
"grad_norm": 0.6448164120369934,
"learning_rate": 3.613968065725685e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2536458373069763,
"step": 1195,
"valid_targets_mean": 2676.1,
"valid_targets_min": 942
},
{
"epoch": 1.9769357495881383,
"grad_norm": 2.2836948181723016,
"learning_rate": 3.60910263066214e-05,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24172762036323547,
"step": 1200,
"valid_targets_mean": 2737.7,
"valid_targets_min": 1061
},
{
"epoch": 1.985172981878089,
"grad_norm": 0.5707078354838783,
"learning_rate": 3.604210044517867e-05,
"loss": 0.3117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31775957345962524,
"step": 1205,
"valid_targets_mean": 3227.9,
"valid_targets_min": 992
},
{
"epoch": 1.9934102141680397,
"grad_norm": 0.7989744132116524,
"learning_rate": 3.599290389847576e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4108525514602661,
"step": 1210,
"valid_targets_mean": 3928.9,
"valid_targets_min": 869
},
{
"epoch": 2.0016474464579903,
"grad_norm": 0.6264226403015248,
"learning_rate": 3.594343749662716e-05,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27158790826797485,
"step": 1215,
"valid_targets_mean": 2425.3,
"valid_targets_min": 234
},
{
"epoch": 2.0098846787479405,
"grad_norm": 0.5942699391272229,
"learning_rate": 3.5893702074300745e-05,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23825138807296753,
"step": 1220,
"valid_targets_mean": 2739.1,
"valid_targets_min": 233
},
{
"epoch": 2.018121911037891,
"grad_norm": 0.7236717591594628,
"learning_rate": 3.584369847070369e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27776312828063965,
"step": 1225,
"valid_targets_mean": 2409.8,
"valid_targets_min": 795
},
{
"epoch": 2.026359143327842,
"grad_norm": 0.5761714008930021,
"learning_rate": 3.579342752956829e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2385309338569641,
"step": 1230,
"valid_targets_mean": 3224.9,
"valid_targets_min": 835
},
{
"epoch": 2.0345963756177925,
"grad_norm": 0.5691413404913723,
"learning_rate": 3.574289009913776e-05,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18973645567893982,
"step": 1235,
"valid_targets_mean": 3347.5,
"valid_targets_min": 785
},
{
"epoch": 2.042833607907743,
"grad_norm": 0.6341526990742906,
"learning_rate": 3.5692087032151915e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24696478247642517,
"step": 1240,
"valid_targets_mean": 2765.2,
"valid_targets_min": 334
},
{
"epoch": 2.0510708401976934,
"grad_norm": 0.5063130857062907,
"learning_rate": 3.564101918583274e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24281460046768188,
"step": 1245,
"valid_targets_mean": 4392.6,
"valid_targets_min": 1107
},
{
"epoch": 2.059308072487644,
"grad_norm": 0.6823195765956594,
"learning_rate": 3.5589687421869964e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24046598374843597,
"step": 1250,
"valid_targets_mean": 2668.4,
"valid_targets_min": 879
},
{
"epoch": 2.0675453047775947,
"grad_norm": 0.5891801634089261,
"learning_rate": 3.553809260640653e-05,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24028754234313965,
"step": 1255,
"valid_targets_mean": 3647.4,
"valid_targets_min": 878
},
{
"epoch": 2.0757825370675453,
"grad_norm": 0.560587648872072,
"learning_rate": 3.5486235610023935e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25208956003189087,
"step": 1260,
"valid_targets_mean": 3228.0,
"valid_targets_min": 1006
},
{
"epoch": 2.084019769357496,
"grad_norm": 0.5431257163133473,
"learning_rate": 3.54341173077276e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2619468569755554,
"step": 1265,
"valid_targets_mean": 3691.9,
"valid_targets_min": 1020
},
{
"epoch": 2.0922570016474467,
"grad_norm": 0.6876181195287832,
"learning_rate": 3.5381738578932035e-05,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2359652817249298,
"step": 1270,
"valid_targets_mean": 2196.4,
"valid_targets_min": 896
},
{
"epoch": 2.100494233937397,
"grad_norm": 0.7408152195912641,
"learning_rate": 3.532910030744607e-05,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2573264539241791,
"step": 1275,
"valid_targets_mean": 2346.4,
"valid_targets_min": 297
},
{
"epoch": 2.1087314662273475,
"grad_norm": 0.6103530118299919,
"learning_rate": 3.5276203381457894e-05,
"loss": 0.2616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2797989845275879,
"step": 1280,
"valid_targets_mean": 3206.1,
"valid_targets_min": 674
},
{
"epoch": 2.116968698517298,
"grad_norm": 0.5891608135099099,
"learning_rate": 3.5223048693520094e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2533876597881317,
"step": 1285,
"valid_targets_mean": 3108.0,
"valid_targets_min": 591
},
{
"epoch": 2.125205930807249,
"grad_norm": 0.6208888605283639,
"learning_rate": 3.5169637140534574e-05,
"loss": 0.2491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2187802642583847,
"step": 1290,
"valid_targets_mean": 2592.9,
"valid_targets_min": 281
},
{
"epoch": 2.1334431630971995,
"grad_norm": 0.6676297767164048,
"learning_rate": 3.5115969623737447e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24208733439445496,
"step": 1295,
"valid_targets_mean": 2669.2,
"valid_targets_min": 330
},
{
"epoch": 2.1416803953871497,
"grad_norm": 0.7229124706726481,
"learning_rate": 3.506204704868379e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2806577980518341,
"step": 1300,
"valid_targets_mean": 2626.9,
"valid_targets_min": 349
},
{
"epoch": 2.1499176276771004,
"grad_norm": 0.5658374542999091,
"learning_rate": 3.500787032523242e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21356990933418274,
"step": 1305,
"valid_targets_mean": 3147.4,
"valid_targets_min": 275
},
{
"epoch": 2.158154859967051,
"grad_norm": 0.6089410486353419,
"learning_rate": 3.495344036753048e-05,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27112677693367004,
"step": 1310,
"valid_targets_mean": 3331.5,
"valid_targets_min": 394
},
{
"epoch": 2.1663920922570017,
"grad_norm": 0.6145684158379482,
"learning_rate": 3.489875809399806e-05,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2448844313621521,
"step": 1315,
"valid_targets_mean": 2984.2,
"valid_targets_min": 265
},
{
"epoch": 2.1746293245469523,
"grad_norm": 0.6846498864389476,
"learning_rate": 3.484382442731268e-05,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2414667010307312,
"step": 1320,
"valid_targets_mean": 2606.9,
"valid_targets_min": 644
},
{
"epoch": 2.182866556836903,
"grad_norm": 0.73318481182418,
"learning_rate": 3.4788640294393725e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2895458936691284,
"step": 1325,
"valid_targets_mean": 2585.8,
"valid_targets_min": 216
},
{
"epoch": 2.191103789126853,
"grad_norm": 0.6942685225765722,
"learning_rate": 3.47332066263868e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2770744562149048,
"step": 1330,
"valid_targets_mean": 3022.6,
"valid_targets_min": 242
},
{
"epoch": 2.199341021416804,
"grad_norm": 0.520985364981708,
"learning_rate": 3.467752435864803e-05,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20206497609615326,
"step": 1335,
"valid_targets_mean": 3354.1,
"valid_targets_min": 809
},
{
"epoch": 2.2075782537067545,
"grad_norm": 0.5832089119364511,
"learning_rate": 3.462159443072826e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2927054166793823,
"step": 1340,
"valid_targets_mean": 3694.7,
"valid_targets_min": 948
},
{
"epoch": 2.215815485996705,
"grad_norm": 0.58897748237891,
"learning_rate": 3.456541778635722e-05,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19613176584243774,
"step": 1345,
"valid_targets_mean": 2776.6,
"valid_targets_min": 1254
},
{
"epoch": 2.224052718286656,
"grad_norm": 0.6484887362652936,
"learning_rate": 3.45089953734276e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20931027829647064,
"step": 1350,
"valid_targets_mean": 2288.8,
"valid_targets_min": 297
},
{
"epoch": 2.232289950576606,
"grad_norm": 0.5929321738275963,
"learning_rate": 3.445232814397902e-05,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19637475907802582,
"step": 1355,
"valid_targets_mean": 2361.2,
"valid_targets_min": 912
},
{
"epoch": 2.2405271828665567,
"grad_norm": 0.6012994089232492,
"learning_rate": 3.4395417054182034e-05,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27980607748031616,
"step": 1360,
"valid_targets_mean": 3480.1,
"valid_targets_min": 402
},
{
"epoch": 2.2487644151565074,
"grad_norm": 0.5960949440370955,
"learning_rate": 3.433826306432193e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25292590260505676,
"step": 1365,
"valid_targets_mean": 2758.2,
"valid_targets_min": 886
},
{
"epoch": 2.257001647446458,
"grad_norm": 0.5481540263656652,
"learning_rate": 3.428086713878255e-05,
"loss": 0.2143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18284395337104797,
"step": 1370,
"valid_targets_mean": 3020.9,
"valid_targets_min": 380
},
{
"epoch": 2.2652388797364087,
"grad_norm": 0.6107676338306715,
"learning_rate": 3.422323024603004e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2406243532896042,
"step": 1375,
"valid_targets_mean": 3207.1,
"valid_targets_min": 1181
},
{
"epoch": 2.2734761120263594,
"grad_norm": 0.7818816948424279,
"learning_rate": 3.4165353358596475e-05,
"loss": 0.3273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35243645310401917,
"step": 1380,
"valid_targets_mean": 3005.8,
"valid_targets_min": 688
},
{
"epoch": 2.2817133443163096,
"grad_norm": 0.6375768102457982,
"learning_rate": 3.410723745306348e-05,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23199833929538727,
"step": 1385,
"valid_targets_mean": 2873.8,
"valid_targets_min": 735
},
{
"epoch": 2.2899505766062602,
"grad_norm": 0.7095261625145105,
"learning_rate": 3.404888351004571e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.275643527507782,
"step": 1390,
"valid_targets_mean": 2629.0,
"valid_targets_min": 930
},
{
"epoch": 2.298187808896211,
"grad_norm": 0.5955591755415022,
"learning_rate": 3.3990292514174346e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2331334948539734,
"step": 1395,
"valid_targets_mean": 2833.2,
"valid_targets_min": 776
},
{
"epoch": 2.3064250411861615,
"grad_norm": 0.5761183125798899,
"learning_rate": 3.393146545408047e-05,
"loss": 0.2595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2591421902179718,
"step": 1400,
"valid_targets_mean": 3131.5,
"valid_targets_min": 830
},
{
"epoch": 2.314662273476112,
"grad_norm": 0.646758804736525,
"learning_rate": 3.3872403322378354e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23602330684661865,
"step": 1405,
"valid_targets_mean": 2488.8,
"valid_targets_min": 226
},
{
"epoch": 2.3228995057660624,
"grad_norm": 0.6866011148331042,
"learning_rate": 3.3813107115648745e-05,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3126336634159088,
"step": 1410,
"valid_targets_mean": 2544.7,
"valid_targets_min": 723
},
{
"epoch": 2.331136738056013,
"grad_norm": 0.6346999798467989,
"learning_rate": 3.375357783442205e-05,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2111891508102417,
"step": 1415,
"valid_targets_mean": 2556.5,
"valid_targets_min": 763
},
{
"epoch": 2.3393739703459637,
"grad_norm": 0.6309803885063188,
"learning_rate": 3.369381648316144e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24223890900611877,
"step": 1420,
"valid_targets_mean": 2757.2,
"valid_targets_min": 704
},
{
"epoch": 2.3476112026359144,
"grad_norm": 0.6326584329828758,
"learning_rate": 3.363382407024588e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26198041439056396,
"step": 1425,
"valid_targets_mean": 2648.4,
"valid_targets_min": 1051
},
{
"epoch": 2.355848434925865,
"grad_norm": 0.6361946094436111,
"learning_rate": 3.357360160795317e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2635315954685211,
"step": 1430,
"valid_targets_mean": 2999.0,
"valid_targets_min": 1031
},
{
"epoch": 2.3640856672158153,
"grad_norm": 0.6154578078423868,
"learning_rate": 3.35131501124428e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19209545850753784,
"step": 1435,
"valid_targets_mean": 2452.1,
"valid_targets_min": 679
},
{
"epoch": 2.372322899505766,
"grad_norm": 0.5871616148619758,
"learning_rate": 3.345247060373887e-05,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23240095376968384,
"step": 1440,
"valid_targets_mean": 3175.5,
"valid_targets_min": 700
},
{
"epoch": 2.3805601317957166,
"grad_norm": 0.6841219210951218,
"learning_rate": 3.3391564105712824e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33838337659835815,
"step": 1445,
"valid_targets_mean": 2693.4,
"valid_targets_min": 899
},
{
"epoch": 2.3887973640856672,
"grad_norm": 0.5614836697402698,
"learning_rate": 3.333043164606618e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2738487124443054,
"step": 1450,
"valid_targets_mean": 3429.0,
"valid_targets_min": 951
},
{
"epoch": 2.397034596375618,
"grad_norm": 0.53864317436498,
"learning_rate": 3.3269074256313246e-05,
"loss": 0.244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20876136422157288,
"step": 1455,
"valid_targets_mean": 3511.2,
"valid_targets_min": 751
},
{
"epoch": 2.4052718286655685,
"grad_norm": 0.655242664968237,
"learning_rate": 3.320749297176363e-05,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22833922505378723,
"step": 1460,
"valid_targets_mean": 2380.5,
"valid_targets_min": 346
},
{
"epoch": 2.4135090609555188,
"grad_norm": 0.8232236295806061,
"learning_rate": 3.3145688831504845e-05,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2448880970478058,
"step": 1465,
"valid_targets_mean": 3051.5,
"valid_targets_min": 712
},
{
"epoch": 2.4217462932454694,
"grad_norm": 0.638531424640081,
"learning_rate": 3.308366287838472e-05,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23629572987556458,
"step": 1470,
"valid_targets_mean": 2371.6,
"valid_targets_min": 675
},
{
"epoch": 2.42998352553542,
"grad_norm": 0.6526933180553507,
"learning_rate": 3.302141615899384e-05,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2188447117805481,
"step": 1475,
"valid_targets_mean": 2430.1,
"valid_targets_min": 750
},
{
"epoch": 2.4382207578253707,
"grad_norm": 0.6236160880845308,
"learning_rate": 3.2958949723647875e-05,
"loss": 0.2475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29466351866722107,
"step": 1480,
"valid_targets_mean": 2820.9,
"valid_targets_min": 615
},
{
"epoch": 2.4464579901153214,
"grad_norm": 0.6349685298066351,
"learning_rate": 3.289626462636985e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22705788910388947,
"step": 1485,
"valid_targets_mean": 2800.2,
"valid_targets_min": 638
},
{
"epoch": 2.454695222405272,
"grad_norm": 0.6592423626712279,
"learning_rate": 3.283336192487238e-05,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22058206796646118,
"step": 1490,
"valid_targets_mean": 2350.7,
"valid_targets_min": 743
},
{
"epoch": 2.4629324546952223,
"grad_norm": 0.6228303104982533,
"learning_rate": 3.277024268053978e-05,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24452120065689087,
"step": 1495,
"valid_targets_mean": 3045.2,
"valid_targets_min": 312
},
{
"epoch": 2.471169686985173,
"grad_norm": 0.6786946251861339,
"learning_rate": 3.2706907958410234e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24040010571479797,
"step": 1500,
"valid_targets_mean": 2688.6,
"valid_targets_min": 1069
},
{
"epoch": 2.4794069192751236,
"grad_norm": 0.56494805323628,
"learning_rate": 3.2643358827157724e-05,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2005000114440918,
"step": 1505,
"valid_targets_mean": 3374.3,
"valid_targets_min": 1096
},
{
"epoch": 2.4876441515650742,
"grad_norm": 0.597724401455926,
"learning_rate": 3.257959635907409e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22339114546775818,
"step": 1510,
"valid_targets_mean": 2986.3,
"valid_targets_min": 920
},
{
"epoch": 2.495881383855025,
"grad_norm": 0.6561352881615815,
"learning_rate": 3.251562163005087e-05,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22298067808151245,
"step": 1515,
"valid_targets_mean": 2253.1,
"valid_targets_min": 925
},
{
"epoch": 2.504118616144975,
"grad_norm": 0.6162020968409021,
"learning_rate": 3.245143571956117e-05,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27440690994262695,
"step": 1520,
"valid_targets_mean": 2877.1,
"valid_targets_min": 821
},
{
"epoch": 2.5123558484349258,
"grad_norm": 0.6082712508042523,
"learning_rate": 3.2387039710641486e-05,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22499428689479828,
"step": 1525,
"valid_targets_mean": 2861.8,
"valid_targets_min": 289
},
{
"epoch": 2.5205930807248764,
"grad_norm": 0.7384333926998505,
"learning_rate": 3.232243468987336e-05,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21579819917678833,
"step": 1530,
"valid_targets_mean": 3231.4,
"valid_targets_min": 729
},
{
"epoch": 2.528830313014827,
"grad_norm": 0.6877047193253706,
"learning_rate": 3.2257621747365086e-05,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3097109794616699,
"step": 1535,
"valid_targets_mean": 2337.8,
"valid_targets_min": 755
},
{
"epoch": 2.5370675453047777,
"grad_norm": 0.543065421568093,
"learning_rate": 3.219260197673333e-05,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24384282529354095,
"step": 1540,
"valid_targets_mean": 3961.9,
"valid_targets_min": 1428
},
{
"epoch": 2.545304777594728,
"grad_norm": 0.6248347745562823,
"learning_rate": 3.212737647508464e-05,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28097227215766907,
"step": 1545,
"valid_targets_mean": 3362.5,
"valid_targets_min": 821
},
{
"epoch": 2.5535420098846786,
"grad_norm": 0.5691317720774456,
"learning_rate": 3.206194634299696e-05,
"loss": 0.2317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23817376792430878,
"step": 1550,
"valid_targets_mean": 3836.8,
"valid_targets_min": 1197
},
{
"epoch": 2.5617792421746293,
"grad_norm": 0.684915654232255,
"learning_rate": 3.199631268450104e-05,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2511272132396698,
"step": 1555,
"valid_targets_mean": 2801.4,
"valid_targets_min": 471
},
{
"epoch": 2.57001647446458,
"grad_norm": 0.7982907744163267,
"learning_rate": 3.1930476607061835e-05,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38522768020629883,
"step": 1560,
"valid_targets_mean": 3067.9,
"valid_targets_min": 743
},
{
"epoch": 2.5782537067545306,
"grad_norm": 0.6053095568591514,
"learning_rate": 3.1864439221559797e-05,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25679144263267517,
"step": 1565,
"valid_targets_mean": 2767.1,
"valid_targets_min": 829
},
{
"epoch": 2.586490939044481,
"grad_norm": 0.49767493638955396,
"learning_rate": 3.179820164227213e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3335208296775818,
"step": 1570,
"valid_targets_mean": 4638.4,
"valid_targets_min": 783
},
{
"epoch": 2.594728171334432,
"grad_norm": 0.6569402555128312,
"learning_rate": 3.1731764986853985e-05,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24302177131175995,
"step": 1575,
"valid_targets_mean": 2489.9,
"valid_targets_min": 939
},
{
"epoch": 2.602965403624382,
"grad_norm": 0.5921594644458538,
"learning_rate": 3.166513037631965e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26702389121055603,
"step": 1580,
"valid_targets_mean": 2795.8,
"valid_targets_min": 744
},
{
"epoch": 2.6112026359143328,
"grad_norm": 0.6407404206933615,
"learning_rate": 3.1598298935023536e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2785078287124634,
"step": 1585,
"valid_targets_mean": 2990.9,
"valid_targets_min": 630
},
{
"epoch": 2.6194398682042834,
"grad_norm": 0.6833324929674904,
"learning_rate": 3.153127179064131e-05,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.251248300075531,
"step": 1590,
"valid_targets_mean": 2696.2,
"valid_targets_min": 287
},
{
"epoch": 2.627677100494234,
"grad_norm": 0.6339558018061027,
"learning_rate": 3.146405007415081e-05,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.281749427318573,
"step": 1595,
"valid_targets_mean": 2749.6,
"valid_targets_min": 849
},
{
"epoch": 2.6359143327841847,
"grad_norm": 0.6273664397725301,
"learning_rate": 3.1396634919812955e-05,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2563917636871338,
"step": 1600,
"valid_targets_mean": 2623.4,
"valid_targets_min": 902
},
{
"epoch": 2.644151565074135,
"grad_norm": 0.6622434597804578,
"learning_rate": 3.1329027465152654e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3303392827510834,
"step": 1605,
"valid_targets_mean": 2999.7,
"valid_targets_min": 250
},
{
"epoch": 2.6523887973640856,
"grad_norm": 0.6020506711799892,
"learning_rate": 3.126122885093955e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22898972034454346,
"step": 1610,
"valid_targets_mean": 2827.9,
"valid_targets_min": 216
},
{
"epoch": 2.6606260296540363,
"grad_norm": 0.5656507553130597,
"learning_rate": 3.1193240221168835e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24721187353134155,
"step": 1615,
"valid_targets_mean": 3554.2,
"valid_targets_min": 824
},
{
"epoch": 2.668863261943987,
"grad_norm": 0.644282073051523,
"learning_rate": 3.112506272304189e-05,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2700679898262024,
"step": 1620,
"valid_targets_mean": 2953.6,
"valid_targets_min": 1192
},
{
"epoch": 2.6771004942339376,
"grad_norm": 0.6841700983785681,
"learning_rate": 3.1056697506946965e-05,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23583650588989258,
"step": 1625,
"valid_targets_mean": 2720.4,
"valid_targets_min": 523
},
{
"epoch": 2.685337726523888,
"grad_norm": 0.7340836959990856,
"learning_rate": 3.0988145726439754e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.307033509016037,
"step": 1630,
"valid_targets_mean": 2578.5,
"valid_targets_min": 382
},
{
"epoch": 2.6935749588138385,
"grad_norm": 0.6673998137709523,
"learning_rate": 3.091940853822393e-05,
"loss": 0.2537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29108643531799316,
"step": 1635,
"valid_targets_mean": 2832.3,
"valid_targets_min": 1206
},
{
"epoch": 2.701812191103789,
"grad_norm": 0.6467186852795253,
"learning_rate": 3.0850487102131624e-05,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21308313310146332,
"step": 1640,
"valid_targets_mean": 2594.9,
"valid_targets_min": 360
},
{
"epoch": 2.7100494233937398,
"grad_norm": 0.6944087919516522,
"learning_rate": 3.078138258110389e-05,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23937004804611206,
"step": 1645,
"valid_targets_mean": 2263.4,
"valid_targets_min": 245
},
{
"epoch": 2.7182866556836904,
"grad_norm": 0.5326350886269784,
"learning_rate": 3.071209614117103e-05,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3428668975830078,
"step": 1650,
"valid_targets_mean": 4543.8,
"valid_targets_min": 900
},
{
"epoch": 2.7265238879736406,
"grad_norm": 0.5078601743477384,
"learning_rate": 3.0642628951432916e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22137928009033203,
"step": 1655,
"valid_targets_mean": 3942.6,
"valid_targets_min": 769
},
{
"epoch": 2.7347611202635913,
"grad_norm": 0.601538874178317,
"learning_rate": 3.057298218403934e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2587862014770508,
"step": 1660,
"valid_targets_mean": 2621.9,
"valid_targets_min": 730
},
{
"epoch": 2.742998352553542,
"grad_norm": 0.5100732784028359,
"learning_rate": 3.050315701417016e-05,
"loss": 0.2444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22114631533622742,
"step": 1665,
"valid_targets_mean": 3594.6,
"valid_targets_min": 1032
},
{
"epoch": 2.7512355848434926,
"grad_norm": 0.6403837824931091,
"learning_rate": 3.043315462001549e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2376575469970703,
"step": 1670,
"valid_targets_mean": 2361.1,
"valid_targets_min": 1050
},
{
"epoch": 2.7594728171334433,
"grad_norm": 0.6630544642728583,
"learning_rate": 3.0362976182755837e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2816362679004669,
"step": 1675,
"valid_targets_mean": 2989.6,
"valid_targets_min": 324
},
{
"epoch": 2.7677100494233935,
"grad_norm": 0.6196334831818463,
"learning_rate": 3.0292622886542154e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24809390306472778,
"step": 1680,
"valid_targets_mean": 2796.4,
"valid_targets_min": 884
},
{
"epoch": 2.775947281713344,
"grad_norm": 0.5970044349725444,
"learning_rate": 3.0222095918475873e-05,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2813631594181061,
"step": 1685,
"valid_targets_mean": 3382.0,
"valid_targets_min": 303
},
{
"epoch": 2.784184514003295,
"grad_norm": 0.6241679803491641,
"learning_rate": 3.0151396468588848e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3226885199546814,
"step": 1690,
"valid_targets_mean": 3349.4,
"valid_targets_min": 629
},
{
"epoch": 2.7924217462932455,
"grad_norm": 0.6758678539427506,
"learning_rate": 3.0080525729823306e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2838185131549835,
"step": 1695,
"valid_targets_mean": 2828.4,
"valid_targets_min": 414
},
{
"epoch": 2.800658978583196,
"grad_norm": 0.6626285467688362,
"learning_rate": 3.0009484898011707e-05,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20693442225456238,
"step": 1700,
"valid_targets_mean": 2387.9,
"valid_targets_min": 330
},
{
"epoch": 2.808896210873147,
"grad_norm": 0.6348234491622945,
"learning_rate": 2.993827517185656e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1983412504196167,
"step": 1705,
"valid_targets_mean": 2287.1,
"valid_targets_min": 344
},
{
"epoch": 2.8171334431630974,
"grad_norm": 0.61643554024194,
"learning_rate": 2.9866897752910194e-05,
"loss": 0.2511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.283508837223053,
"step": 1710,
"valid_targets_mean": 3377.9,
"valid_targets_min": 296
},
{
"epoch": 2.8253706754530477,
"grad_norm": 0.6199082976797735,
"learning_rate": 2.979535384555449e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2590184211730957,
"step": 1715,
"valid_targets_mean": 2785.8,
"valid_targets_min": 525
},
{
"epoch": 2.8336079077429983,
"grad_norm": 0.6125979185177308,
"learning_rate": 2.972364465698058e-05,
"loss": 0.2517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20899072289466858,
"step": 1720,
"valid_targets_mean": 2579.9,
"valid_targets_min": 1082
},
{
"epoch": 2.841845140032949,
"grad_norm": 0.5290588033442578,
"learning_rate": 2.9651771397168443e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22369131445884705,
"step": 1725,
"valid_targets_mean": 3426.8,
"valid_targets_min": 293
},
{
"epoch": 2.8500823723228996,
"grad_norm": 0.6539333797819626,
"learning_rate": 2.95797352788665e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23585286736488342,
"step": 1730,
"valid_targets_mean": 2215.5,
"valid_targets_min": 995
},
{
"epoch": 2.8583196046128503,
"grad_norm": 0.5667125641727214,
"learning_rate": 2.9507537517571144e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26343971490859985,
"step": 1735,
"valid_targets_mean": 3617.1,
"valid_targets_min": 698
},
{
"epoch": 2.8665568369028005,
"grad_norm": 0.6487727126984469,
"learning_rate": 2.943517933150627e-05,
"loss": 0.23,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18966974318027496,
"step": 1740,
"valid_targets_mean": 2072.4,
"valid_targets_min": 620
},
{
"epoch": 2.874794069192751,
"grad_norm": 0.6607579482836561,
"learning_rate": 2.936266194160266e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2583504319190979,
"step": 1745,
"valid_targets_mean": 2565.9,
"valid_targets_min": 271
},
{
"epoch": 2.883031301482702,
"grad_norm": 0.5329687913430899,
"learning_rate": 2.9289986571477437e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20519870519638062,
"step": 1750,
"valid_targets_mean": 3771.8,
"valid_targets_min": 287
},
{
"epoch": 2.8912685337726525,
"grad_norm": 0.6309469478492378,
"learning_rate": 2.9217154447413353e-05,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2913402020931244,
"step": 1755,
"valid_targets_mean": 3011.4,
"valid_targets_min": 440
},
{
"epoch": 2.899505766062603,
"grad_norm": 0.6181431157029986,
"learning_rate": 2.9144166798338183e-05,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2582964301109314,
"step": 1760,
"valid_targets_mean": 2926.4,
"valid_targets_min": 904
},
{
"epoch": 2.9077429983525533,
"grad_norm": 0.561800631902138,
"learning_rate": 2.9071024855803915e-05,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24287906289100647,
"step": 1765,
"valid_targets_mean": 3191.9,
"valid_targets_min": 725
},
{
"epoch": 2.915980230642504,
"grad_norm": 0.5450888844326778,
"learning_rate": 2.899772985396599e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29268404841423035,
"step": 1770,
"valid_targets_mean": 4125.9,
"valid_targets_min": 219
},
{
"epoch": 2.9242174629324547,
"grad_norm": 0.6136775430077496,
"learning_rate": 2.8924283029562507e-05,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2912731170654297,
"step": 1775,
"valid_targets_mean": 2938.9,
"valid_targets_min": 696
},
{
"epoch": 2.9324546952224053,
"grad_norm": 0.5978265935100938,
"learning_rate": 2.8850685621893325e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252366840839386,
"step": 1780,
"valid_targets_mean": 2998.1,
"valid_targets_min": 1471
},
{
"epoch": 2.940691927512356,
"grad_norm": 0.7550055402423995,
"learning_rate": 2.8776938872799154e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3611225187778473,
"step": 1785,
"valid_targets_mean": 2618.1,
"valid_targets_min": 425
},
{
"epoch": 2.948929159802306,
"grad_norm": 0.7818665512831672,
"learning_rate": 2.8703044026640606e-05,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23194675147533417,
"step": 1790,
"valid_targets_mean": 2316.6,
"valid_targets_min": 737
},
{
"epoch": 2.957166392092257,
"grad_norm": 0.5892658804250798,
"learning_rate": 2.8629002330277193e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2277798354625702,
"step": 1795,
"valid_targets_mean": 3049.9,
"valid_targets_min": 1228
},
{
"epoch": 2.9654036243822075,
"grad_norm": 0.5471885661828383,
"learning_rate": 2.8554815033046314e-05,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2878086566925049,
"step": 1800,
"valid_targets_mean": 3484.8,
"valid_targets_min": 711
},
{
"epoch": 2.973640856672158,
"grad_norm": 0.6505108723919814,
"learning_rate": 2.8480483386742138e-05,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3757530748844147,
"step": 1805,
"valid_targets_mean": 3585.3,
"valid_targets_min": 685
},
{
"epoch": 2.981878088962109,
"grad_norm": 0.7103264195165173,
"learning_rate": 2.8406008645594503e-05,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2637771964073181,
"step": 1810,
"valid_targets_mean": 2895.6,
"valid_targets_min": 658
},
{
"epoch": 2.990115321252059,
"grad_norm": 0.5946550823036287,
"learning_rate": 2.8331392066247737e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252275288105011,
"step": 1815,
"valid_targets_mean": 3185.4,
"valid_targets_min": 917
},
{
"epoch": 2.99835255354201,
"grad_norm": 0.6152199859425457,
"learning_rate": 2.825663490773949e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2030968815088272,
"step": 1820,
"valid_targets_mean": 2650.6,
"valid_targets_min": 1287
},
{
"epoch": 3.0065897858319603,
"grad_norm": 0.6258707256547769,
"learning_rate": 2.8181738431479436e-05,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27519214153289795,
"step": 1825,
"valid_targets_mean": 3554.0,
"valid_targets_min": 242
},
{
"epoch": 3.014827018121911,
"grad_norm": 0.6979619035300266,
"learning_rate": 2.8106703901228038e-05,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24069149792194366,
"step": 1830,
"valid_targets_mean": 2847.0,
"valid_targets_min": 793
},
{
"epoch": 3.0230642504118617,
"grad_norm": 0.7103856015735733,
"learning_rate": 2.803153258307519e-05,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22712934017181396,
"step": 1835,
"valid_targets_mean": 3009.5,
"valid_targets_min": 1145
},
{
"epoch": 3.0313014827018123,
"grad_norm": 0.6606325974128326,
"learning_rate": 2.795622574541887e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18506592512130737,
"step": 1840,
"valid_targets_mean": 2418.6,
"valid_targets_min": 265
},
{
"epoch": 3.039538714991763,
"grad_norm": 0.6850431486225936,
"learning_rate": 2.7880784658943754e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18309485912322998,
"step": 1845,
"valid_targets_mean": 2489.2,
"valid_targets_min": 223
},
{
"epoch": 3.047775947281713,
"grad_norm": 0.5538682132728715,
"learning_rate": 2.780521059659972e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23113849759101868,
"step": 1850,
"valid_targets_mean": 3999.1,
"valid_targets_min": 202
},
{
"epoch": 3.056013179571664,
"grad_norm": 0.6796686047382778,
"learning_rate": 2.7729504833580435e-05,
"loss": 0.2261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25922173261642456,
"step": 1855,
"valid_targets_mean": 3340.5,
"valid_targets_min": 296
},
{
"epoch": 3.0642504118616145,
"grad_norm": 0.6304747169185941,
"learning_rate": 2.7653668647301797e-05,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16006682813167572,
"step": 1860,
"valid_targets_mean": 2294.0,
"valid_targets_min": 810
},
{
"epoch": 3.072487644151565,
"grad_norm": 0.7093598321151464,
"learning_rate": 2.7577703317380396e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18509194254875183,
"step": 1865,
"valid_targets_mean": 2160.2,
"valid_targets_min": 630
},
{
"epoch": 3.080724876441516,
"grad_norm": 0.7844752556313203,
"learning_rate": 2.7501610125611908e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27326297760009766,
"step": 1870,
"valid_targets_mean": 2360.1,
"valid_targets_min": 640
},
{
"epoch": 3.088962108731466,
"grad_norm": 0.6203395631329998,
"learning_rate": 2.7425390355949485e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20063695311546326,
"step": 1875,
"valid_targets_mean": 3214.6,
"valid_targets_min": 803
},
{
"epoch": 3.0971993410214167,
"grad_norm": 0.5972430112657969,
"learning_rate": 2.7349045294482085e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1896412968635559,
"step": 1880,
"valid_targets_mean": 3004.9,
"valid_targets_min": 858
},
{
"epoch": 3.1054365733113674,
"grad_norm": 0.6109690382269436,
"learning_rate": 2.727257622941276e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1823769062757492,
"step": 1885,
"valid_targets_mean": 3246.3,
"valid_targets_min": 869
},
{
"epoch": 3.113673805601318,
"grad_norm": 0.6680979030364619,
"learning_rate": 2.719598445103693e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30736616253852844,
"step": 1890,
"valid_targets_mean": 3581.5,
"valid_targets_min": 891
},
{
"epoch": 3.1219110378912687,
"grad_norm": 0.656674091764851,
"learning_rate": 2.7119271251720628e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24723771214485168,
"step": 1895,
"valid_targets_mean": 3369.2,
"valid_targets_min": 281
},
{
"epoch": 3.130148270181219,
"grad_norm": 0.7728854258315987,
"learning_rate": 2.7042437925878638e-05,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2554164528846741,
"step": 1900,
"valid_targets_mean": 2117.9,
"valid_targets_min": 347
},
{
"epoch": 3.1383855024711695,
"grad_norm": 0.6642247085562812,
"learning_rate": 2.696548576995273e-05,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1960965394973755,
"step": 1905,
"valid_targets_mean": 2602.1,
"valid_targets_min": 315
},
{
"epoch": 3.14662273476112,
"grad_norm": 0.6414494783887725,
"learning_rate": 2.688841608238971e-05,
"loss": 0.2409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22181352972984314,
"step": 1910,
"valid_targets_mean": 3207.8,
"valid_targets_min": 372
},
{
"epoch": 3.154859967051071,
"grad_norm": 0.6164066662964309,
"learning_rate": 2.6811230163619573e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2142753303050995,
"step": 1915,
"valid_targets_mean": 3368.1,
"valid_targets_min": 508
},
{
"epoch": 3.1630971993410215,
"grad_norm": 0.6512147028551658,
"learning_rate": 2.6733929316033516e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2733863592147827,
"step": 1920,
"valid_targets_mean": 3103.7,
"valid_targets_min": 696
},
{
"epoch": 3.171334431630972,
"grad_norm": 0.7299868596833275,
"learning_rate": 2.6656514843961995e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24958714842796326,
"step": 1925,
"valid_targets_mean": 2279.0,
"valid_targets_min": 330
},
{
"epoch": 3.1795716639209224,
"grad_norm": 0.8142044039966199,
"learning_rate": 2.6578988053652674e-05,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18350908160209656,
"step": 1930,
"valid_targets_mean": 2545.4,
"valid_targets_min": 311
},
{
"epoch": 3.187808896210873,
"grad_norm": 0.562898892452807,
"learning_rate": 2.650135025324845e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17142733931541443,
"step": 1935,
"valid_targets_mean": 3330.9,
"valid_targets_min": 1394
},
{
"epoch": 3.1960461285008237,
"grad_norm": 0.6582097758062362,
"learning_rate": 2.6423602752765313e-05,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20524603128433228,
"step": 1940,
"valid_targets_mean": 2706.2,
"valid_targets_min": 762
},
{
"epoch": 3.2042833607907744,
"grad_norm": 0.6657980269588102,
"learning_rate": 2.6345746864070266e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18109837174415588,
"step": 1945,
"valid_targets_mean": 3052.4,
"valid_targets_min": 1259
},
{
"epoch": 3.212520593080725,
"grad_norm": 0.5233060688239787,
"learning_rate": 2.626778390085921e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23430457711219788,
"step": 1950,
"valid_targets_mean": 3784.8,
"valid_targets_min": 1133
},
{
"epoch": 3.2207578253706757,
"grad_norm": 0.5640310501280067,
"learning_rate": 2.618971517863475e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2508048415184021,
"step": 1955,
"valid_targets_mean": 3848.9,
"valid_targets_min": 829
},
{
"epoch": 3.228995057660626,
"grad_norm": 0.6757649235613026,
"learning_rate": 2.611154201468402e-05,
"loss": 0.2048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19972142577171326,
"step": 1960,
"valid_targets_mean": 2526.3,
"valid_targets_min": 287
},
{
"epoch": 3.2372322899505765,
"grad_norm": 0.6327380969439266,
"learning_rate": 2.6033265728056437e-05,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27250388264656067,
"step": 1965,
"valid_targets_mean": 3225.0,
"valid_targets_min": 162
},
{
"epoch": 3.245469522240527,
"grad_norm": 0.6804914744524357,
"learning_rate": 2.5954887639541435e-05,
"loss": 0.2172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24783380329608917,
"step": 1970,
"valid_targets_mean": 3115.6,
"valid_targets_min": 1233
},
{
"epoch": 3.253706754530478,
"grad_norm": 0.6893147997495879,
"learning_rate": 2.5876409071646224e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19912023842334747,
"step": 1975,
"valid_targets_mean": 2359.8,
"valid_targets_min": 704
},
{
"epoch": 3.2619439868204285,
"grad_norm": 0.7483268034445905,
"learning_rate": 2.5797831348573425e-05,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24190068244934082,
"step": 1980,
"valid_targets_mean": 2175.4,
"valid_targets_min": 287
},
{
"epoch": 3.2701812191103787,
"grad_norm": 0.7575224906224661,
"learning_rate": 2.571915579619876e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20588669180870056,
"step": 1985,
"valid_targets_mean": 2110.9,
"valid_targets_min": 459
},
{
"epoch": 3.2784184514003294,
"grad_norm": 0.7392556685136732,
"learning_rate": 2.5640383742048654e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2323339730501175,
"step": 1990,
"valid_targets_mean": 3014.4,
"valid_targets_min": 617
},
{
"epoch": 3.28665568369028,
"grad_norm": 0.6831064439961768,
"learning_rate": 2.5561516515277863e-05,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21883323788642883,
"step": 1995,
"valid_targets_mean": 2510.6,
"valid_targets_min": 302
},
{
"epoch": 3.2948929159802307,
"grad_norm": 0.8007206900810597,
"learning_rate": 2.5482555446647018e-05,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22404079139232635,
"step": 2000,
"valid_targets_mean": 2083.4,
"valid_targets_min": 246
},
{
"epoch": 3.3031301482701814,
"grad_norm": 0.5429592839510521,
"learning_rate": 2.5403501868500185e-05,
"loss": 0.2114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2400265783071518,
"step": 2005,
"valid_targets_mean": 4130.8,
"valid_targets_min": 1160
},
{
"epoch": 3.3113673805601316,
"grad_norm": 0.5660803486075174,
"learning_rate": 2.5324357114742397e-05,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2689647376537323,
"step": 2010,
"valid_targets_mean": 3778.0,
"valid_targets_min": 1193
},
{
"epoch": 3.3196046128500822,
"grad_norm": 0.7767761209530037,
"learning_rate": 2.5245122520817117e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2215704619884491,
"step": 2015,
"valid_targets_mean": 2003.6,
"valid_targets_min": 1036
},
{
"epoch": 3.327841845140033,
"grad_norm": 0.6855725876862521,
"learning_rate": 2.516579942368373e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2817282974720001,
"step": 2020,
"valid_targets_mean": 2737.0,
"valid_targets_min": 888
},
{
"epoch": 3.3360790774299836,
"grad_norm": 0.6814741906770814,
"learning_rate": 2.508638916179497e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21324288845062256,
"step": 2025,
"valid_targets_mean": 2609.9,
"valid_targets_min": 702
},
{
"epoch": 3.344316309719934,
"grad_norm": 0.6327378315223203,
"learning_rate": 2.5006893075074326e-05,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19734251499176025,
"step": 2030,
"valid_targets_mean": 2890.1,
"valid_targets_min": 1511
},
{
"epoch": 3.352553542009885,
"grad_norm": 0.6132165565742003,
"learning_rate": 2.4927312504893467e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18627655506134033,
"step": 2035,
"valid_targets_mean": 2605.4,
"valid_targets_min": 1161
},
{
"epoch": 3.360790774299835,
"grad_norm": 0.5659647262055583,
"learning_rate": 2.4847648794049587e-05,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27079278230667114,
"step": 2040,
"valid_targets_mean": 3818.2,
"valid_targets_min": 307
},
{
"epoch": 3.3690280065897857,
"grad_norm": 0.7525363828497744,
"learning_rate": 2.4767903286742732e-05,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642737030982971,
"step": 2045,
"valid_targets_mean": 2758.6,
"valid_targets_min": 915
},
{
"epoch": 3.3772652388797364,
"grad_norm": 0.643032011061072,
"learning_rate": 2.468807732855314e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2521781921386719,
"step": 2050,
"valid_targets_mean": 2820.3,
"valid_targets_min": 869
},
{
"epoch": 3.385502471169687,
"grad_norm": 0.5925300737235305,
"learning_rate": 2.4608172266418543e-05,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20423221588134766,
"step": 2055,
"valid_targets_mean": 3420.7,
"valid_targets_min": 1010
},
{
"epoch": 3.3937397034596377,
"grad_norm": 0.6235488121604282,
"learning_rate": 2.4528189448611417e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18752437829971313,
"step": 2060,
"valid_targets_mean": 2721.8,
"valid_targets_min": 592
},
{
"epoch": 3.4019769357495884,
"grad_norm": 0.6870040109780278,
"learning_rate": 2.4448130224716248e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22506539523601532,
"step": 2065,
"valid_targets_mean": 2590.9,
"valid_targets_min": 264
},
{
"epoch": 3.4102141680395386,
"grad_norm": 0.7094267432239266,
"learning_rate": 2.436799594560675e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2151351273059845,
"step": 2070,
"valid_targets_mean": 2135.9,
"valid_targets_min": 556
},
{
"epoch": 3.4184514003294892,
"grad_norm": 0.6314415541358995,
"learning_rate": 2.4287787963423076e-05,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21119928359985352,
"step": 2075,
"valid_targets_mean": 2751.8,
"valid_targets_min": 964
},
{
"epoch": 3.42668863261944,
"grad_norm": 0.6546436274570712,
"learning_rate": 2.4207507631549013e-05,
"loss": 0.272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2236832231283188,
"step": 2080,
"valid_targets_mean": 2722.8,
"valid_targets_min": 438
},
{
"epoch": 3.4349258649093906,
"grad_norm": 0.7372518274682155,
"learning_rate": 2.412715630458912e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20843760669231415,
"step": 2085,
"valid_targets_mean": 1994.7,
"valid_targets_min": 289
},
{
"epoch": 3.443163097199341,
"grad_norm": 0.608006914662658,
"learning_rate": 2.4046735338345895e-05,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18041086196899414,
"step": 2090,
"valid_targets_mean": 3166.0,
"valid_targets_min": 252
},
{
"epoch": 3.4514003294892914,
"grad_norm": 0.6151046163508607,
"learning_rate": 2.396624608979689e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19882315397262573,
"step": 2095,
"valid_targets_mean": 3122.8,
"valid_targets_min": 565
},
{
"epoch": 3.459637561779242,
"grad_norm": 0.6562773996483675,
"learning_rate": 2.3885689917071822e-05,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.235906183719635,
"step": 2100,
"valid_targets_mean": 2765.6,
"valid_targets_min": 686
},
{
"epoch": 3.4678747940691927,
"grad_norm": 0.6592007545756166,
"learning_rate": 2.3805068179429628e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1776544600725174,
"step": 2105,
"valid_targets_mean": 2520.6,
"valid_targets_min": 1343
},
{
"epoch": 3.4761120263591434,
"grad_norm": 0.6590580088665366,
"learning_rate": 2.372438223723555e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21588583290576935,
"step": 2110,
"valid_targets_mean": 2554.1,
"valid_targets_min": 380
},
{
"epoch": 3.484349258649094,
"grad_norm": 0.8076922098904575,
"learning_rate": 2.3643633451938216e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25158339738845825,
"step": 2115,
"valid_targets_mean": 2090.4,
"valid_targets_min": 303
},
{
"epoch": 3.4925864909390443,
"grad_norm": 0.6332341820976258,
"learning_rate": 2.35628231860466e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24031797051429749,
"step": 2120,
"valid_targets_mean": 2920.2,
"valid_targets_min": 354
},
{
"epoch": 3.500823723228995,
"grad_norm": 0.577407770793513,
"learning_rate": 2.3481952803107067e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22233733534812927,
"step": 2125,
"valid_targets_mean": 3850.7,
"valid_targets_min": 1515
},
{
"epoch": 3.5090609555189456,
"grad_norm": 0.6567622204640255,
"learning_rate": 2.3401023667680373e-05,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19248053431510925,
"step": 2130,
"valid_targets_mean": 2304.1,
"valid_targets_min": 237
},
{
"epoch": 3.5172981878088962,
"grad_norm": 0.7141705443386381,
"learning_rate": 2.332003714531862e-05,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1976984441280365,
"step": 2135,
"valid_targets_mean": 2048.7,
"valid_targets_min": 694
},
{
"epoch": 3.525535420098847,
"grad_norm": 0.607697425345425,
"learning_rate": 2.3238994602542246e-05,
"loss": 0.2115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21744032204151154,
"step": 2140,
"valid_targets_mean": 3213.8,
"valid_targets_min": 413
},
{
"epoch": 3.533772652388797,
"grad_norm": 0.7021370663152642,
"learning_rate": 2.3157897406816917e-05,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28610166907310486,
"step": 2145,
"valid_targets_mean": 2821.2,
"valid_targets_min": 230
},
{
"epoch": 3.5420098846787478,
"grad_norm": 0.5461733110954154,
"learning_rate": 2.3076746926530497e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2287541776895523,
"step": 2150,
"valid_targets_mean": 3553.9,
"valid_targets_min": 650
},
{
"epoch": 3.5502471169686984,
"grad_norm": 0.5850319326104395,
"learning_rate": 2.2995544530969946e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22641529142856598,
"step": 2155,
"valid_targets_mean": 3302.9,
"valid_targets_min": 781
},
{
"epoch": 3.558484349258649,
"grad_norm": 0.582193722764864,
"learning_rate": 2.2914291590298197e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1886036992073059,
"step": 2160,
"valid_targets_mean": 2990.2,
"valid_targets_min": 1004
},
{
"epoch": 3.5667215815485998,
"grad_norm": 0.6473717041137795,
"learning_rate": 2.2832989475531073e-05,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25963377952575684,
"step": 2165,
"valid_targets_mean": 3190.9,
"valid_targets_min": 769
},
{
"epoch": 3.5749588138385504,
"grad_norm": 0.6615310004983426,
"learning_rate": 2.2751639558514116e-05,
"loss": 0.2213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2162645161151886,
"step": 2170,
"valid_targets_mean": 2861.2,
"valid_targets_min": 613
},
{
"epoch": 3.583196046128501,
"grad_norm": 0.6338711397955663,
"learning_rate": 2.267024321189947e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.251259446144104,
"step": 2175,
"valid_targets_mean": 3085.6,
"valid_targets_min": 941
},
{
"epoch": 3.5914332784184513,
"grad_norm": 0.783642027585893,
"learning_rate": 2.2588801809122692e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2465619146823883,
"step": 2180,
"valid_targets_mean": 2471.6,
"valid_targets_min": 1463
},
{
"epoch": 3.599670510708402,
"grad_norm": 0.586321202432999,
"learning_rate": 2.2507316724379603e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1637313961982727,
"step": 2185,
"valid_targets_mean": 3156.4,
"valid_targets_min": 910
},
{
"epoch": 3.6079077429983526,
"grad_norm": 0.6379027755615722,
"learning_rate": 2.2425789332603073e-05,
"loss": 0.2315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23997169733047485,
"step": 2190,
"valid_targets_mean": 2858.4,
"valid_targets_min": 847
},
{
"epoch": 3.6161449752883033,
"grad_norm": 0.6047690528170985,
"learning_rate": 2.2344221009439863e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24346941709518433,
"step": 2195,
"valid_targets_mean": 3866.5,
"valid_targets_min": 813
},
{
"epoch": 3.624382207578254,
"grad_norm": 0.6313067950028487,
"learning_rate": 2.2262613131227357e-05,
"loss": 0.2205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22747395932674408,
"step": 2200,
"valid_targets_mean": 3051.4,
"valid_targets_min": 940
},
{
"epoch": 3.632619439868204,
"grad_norm": 0.6656343358447956,
"learning_rate": 2.2180967074970384e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19725120067596436,
"step": 2205,
"valid_targets_mean": 2394.8,
"valid_targets_min": 1078
},
{
"epoch": 3.640856672158155,
"grad_norm": 0.7130890060910889,
"learning_rate": 2.2099284218317965e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25655680894851685,
"step": 2210,
"valid_targets_mean": 3127.7,
"valid_targets_min": 1049
},
{
"epoch": 3.6490939044481054,
"grad_norm": 0.610819423734245,
"learning_rate": 2.201756593954007e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23688563704490662,
"step": 2215,
"valid_targets_mean": 2912.0,
"valid_targets_min": 591
},
{
"epoch": 3.657331136738056,
"grad_norm": 0.6314338546235789,
"learning_rate": 2.1935813617504372e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23836040496826172,
"step": 2220,
"valid_targets_mean": 3433.9,
"valid_targets_min": 1226
},
{
"epoch": 3.6655683690280068,
"grad_norm": 0.6913445443394045,
"learning_rate": 2.1854028631652958e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20062170922756195,
"step": 2225,
"valid_targets_mean": 3753.8,
"valid_targets_min": 1806
},
{
"epoch": 3.673805601317957,
"grad_norm": 0.6508619258749753,
"learning_rate": 2.1772212361979053e-05,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2572256624698639,
"step": 2230,
"valid_targets_mean": 2761.0,
"valid_targets_min": 261
},
{
"epoch": 3.6820428336079076,
"grad_norm": 0.5753873608912875,
"learning_rate": 2.1690366189003776e-05,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2219148576259613,
"step": 2235,
"valid_targets_mean": 3162.1,
"valid_targets_min": 871
},
{
"epoch": 3.6902800658978583,
"grad_norm": 0.6527308666941445,
"learning_rate": 2.16084914937528e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24218809604644775,
"step": 2240,
"valid_targets_mean": 3107.4,
"valid_targets_min": 1077
},
{
"epoch": 3.698517298187809,
"grad_norm": 1.124267119734622,
"learning_rate": 2.1526589657733076e-05,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22716014087200165,
"step": 2245,
"valid_targets_mean": 2182.6,
"valid_targets_min": 245
},
{
"epoch": 3.7067545304777596,
"grad_norm": 0.5693915019753482,
"learning_rate": 2.1444662062909497e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18227519094944,
"step": 2250,
"valid_targets_mean": 3361.0,
"valid_targets_min": 377
},
{
"epoch": 3.71499176276771,
"grad_norm": 0.6891371173963926,
"learning_rate": 2.136271009168162e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1876133233308792,
"step": 2255,
"valid_targets_mean": 2128.9,
"valid_targets_min": 719
},
{
"epoch": 3.7232289950576605,
"grad_norm": 0.6567207894440227,
"learning_rate": 2.128073512686029e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2048790454864502,
"step": 2260,
"valid_targets_mean": 2656.5,
"valid_targets_min": 1183
},
{
"epoch": 3.731466227347611,
"grad_norm": 0.7458147326733252,
"learning_rate": 2.1198738551644344e-05,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2422378957271576,
"step": 2265,
"valid_targets_mean": 2192.9,
"valid_targets_min": 251
},
{
"epoch": 3.739703459637562,
"grad_norm": 0.6442647879430062,
"learning_rate": 2.1116721749597265e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20766223967075348,
"step": 2270,
"valid_targets_mean": 2699.9,
"valid_targets_min": 251
},
{
"epoch": 3.7479406919275124,
"grad_norm": 0.6516890191749407,
"learning_rate": 2.1034686104623828e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24694222211837769,
"step": 2275,
"valid_targets_mean": 2857.2,
"valid_targets_min": 1068
},
{
"epoch": 3.7561779242174627,
"grad_norm": 0.7329917353431759,
"learning_rate": 2.0952633000946753e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23302693665027618,
"step": 2280,
"valid_targets_mean": 2236.2,
"valid_targets_min": 251
},
{
"epoch": 3.7644151565074138,
"grad_norm": 0.7031038589727836,
"learning_rate": 2.0870563823083347e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21459734439849854,
"step": 2285,
"valid_targets_mean": 2116.3,
"valid_targets_min": 683
},
{
"epoch": 3.772652388797364,
"grad_norm": 0.6857035428769572,
"learning_rate": 2.0788479955822137e-05,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20176962018013,
"step": 2290,
"valid_targets_mean": 2616.1,
"valid_targets_min": 1007
},
{
"epoch": 3.7808896210873146,
"grad_norm": 0.8073211974656119,
"learning_rate": 2.0706382784199524e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27309340238571167,
"step": 2295,
"valid_targets_mean": 2650.2,
"valid_targets_min": 753
},
{
"epoch": 3.7891268533772653,
"grad_norm": 0.7210086182232971,
"learning_rate": 2.06242736934764e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21143299341201782,
"step": 2300,
"valid_targets_mean": 2429.8,
"valid_targets_min": 693
},
{
"epoch": 3.797364085667216,
"grad_norm": 0.6610150115701522,
"learning_rate": 2.0542154069114753e-05,
"loss": 0.2355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20834533870220184,
"step": 2305,
"valid_targets_mean": 2753.0,
"valid_targets_min": 317
},
{
"epoch": 3.8056013179571666,
"grad_norm": 0.8143475265522775,
"learning_rate": 2.0460025296754326e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2677311897277832,
"step": 2310,
"valid_targets_mean": 1949.5,
"valid_targets_min": 311
},
{
"epoch": 3.813838550247117,
"grad_norm": 0.6674017870698288,
"learning_rate": 2.037788876218923e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17726172506809235,
"step": 2315,
"valid_targets_mean": 2284.8,
"valid_targets_min": 324
},
{
"epoch": 3.8220757825370675,
"grad_norm": 0.5838081717362156,
"learning_rate": 2.029574585134452e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22934329509735107,
"step": 2320,
"valid_targets_mean": 3687.3,
"valid_targets_min": 791
},
{
"epoch": 3.830313014827018,
"grad_norm": 0.6778643643059814,
"learning_rate": 2.0213597950252864e-05,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21608680486679077,
"step": 2325,
"valid_targets_mean": 2646.7,
"valid_targets_min": 374
},
{
"epoch": 3.838550247116969,
"grad_norm": 0.5949453895813899,
"learning_rate": 2.0131446445031132e-05,
"loss": 0.217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23367094993591309,
"step": 2330,
"valid_targets_mean": 3113.8,
"valid_targets_min": 1029
},
{
"epoch": 3.8467874794069195,
"grad_norm": 0.6215489423579595,
"learning_rate": 2.0049292721857005e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2354554384946823,
"step": 2335,
"valid_targets_mean": 2976.0,
"valid_targets_min": 1576
},
{
"epoch": 3.8550247116968697,
"grad_norm": 0.6525560252314341,
"learning_rate": 1.9967138166945584e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21559584140777588,
"step": 2340,
"valid_targets_mean": 2901.3,
"valid_targets_min": 1446
},
{
"epoch": 3.8632619439868203,
"grad_norm": 0.6584339432357748,
"learning_rate": 1.9884984166525996e-05,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2388259917497635,
"step": 2345,
"valid_targets_mean": 2916.9,
"valid_targets_min": 809
},
{
"epoch": 3.871499176276771,
"grad_norm": 0.6625292350672669,
"learning_rate": 1.9802832106818038e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20597676932811737,
"step": 2350,
"valid_targets_mean": 2825.5,
"valid_targets_min": 425
},
{
"epoch": 3.8797364085667216,
"grad_norm": 0.6845618073993892,
"learning_rate": 1.9720683374008742e-05,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2833724617958069,
"step": 2355,
"valid_targets_mean": 2759.7,
"valid_targets_min": 811
},
{
"epoch": 3.8879736408566723,
"grad_norm": 0.7583414594121382,
"learning_rate": 1.9638539354228994e-05,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23047031462192535,
"step": 2360,
"valid_targets_mean": 1862.4,
"valid_targets_min": 728
},
{
"epoch": 3.8962108731466225,
"grad_norm": 0.6863919509729713,
"learning_rate": 1.9556401433530186e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19445081055164337,
"step": 2365,
"valid_targets_mean": 2312.0,
"valid_targets_min": 236
},
{
"epoch": 3.904448105436573,
"grad_norm": 0.5702207511533826,
"learning_rate": 1.947427099786077e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1521320939064026,
"step": 2370,
"valid_targets_mean": 2876.6,
"valid_targets_min": 574
},
{
"epoch": 3.912685337726524,
"grad_norm": 0.725652791371573,
"learning_rate": 1.9392149433042915e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21470411121845245,
"step": 2375,
"valid_targets_mean": 2422.2,
"valid_targets_min": 1293
},
{
"epoch": 3.9209225700164745,
"grad_norm": 0.7521039314890973,
"learning_rate": 1.9310038124749102e-05,
"loss": 0.2146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2105662226676941,
"step": 2380,
"valid_targets_mean": 2092.1,
"valid_targets_min": 914
},
{
"epoch": 3.929159802306425,
"grad_norm": 0.7221609491167119,
"learning_rate": 1.9227938458478744e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1993308663368225,
"step": 2385,
"valid_targets_mean": 2114.9,
"valid_targets_min": 286
},
{
"epoch": 3.9373970345963754,
"grad_norm": 0.6765877567980294,
"learning_rate": 1.9145851819534824e-05,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19120612740516663,
"step": 2390,
"valid_targets_mean": 2558.6,
"valid_targets_min": 817
},
{
"epoch": 3.9456342668863265,
"grad_norm": 0.5868278571600912,
"learning_rate": 1.9063779593000507e-05,
"loss": 0.2148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1894645094871521,
"step": 2395,
"valid_targets_mean": 3188.8,
"valid_targets_min": 847
},
{
"epoch": 3.9538714991762767,
"grad_norm": 0.5382630298422423,
"learning_rate": 1.8981723163715756e-05,
"loss": 0.217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20977070927619934,
"step": 2400,
"valid_targets_mean": 3654.6,
"valid_targets_min": 708
},
{
"epoch": 3.9621087314662273,
"grad_norm": 0.6247881187672814,
"learning_rate": 1.8899683916254013e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19764485955238342,
"step": 2405,
"valid_targets_mean": 2881.1,
"valid_targets_min": 849
},
{
"epoch": 3.970345963756178,
"grad_norm": 0.7327354122670338,
"learning_rate": 1.881766323489877e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23579062521457672,
"step": 2410,
"valid_targets_mean": 2472.6,
"valid_targets_min": 746
},
{
"epoch": 3.9785831960461286,
"grad_norm": 0.6595175545075271,
"learning_rate": 1.8735662503620268e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2350047081708908,
"step": 2415,
"valid_targets_mean": 3148.6,
"valid_targets_min": 309
},
{
"epoch": 3.9868204283360793,
"grad_norm": 0.510007753878104,
"learning_rate": 1.8653683106052097e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20294642448425293,
"step": 2420,
"valid_targets_mean": 3626.1,
"valid_targets_min": 341
},
{
"epoch": 3.9950576606260295,
"grad_norm": 0.6659822075544012,
"learning_rate": 1.857172642546791e-05,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24123075604438782,
"step": 2425,
"valid_targets_mean": 2767.6,
"valid_targets_min": 866
},
{
"epoch": 4.003294892915981,
"grad_norm": 0.6848919535763092,
"learning_rate": 1.8489793844758015e-05,
"loss": 0.2112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.196708083152771,
"step": 2430,
"valid_targets_mean": 2348.8,
"valid_targets_min": 780
},
{
"epoch": 4.011532125205931,
"grad_norm": 0.8126335054852767,
"learning_rate": 1.8407886746406082e-05,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18026752769947052,
"step": 2435,
"valid_targets_mean": 1642.7,
"valid_targets_min": 524
},
{
"epoch": 4.019769357495881,
"grad_norm": 0.6954560411576156,
"learning_rate": 1.8326006512465806e-05,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1572655588388443,
"step": 2440,
"valid_targets_mean": 2657.9,
"valid_targets_min": 304
},
{
"epoch": 4.028006589785832,
"grad_norm": 0.6681376975506721,
"learning_rate": 1.8244154524537602e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1940767467021942,
"step": 2445,
"valid_targets_mean": 3489.4,
"valid_targets_min": 674
},
{
"epoch": 4.036243822075782,
"grad_norm": 0.675763921438596,
"learning_rate": 1.8162332163745253e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18810434639453888,
"step": 2450,
"valid_targets_mean": 2845.8,
"valid_targets_min": 245
},
{
"epoch": 4.0444810543657335,
"grad_norm": 0.6559161150800585,
"learning_rate": 1.8080540810712652e-05,
"loss": 0.1836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1783156543970108,
"step": 2455,
"valid_targets_mean": 3050.2,
"valid_targets_min": 747
},
{
"epoch": 4.052718286655684,
"grad_norm": 0.7053939038206681,
"learning_rate": 1.799878184554047e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18840208649635315,
"step": 2460,
"valid_targets_mean": 2819.3,
"valid_targets_min": 1529
},
{
"epoch": 4.060955518945634,
"grad_norm": 0.5768463220547291,
"learning_rate": 1.7917056647782888e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2617749571800232,
"step": 2465,
"valid_targets_mean": 4129.8,
"valid_targets_min": 245
},
{
"epoch": 4.069192751235585,
"grad_norm": 0.6610629470321063,
"learning_rate": 1.7835366596424317e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20493917167186737,
"step": 2470,
"valid_targets_mean": 3070.0,
"valid_targets_min": 1007
},
{
"epoch": 4.077429983525535,
"grad_norm": 0.6908004026096404,
"learning_rate": 1.775371306985613e-05,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2220386117696762,
"step": 2475,
"valid_targets_mean": 2883.8,
"valid_targets_min": 829
},
{
"epoch": 4.085667215815486,
"grad_norm": 0.679048587976391,
"learning_rate": 1.7672097445853388e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17979687452316284,
"step": 2480,
"valid_targets_mean": 2942.2,
"valid_targets_min": 1084
},
{
"epoch": 4.0939044481054365,
"grad_norm": 0.7517226829701907,
"learning_rate": 1.7590521101551635e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20365673303604126,
"step": 2485,
"valid_targets_mean": 2352.6,
"valid_targets_min": 250
},
{
"epoch": 4.102141680395387,
"grad_norm": 0.7091041235957187,
"learning_rate": 1.7508985413423595e-05,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2280346006155014,
"step": 2490,
"valid_targets_mean": 2677.7,
"valid_targets_min": 1029
},
{
"epoch": 4.110378912685338,
"grad_norm": 0.7089396573462521,
"learning_rate": 1.742749175725601e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18262189626693726,
"step": 2495,
"valid_targets_mean": 2452.9,
"valid_targets_min": 224
},
{
"epoch": 4.118616144975288,
"grad_norm": 0.6892080263313686,
"learning_rate": 1.7346041508126386e-05,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1696496605873108,
"step": 2500,
"valid_targets_mean": 2710.0,
"valid_targets_min": 891
},
{
"epoch": 4.126853377265239,
"grad_norm": 0.7552024083884684,
"learning_rate": 1.7264636040379808e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2135401964187622,
"step": 2505,
"valid_targets_mean": 2567.6,
"valid_targets_min": 307
},
{
"epoch": 4.135090609555189,
"grad_norm": 0.6846684162918165,
"learning_rate": 1.7183276727605743e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17049439251422882,
"step": 2510,
"valid_targets_mean": 3185.9,
"valid_targets_min": 1214
},
{
"epoch": 4.1433278418451405,
"grad_norm": 0.6726148670882198,
"learning_rate": 1.7101964942614864e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18531067669391632,
"step": 2515,
"valid_targets_mean": 2673.3,
"valid_targets_min": 241
},
{
"epoch": 4.151565074135091,
"grad_norm": 0.7050748175603723,
"learning_rate": 1.7020702057415884e-05,
"loss": 0.2148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.192526176571846,
"step": 2520,
"valid_targets_mean": 3261.9,
"valid_targets_min": 890
},
{
"epoch": 4.159802306425041,
"grad_norm": 0.7166479950826307,
"learning_rate": 1.6939489443192435e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17323213815689087,
"step": 2525,
"valid_targets_mean": 2580.0,
"valid_targets_min": 279
},
{
"epoch": 4.168039538714992,
"grad_norm": 0.6307866731323056,
"learning_rate": 1.6858328470279862e-05,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18545058369636536,
"step": 2530,
"valid_targets_mean": 3305.8,
"valid_targets_min": 809
},
{
"epoch": 4.176276771004942,
"grad_norm": 0.6262445327354411,
"learning_rate": 1.6777220508142184e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2297663688659668,
"step": 2535,
"valid_targets_mean": 3642.7,
"valid_targets_min": 1657
},
{
"epoch": 4.184514003294893,
"grad_norm": 1.123430237088534,
"learning_rate": 1.6696166925348924e-05,
"loss": 0.2048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15774188935756683,
"step": 2540,
"valid_targets_mean": 4065.2,
"valid_targets_min": 696
},
{
"epoch": 4.1927512355848435,
"grad_norm": 0.6851282095150327,
"learning_rate": 1.6615169089552038e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3130187392234802,
"step": 2545,
"valid_targets_mean": 3510.0,
"valid_targets_min": 346
},
{
"epoch": 4.200988467874794,
"grad_norm": 0.6776890152032327,
"learning_rate": 1.6534228367462843e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18178880214691162,
"step": 2550,
"valid_targets_mean": 2698.2,
"valid_targets_min": 380
},
{
"epoch": 4.209225700164745,
"grad_norm": 0.5858915064486262,
"learning_rate": 1.6453346124828966e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18752583861351013,
"step": 2555,
"valid_targets_mean": 4041.8,
"valid_targets_min": 876
},
{
"epoch": 4.217462932454695,
"grad_norm": 0.6603867459341165,
"learning_rate": 1.6372523726411253e-05,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18429623544216156,
"step": 2560,
"valid_targets_mean": 3103.4,
"valid_targets_min": 817
},
{
"epoch": 4.225700164744646,
"grad_norm": 0.6627234827005007,
"learning_rate": 1.6291762535960817e-05,
"loss": 0.1996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14199604094028473,
"step": 2565,
"valid_targets_mean": 2462.8,
"valid_targets_min": 320
},
{
"epoch": 4.233937397034596,
"grad_norm": 0.6553355284722763,
"learning_rate": 1.6211063916195945e-05,
"loss": 0.2317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1949518620967865,
"step": 2570,
"valid_targets_mean": 3206.4,
"valid_targets_min": 667
},
{
"epoch": 4.242174629324547,
"grad_norm": 0.6980909727917753,
"learning_rate": 1.6130429228779154e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1674255132675171,
"step": 2575,
"valid_targets_mean": 2631.8,
"valid_targets_min": 817
},
{
"epoch": 4.250411861614498,
"grad_norm": 1.0730056513064912,
"learning_rate": 1.604985983429421e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18854576349258423,
"step": 2580,
"valid_targets_mean": 3124.4,
"valid_targets_min": 569
},
{
"epoch": 4.258649093904448,
"grad_norm": 0.7520222031647412,
"learning_rate": 1.596935709222315e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21556442975997925,
"step": 2585,
"valid_targets_mean": 2409.2,
"valid_targets_min": 708
},
{
"epoch": 4.266886326194399,
"grad_norm": 0.6583239060045123,
"learning_rate": 1.5888922360923375e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19209733605384827,
"step": 2590,
"valid_targets_mean": 2888.0,
"valid_targets_min": 658
},
{
"epoch": 4.275123558484349,
"grad_norm": 0.643988352278543,
"learning_rate": 1.5808556997604684e-05,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1911228597164154,
"step": 2595,
"valid_targets_mean": 3091.2,
"valid_targets_min": 649
},
{
"epoch": 4.283360790774299,
"grad_norm": 0.7313653605878269,
"learning_rate": 1.5728262358306418e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18181253969669342,
"step": 2600,
"valid_targets_mean": 2933.1,
"valid_targets_min": 866
},
{
"epoch": 4.2915980230642505,
"grad_norm": 0.7255332306218216,
"learning_rate": 1.564803979787457e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20717540383338928,
"step": 2605,
"valid_targets_mean": 2623.2,
"valid_targets_min": 1101
},
{
"epoch": 4.299835255354201,
"grad_norm": 0.7531476679995408,
"learning_rate": 1.5567890669938903e-05,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1496737003326416,
"step": 2610,
"valid_targets_mean": 2502.5,
"valid_targets_min": 754
},
{
"epoch": 4.308072487644152,
"grad_norm": 0.6487606715317696,
"learning_rate": 1.5487816326890118e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19765833020210266,
"step": 2615,
"valid_targets_mean": 2939.9,
"valid_targets_min": 744
},
{
"epoch": 4.316309719934102,
"grad_norm": 0.7240518260494907,
"learning_rate": 1.540781811985704e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20093931257724762,
"step": 2620,
"valid_targets_mean": 3010.4,
"valid_targets_min": 237
},
{
"epoch": 4.324546952224052,
"grad_norm": 0.7571300929723414,
"learning_rate": 1.5327897398683827e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22667065262794495,
"step": 2625,
"valid_targets_mean": 2461.3,
"valid_targets_min": 320
},
{
"epoch": 4.332784184514003,
"grad_norm": 0.6867670673018871,
"learning_rate": 1.5248055511907183e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2281215339899063,
"step": 2630,
"valid_targets_mean": 2981.8,
"valid_targets_min": 340
},
{
"epoch": 4.341021416803954,
"grad_norm": 0.8256870657949581,
"learning_rate": 1.5168293806733594e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1914563775062561,
"step": 2635,
"valid_targets_mean": 1873.8,
"valid_targets_min": 595
},
{
"epoch": 4.349258649093905,
"grad_norm": 0.6775685498781048,
"learning_rate": 1.5088613629016613e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19783690571784973,
"step": 2640,
"valid_targets_mean": 3498.0,
"valid_targets_min": 585
},
{
"epoch": 4.357495881383855,
"grad_norm": 0.6103793140474083,
"learning_rate": 1.5009016323234158e-05,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14736308157444,
"step": 2645,
"valid_targets_mean": 3104.6,
"valid_targets_min": 809
},
{
"epoch": 4.365733113673806,
"grad_norm": 0.6444833412719732,
"learning_rate": 1.4929503232465804e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17908361554145813,
"step": 2650,
"valid_targets_mean": 2714.5,
"valid_targets_min": 896
},
{
"epoch": 4.373970345963756,
"grad_norm": 0.6125674016153442,
"learning_rate": 1.485007569837011e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18148434162139893,
"step": 2655,
"valid_targets_mean": 3145.8,
"valid_targets_min": 324
},
{
"epoch": 4.382207578253706,
"grad_norm": 0.6907068990363627,
"learning_rate": 1.477073506116204e-05,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2808583080768585,
"step": 2660,
"valid_targets_mean": 3140.5,
"valid_targets_min": 270
},
{
"epoch": 4.3904448105436575,
"grad_norm": 0.6513537135662765,
"learning_rate": 1.469148265959028e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20921581983566284,
"step": 2665,
"valid_targets_mean": 3432.5,
"valid_targets_min": 1145
},
{
"epoch": 4.398682042833608,
"grad_norm": 0.7190243287207262,
"learning_rate": 1.4612319830914684e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19826185703277588,
"step": 2670,
"valid_targets_mean": 2480.8,
"valid_targets_min": 959
},
{
"epoch": 4.406919275123559,
"grad_norm": 0.6374744860830139,
"learning_rate": 1.4533247910883704e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17492321133613586,
"step": 2675,
"valid_targets_mean": 3242.9,
"valid_targets_min": 542
},
{
"epoch": 4.415156507413509,
"grad_norm": 0.736114349197071,
"learning_rate": 1.445426823371186e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15052483975887299,
"step": 2680,
"valid_targets_mean": 2257.1,
"valid_targets_min": 260
},
{
"epoch": 4.423393739703459,
"grad_norm": 0.6964652002410009,
"learning_rate": 1.4375382132057207e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18424688279628754,
"step": 2685,
"valid_targets_mean": 2731.6,
"valid_targets_min": 751
},
{
"epoch": 4.43163097199341,
"grad_norm": 0.6646723911201924,
"learning_rate": 1.4296590936998875e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1773110330104828,
"step": 2690,
"valid_targets_mean": 2841.5,
"valid_targets_min": 786
},
{
"epoch": 4.439868204283361,
"grad_norm": 0.7043596578211233,
"learning_rate": 1.4217895978014583e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15232154726982117,
"step": 2695,
"valid_targets_mean": 2430.2,
"valid_targets_min": 738
},
{
"epoch": 4.448105436573312,
"grad_norm": 0.8743360493221132,
"learning_rate": 1.4139298582958208e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20513039827346802,
"step": 2700,
"valid_targets_mean": 3039.7,
"valid_targets_min": 729
},
{
"epoch": 4.456342668863262,
"grad_norm": 0.7367043918610189,
"learning_rate": 1.4060800078037407e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24137605726718903,
"step": 2705,
"valid_targets_mean": 3009.7,
"valid_targets_min": 539
},
{
"epoch": 4.464579901153212,
"grad_norm": 0.6735512497948377,
"learning_rate": 1.3982401787791215e-05,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19957660138607025,
"step": 2710,
"valid_targets_mean": 3105.6,
"valid_targets_min": 1394
},
{
"epoch": 4.472817133443163,
"grad_norm": 0.6987608708119356,
"learning_rate": 1.3904105035067701e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18072089552879333,
"step": 2715,
"valid_targets_mean": 2651.4,
"valid_targets_min": 864
},
{
"epoch": 4.481054365733113,
"grad_norm": 0.718751412393381,
"learning_rate": 1.3825911141001637e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16804978251457214,
"step": 2720,
"valid_targets_mean": 2340.1,
"valid_targets_min": 567
},
{
"epoch": 4.4892915980230645,
"grad_norm": 0.7064126385360051,
"learning_rate": 1.3747821424992245e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2070191204547882,
"step": 2725,
"valid_targets_mean": 2916.1,
"valid_targets_min": 925
},
{
"epoch": 4.497528830313015,
"grad_norm": 0.6972537885141782,
"learning_rate": 1.3669837204680879e-05,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23842665553092957,
"step": 2730,
"valid_targets_mean": 2726.9,
"valid_targets_min": 638
},
{
"epoch": 4.505766062602966,
"grad_norm": 0.67473224143467,
"learning_rate": 1.3591959795928821e-05,
"loss": 0.2145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2541242241859436,
"step": 2735,
"valid_targets_mean": 3227.6,
"valid_targets_min": 278
},
{
"epoch": 4.514003294892916,
"grad_norm": 0.6398227567414478,
"learning_rate": 1.3514190512795096e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18463942408561707,
"step": 2740,
"valid_targets_mean": 3369.2,
"valid_targets_min": 768
},
{
"epoch": 4.522240527182866,
"grad_norm": 0.914208935807342,
"learning_rate": 1.3436530667514258e-05,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25415050983428955,
"step": 2745,
"valid_targets_mean": 2069.6,
"valid_targets_min": 260
},
{
"epoch": 4.530477759472817,
"grad_norm": 0.666232807251606,
"learning_rate": 1.3358981570474276e-05,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19541533291339874,
"step": 2750,
"valid_targets_mean": 3547.4,
"valid_targets_min": 440
},
{
"epoch": 4.538714991762768,
"grad_norm": 1.1834154877573295,
"learning_rate": 1.3281544530194412e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22194775938987732,
"step": 2755,
"valid_targets_mean": 2390.3,
"valid_targets_min": 352
},
{
"epoch": 4.546952224052719,
"grad_norm": 0.6988385348664411,
"learning_rate": 1.3204220853303157e-05,
"loss": 0.1899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1807519942522049,
"step": 2760,
"valid_targets_mean": 2474.5,
"valid_targets_min": 930
},
{
"epoch": 4.555189456342669,
"grad_norm": 0.6268602624217262,
"learning_rate": 1.3127011844516165e-05,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17390185594558716,
"step": 2765,
"valid_targets_mean": 2855.5,
"valid_targets_min": 364
},
{
"epoch": 4.563426688632619,
"grad_norm": 0.698300348357958,
"learning_rate": 1.304991880661425e-05,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18733061850070953,
"step": 2770,
"valid_targets_mean": 2874.1,
"valid_targets_min": 1214
},
{
"epoch": 4.57166392092257,
"grad_norm": 0.904490419197706,
"learning_rate": 1.2972943040421398e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1777077168226242,
"step": 2775,
"valid_targets_mean": 2739.2,
"valid_targets_min": 1111
},
{
"epoch": 4.5799011532125204,
"grad_norm": 0.7738385301230464,
"learning_rate": 1.2896085844782808e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19284678995609283,
"step": 2780,
"valid_targets_mean": 2336.1,
"valid_targets_min": 812
},
{
"epoch": 4.5881383855024716,
"grad_norm": 1.2378287916149417,
"learning_rate": 1.2819348516543003e-05,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1683550775051117,
"step": 2785,
"valid_targets_mean": 2737.6,
"valid_targets_min": 696
},
{
"epoch": 4.596375617792422,
"grad_norm": 0.6483004452802794,
"learning_rate": 1.2742732350523928e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20438411831855774,
"step": 2790,
"valid_targets_mean": 3092.1,
"valid_targets_min": 356
},
{
"epoch": 4.604612850082372,
"grad_norm": 0.6880072116270369,
"learning_rate": 1.2666238639503099e-05,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21004796028137207,
"step": 2795,
"valid_targets_mean": 2588.2,
"valid_targets_min": 866
},
{
"epoch": 4.612850082372323,
"grad_norm": 0.7996980024277847,
"learning_rate": 1.2589868674191794e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19884052872657776,
"step": 2800,
"valid_targets_mean": 2046.0,
"valid_targets_min": 979
},
{
"epoch": 4.621087314662273,
"grad_norm": 0.6228896426672722,
"learning_rate": 1.2513623743213297e-05,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1847865730524063,
"step": 2805,
"valid_targets_mean": 3417.0,
"valid_targets_min": 252
},
{
"epoch": 4.629324546952224,
"grad_norm": 0.714956059080542,
"learning_rate": 1.243750513308111e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20548203587532043,
"step": 2810,
"valid_targets_mean": 2715.6,
"valid_targets_min": 594
},
{
"epoch": 4.637561779242175,
"grad_norm": 0.746190840563027,
"learning_rate": 1.2361514128177286e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19804972410202026,
"step": 2815,
"valid_targets_mean": 2636.1,
"valid_targets_min": 711
},
{
"epoch": 4.645799011532125,
"grad_norm": 0.6236556080477057,
"learning_rate": 1.2285652010730727e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16948853433132172,
"step": 2820,
"valid_targets_mean": 3223.8,
"valid_targets_min": 246
},
{
"epoch": 4.654036243822076,
"grad_norm": 0.7487803781790527,
"learning_rate": 1.220992006079557e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18032564222812653,
"step": 2825,
"valid_targets_mean": 2885.8,
"valid_targets_min": 1173
},
{
"epoch": 4.662273476112026,
"grad_norm": 0.6953634890626381,
"learning_rate": 1.2134319556229577e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17370088398456573,
"step": 2830,
"valid_targets_mean": 2609.1,
"valid_targets_min": 636
},
{
"epoch": 4.670510708401977,
"grad_norm": 0.6207408692644977,
"learning_rate": 1.2058851772672569e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2368783950805664,
"step": 2835,
"valid_targets_mean": 4058.8,
"valid_targets_min": 718
},
{
"epoch": 4.6787479406919275,
"grad_norm": 0.7159596910910173,
"learning_rate": 1.1983517983524917e-05,
"loss": 0.2383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2987104654312134,
"step": 2840,
"valid_targets_mean": 4173.1,
"valid_targets_min": 1281
},
{
"epoch": 4.686985172981878,
"grad_norm": 0.7698653286065977,
"learning_rate": 1.1908319459926059e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2789364457130432,
"step": 2845,
"valid_targets_mean": 2637.2,
"valid_targets_min": 341
},
{
"epoch": 4.695222405271829,
"grad_norm": 0.6885585604727101,
"learning_rate": 1.183325747073301e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16655626893043518,
"step": 2850,
"valid_targets_mean": 2233.1,
"valid_targets_min": 762
},
{
"epoch": 4.703459637561779,
"grad_norm": 0.7000465338140921,
"learning_rate": 1.1758333282499004e-05,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18717628717422485,
"step": 2855,
"valid_targets_mean": 2459.1,
"valid_targets_min": 251
},
{
"epoch": 4.71169686985173,
"grad_norm": 0.649981251933767,
"learning_rate": 1.1683548159452083e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19186502695083618,
"step": 2860,
"valid_targets_mean": 3500.6,
"valid_targets_min": 1184
},
{
"epoch": 4.71993410214168,
"grad_norm": 0.7074888663516279,
"learning_rate": 1.1608903363473804e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14978522062301636,
"step": 2865,
"valid_targets_mean": 2693.1,
"valid_targets_min": 1092
},
{
"epoch": 4.7281713344316305,
"grad_norm": 0.5890780017197069,
"learning_rate": 1.1534400154077901e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18731525540351868,
"step": 2870,
"valid_targets_mean": 3308.1,
"valid_targets_min": 752
},
{
"epoch": 4.736408566721582,
"grad_norm": 0.62302716913029,
"learning_rate": 1.146003978838908e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20663988590240479,
"step": 2875,
"valid_targets_mean": 3739.2,
"valid_targets_min": 877
},
{
"epoch": 4.744645799011532,
"grad_norm": 0.7831927582297329,
"learning_rate": 1.1385823521121755e-05,
"loss": 0.1847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18367904424667358,
"step": 2880,
"valid_targets_mean": 2389.8,
"valid_targets_min": 646
},
{
"epoch": 4.752883031301483,
"grad_norm": 0.7136796015209697,
"learning_rate": 1.1311752604558945e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18837086856365204,
"step": 2885,
"valid_targets_mean": 2352.7,
"valid_targets_min": 867
},
{
"epoch": 4.761120263591433,
"grad_norm": 0.7417881865230119,
"learning_rate": 1.1237828288531065e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16705411672592163,
"step": 2890,
"valid_targets_mean": 2411.9,
"valid_targets_min": 295
},
{
"epoch": 4.769357495881383,
"grad_norm": 0.7278603551951753,
"learning_rate": 1.1164051820394903e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18239541351795197,
"step": 2895,
"valid_targets_mean": 2383.0,
"valid_targets_min": 377
},
{
"epoch": 4.7775947281713345,
"grad_norm": 0.7684800575498447,
"learning_rate": 1.1090424445012524e-05,
"loss": 0.1973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2619876265525818,
"step": 2900,
"valid_targets_mean": 2578.1,
"valid_targets_min": 753
},
{
"epoch": 4.785831960461285,
"grad_norm": 0.7762954518335069,
"learning_rate": 1.1016947404730302e-05,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2098005712032318,
"step": 2905,
"valid_targets_mean": 2469.4,
"valid_targets_min": 280
},
{
"epoch": 4.794069192751236,
"grad_norm": 0.6972231214453025,
"learning_rate": 1.0943621939357952e-05,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2021644413471222,
"step": 2910,
"valid_targets_mean": 2612.5,
"valid_targets_min": 799
},
{
"epoch": 4.802306425041186,
"grad_norm": 0.7647388529572376,
"learning_rate": 1.0870449286147565e-05,
"loss": 0.2031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24047201871871948,
"step": 2915,
"valid_targets_mean": 2461.9,
"valid_targets_min": 219
},
{
"epoch": 4.810543657331137,
"grad_norm": 0.6738602004759084,
"learning_rate": 1.07974306797728e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17990803718566895,
"step": 2920,
"valid_targets_mean": 3235.8,
"valid_targets_min": 1435
},
{
"epoch": 4.818780889621087,
"grad_norm": 0.6592140334086931,
"learning_rate": 1.0724567352308008e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20495711266994476,
"step": 2925,
"valid_targets_mean": 3125.3,
"valid_targets_min": 226
},
{
"epoch": 4.8270181219110375,
"grad_norm": 0.7407499909683418,
"learning_rate": 1.0651860533207448e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1599995195865631,
"step": 2930,
"valid_targets_mean": 3042.9,
"valid_targets_min": 935
},
{
"epoch": 4.835255354200989,
"grad_norm": 0.716775005898679,
"learning_rate": 1.0579311449284555e-05,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17676642537117004,
"step": 2935,
"valid_targets_mean": 2293.6,
"valid_targets_min": 777
},
{
"epoch": 4.843492586490939,
"grad_norm": 0.8291279498158952,
"learning_rate": 1.0506921324691209e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19918978214263916,
"step": 2940,
"valid_targets_mean": 2218.4,
"valid_targets_min": 1162
},
{
"epoch": 4.85172981878089,
"grad_norm": 0.6111907605345152,
"learning_rate": 1.0434691380897132e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18697769939899445,
"step": 2945,
"valid_targets_mean": 3431.4,
"valid_targets_min": 895
},
{
"epoch": 4.85996705107084,
"grad_norm": 0.7998141165292254,
"learning_rate": 1.0362622836669216e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1752634048461914,
"step": 2950,
"valid_targets_mean": 2012.6,
"valid_targets_min": 257
},
{
"epoch": 4.868204283360791,
"grad_norm": 0.7214959209341665,
"learning_rate": 1.0290716908051009e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23504498600959778,
"step": 2955,
"valid_targets_mean": 3218.4,
"valid_targets_min": 1304
},
{
"epoch": 4.8764415156507415,
"grad_norm": 0.6902196978381809,
"learning_rate": 1.0218974808342168e-05,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1906399428844452,
"step": 2960,
"valid_targets_mean": 2743.1,
"valid_targets_min": 322
},
{
"epoch": 4.884678747940692,
"grad_norm": 0.6282845815110746,
"learning_rate": 1.0147397748077999e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19511428475379944,
"step": 2965,
"valid_targets_mean": 3286.5,
"valid_targets_min": 385
},
{
"epoch": 4.892915980230643,
"grad_norm": 0.7362780284461559,
"learning_rate": 1.007598693500903e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19690576195716858,
"step": 2970,
"valid_targets_mean": 2372.4,
"valid_targets_min": 265
},
{
"epoch": 4.901153212520593,
"grad_norm": 0.6683978371796541,
"learning_rate": 1.0004743574080607e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1450890302658081,
"step": 2975,
"valid_targets_mean": 2457.7,
"valid_targets_min": 858
},
{
"epoch": 4.909390444810544,
"grad_norm": 0.6596995747936142,
"learning_rate": 9.93366886741261e-06,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22884449362754822,
"step": 2980,
"valid_targets_mean": 3525.4,
"valid_targets_min": 187
},
{
"epoch": 4.917627677100494,
"grad_norm": 0.7659921918500595,
"learning_rate": 9.862764014279134e-06,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2457534223794937,
"step": 2985,
"valid_targets_mean": 2558.6,
"valid_targets_min": 799
},
{
"epoch": 4.9258649093904445,
"grad_norm": 0.7799286605012021,
"learning_rate": 9.792030211088248e-06,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22971343994140625,
"step": 2990,
"valid_targets_mean": 2437.7,
"valid_targets_min": 330
},
{
"epoch": 4.934102141680396,
"grad_norm": 0.6320931491436543,
"learning_rate": 9.721468651361852e-06,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18385854363441467,
"step": 2995,
"valid_targets_mean": 3284.8,
"valid_targets_min": 696
},
{
"epoch": 4.942339373970346,
"grad_norm": 0.6523206752281229,
"learning_rate": 9.651080525715464e-06,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16642795503139496,
"step": 3000,
"valid_targets_mean": 3221.4,
"valid_targets_min": 1577
},
{
"epoch": 4.950576606260297,
"grad_norm": 0.6643564942274582,
"learning_rate": 9.580867021838234e-06,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2085125744342804,
"step": 3005,
"valid_targets_mean": 3377.6,
"valid_targets_min": 297
},
{
"epoch": 4.958813838550247,
"grad_norm": 0.6413957328149001,
"learning_rate": 9.510829324472784e-06,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25765886902809143,
"step": 3010,
"valid_targets_mean": 4052.6,
"valid_targets_min": 1031
},
{
"epoch": 4.967051070840197,
"grad_norm": 0.6990492677300354,
"learning_rate": 9.440968615395314e-06,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18069782853126526,
"step": 3015,
"valid_targets_mean": 2553.2,
"valid_targets_min": 1073
},
{
"epoch": 4.9752883031301485,
"grad_norm": 0.6736246492056246,
"learning_rate": 9.37128607339562e-06,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1594797819852829,
"step": 3020,
"valid_targets_mean": 2709.8,
"valid_targets_min": 290
},
{
"epoch": 4.983525535420099,
"grad_norm": 0.7071383567645622,
"learning_rate": 9.301782874257186e-06,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15425880253314972,
"step": 3025,
"valid_targets_mean": 2314.9,
"valid_targets_min": 345
},
{
"epoch": 4.99176276771005,
"grad_norm": 0.6562276890652816,
"learning_rate": 9.232460190737394e-06,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21255633234977722,
"step": 3030,
"valid_targets_mean": 4083.8,
"valid_targets_min": 1116
},
{
"epoch": 5.0,
"grad_norm": 0.7135456083913048,
"learning_rate": 9.163319192547702e-06,
"loss": 0.198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18922117352485657,
"step": 3035,
"valid_targets_mean": 2817.9,
"valid_targets_min": 766
},
{
"epoch": 5.00823723228995,
"grad_norm": 0.6064180034994974,
"learning_rate": 9.094361046333887e-06,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17224377393722534,
"step": 3040,
"valid_targets_mean": 3418.8,
"valid_targets_min": 1679
},
{
"epoch": 5.016474464579901,
"grad_norm": 0.6250290364668916,
"learning_rate": 9.025586915656435e-06,
"loss": 0.2112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19228821992874146,
"step": 3045,
"valid_targets_mean": 3741.3,
"valid_targets_min": 886
},
{
"epoch": 5.0247116968698515,
"grad_norm": 0.6608009238868802,
"learning_rate": 8.956997960970811e-06,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19262053072452545,
"step": 3050,
"valid_targets_mean": 3611.7,
"valid_targets_min": 839
},
{
"epoch": 5.032948929159803,
"grad_norm": 0.7772909122140956,
"learning_rate": 8.888595339607961e-06,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18313942849636078,
"step": 3055,
"valid_targets_mean": 2424.2,
"valid_targets_min": 356
},
{
"epoch": 5.041186161449753,
"grad_norm": 0.7689441961709437,
"learning_rate": 8.82038020575472e-06,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2497469037771225,
"step": 3060,
"valid_targets_mean": 2754.6,
"valid_targets_min": 290
},
{
"epoch": 5.049423393739703,
"grad_norm": 0.6503950444326292,
"learning_rate": 8.752353710434384e-06,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2629661560058594,
"step": 3065,
"valid_targets_mean": 4315.6,
"valid_targets_min": 980
},
{
"epoch": 5.057660626029654,
"grad_norm": 0.6604107548804747,
"learning_rate": 8.684517001487276e-06,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20543421804904938,
"step": 3070,
"valid_targets_mean": 3637.5,
"valid_targets_min": 287
},
{
"epoch": 5.065897858319604,
"grad_norm": 0.65130591346722,
"learning_rate": 8.616871223551335e-06,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1576567441225052,
"step": 3075,
"valid_targets_mean": 3172.4,
"valid_targets_min": 1218
},
{
"epoch": 5.0741350906095555,
"grad_norm": 0.7123187129434798,
"learning_rate": 8.549417518042899e-06,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19344539940357208,
"step": 3080,
"valid_targets_mean": 3020.7,
"valid_targets_min": 702
},
{
"epoch": 5.082372322899506,
"grad_norm": 0.684466499187168,
"learning_rate": 8.482157023137326e-06,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15878722071647644,
"step": 3085,
"valid_targets_mean": 3033.1,
"valid_targets_min": 1433
},
{
"epoch": 5.090609555189456,
"grad_norm": 0.6591878834846665,
"learning_rate": 8.415090873749882e-06,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14512422680854797,
"step": 3090,
"valid_targets_mean": 2839.8,
"valid_targets_min": 326
},
{
"epoch": 5.098846787479407,
"grad_norm": 0.7689559250431048,
"learning_rate": 8.348220201516559e-06,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2209683060646057,
"step": 3095,
"valid_targets_mean": 2806.2,
"valid_targets_min": 539
},
{
"epoch": 5.107084019769357,
"grad_norm": 0.6724369983360083,
"learning_rate": 8.281546134774952e-06,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1659250110387802,
"step": 3100,
"valid_targets_mean": 3220.8,
"valid_targets_min": 586
},
{
"epoch": 5.115321252059308,
"grad_norm": 0.6592543385028731,
"learning_rate": 8.215069798545272e-06,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23743778467178345,
"step": 3105,
"valid_targets_mean": 3924.8,
"valid_targets_min": 1061
},
{
"epoch": 5.1235584843492585,
"grad_norm": 0.7140903108295529,
"learning_rate": 8.148792314511338e-06,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18408019840717316,
"step": 3110,
"valid_targets_mean": 2868.4,
"valid_targets_min": 279
},
{
"epoch": 5.13179571663921,
"grad_norm": 0.899945522646544,
"learning_rate": 8.082714801001619e-06,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1668897271156311,
"step": 3115,
"valid_targets_mean": 1955.2,
"valid_targets_min": 809
},
{
"epoch": 5.14003294892916,
"grad_norm": 0.7903726889847759,
"learning_rate": 8.016838372970453e-06,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19560575485229492,
"step": 3120,
"valid_targets_mean": 2365.5,
"valid_targets_min": 850
},
{
"epoch": 5.14827018121911,
"grad_norm": 0.6437043381500877,
"learning_rate": 7.951164141979115e-06,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22203288972377777,
"step": 3125,
"valid_targets_mean": 3675.4,
"valid_targets_min": 1346
},
{
"epoch": 5.156507413509061,
"grad_norm": 0.6355970111306471,
"learning_rate": 7.885693216177166e-06,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17794297635555267,
"step": 3130,
"valid_targets_mean": 3428.3,
"valid_targets_min": 993
},
{
"epoch": 5.164744645799011,
"grad_norm": 0.6602780647849495,
"learning_rate": 7.820426700283681e-06,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1728067845106125,
"step": 3135,
"valid_targets_mean": 3440.2,
"valid_targets_min": 988
},
{
"epoch": 5.1729818780889625,
"grad_norm": 0.7558597560486282,
"learning_rate": 7.75536569556866e-06,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20588910579681396,
"step": 3140,
"valid_targets_mean": 2655.5,
"valid_targets_min": 814
},
{
"epoch": 5.181219110378913,
"grad_norm": 0.7254810135039633,
"learning_rate": 7.690511299834422e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1662125587463379,
"step": 3145,
"valid_targets_mean": 2955.9,
"valid_targets_min": 311
},
{
"epoch": 5.189456342668863,
"grad_norm": 0.8088311377677032,
"learning_rate": 7.625864607397066e-06,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25056391954421997,
"step": 3150,
"valid_targets_mean": 2665.3,
"valid_targets_min": 565
},
{
"epoch": 5.197693574958814,
"grad_norm": 0.6600076683827095,
"learning_rate": 7.561426709068045e-06,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18403570353984833,
"step": 3155,
"valid_targets_mean": 3254.5,
"valid_targets_min": 728
},
{
"epoch": 5.205930807248764,
"grad_norm": 0.5798390366412892,
"learning_rate": 7.497198692135728e-06,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14264634251594543,
"step": 3160,
"valid_targets_mean": 4274.8,
"valid_targets_min": 1430
},
{
"epoch": 5.214168039538715,
"grad_norm": 0.8075445062618977,
"learning_rate": 7.433181640347069e-06,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17545044422149658,
"step": 3165,
"valid_targets_mean": 3412.2,
"valid_targets_min": 219
},
{
"epoch": 5.2224052718286655,
"grad_norm": 0.8096547199240914,
"learning_rate": 7.369376633889325e-06,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15541712939739227,
"step": 3170,
"valid_targets_mean": 2235.3,
"valid_targets_min": 204
},
{
"epoch": 5.230642504118616,
"grad_norm": 0.7262956103025833,
"learning_rate": 7.305784749371792e-06,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.218002587556839,
"step": 3175,
"valid_targets_mean": 3621.4,
"valid_targets_min": 1416
},
{
"epoch": 5.238879736408567,
"grad_norm": 0.7538387339240314,
"learning_rate": 7.242407059807703e-06,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20847590267658234,
"step": 3180,
"valid_targets_mean": 2906.4,
"valid_targets_min": 900
},
{
"epoch": 5.247116968698517,
"grad_norm": 0.6712012846940215,
"learning_rate": 7.1792446345960585e-06,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1522168517112732,
"step": 3185,
"valid_targets_mean": 2999.8,
"valid_targets_min": 335
},
{
"epoch": 5.255354200988468,
"grad_norm": 0.7008582088098334,
"learning_rate": 7.116298539503632e-06,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15230123698711395,
"step": 3190,
"valid_targets_mean": 2597.4,
"valid_targets_min": 212
},
{
"epoch": 5.263591433278418,
"grad_norm": 0.6913752679862281,
"learning_rate": 7.053569836646954e-06,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16717877984046936,
"step": 3195,
"valid_targets_mean": 3209.5,
"valid_targets_min": 445
},
{
"epoch": 5.2718286655683695,
"grad_norm": 0.6501280031713065,
"learning_rate": 6.991059584474411e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15155775845050812,
"step": 3200,
"valid_targets_mean": 3640.1,
"valid_targets_min": 244
},
{
"epoch": 5.28006589785832,
"grad_norm": 0.7765572752139934,
"learning_rate": 6.928768837748374e-06,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1907849758863449,
"step": 3205,
"valid_targets_mean": 2407.2,
"valid_targets_min": 1252
},
{
"epoch": 5.28830313014827,
"grad_norm": 0.7092172752068605,
"learning_rate": 6.866698647527392e-06,
"loss": 0.1899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19017310440540314,
"step": 3210,
"valid_targets_mean": 2805.6,
"valid_targets_min": 776
},
{
"epoch": 5.296540362438221,
"grad_norm": 0.8973485963057156,
"learning_rate": 6.804850061148485e-06,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1752794086933136,
"step": 3215,
"valid_targets_mean": 2147.9,
"valid_targets_min": 677
},
{
"epoch": 5.304777594728171,
"grad_norm": 0.707169418301808,
"learning_rate": 6.7432241222094595e-06,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20905683934688568,
"step": 3220,
"valid_targets_mean": 3281.1,
"valid_targets_min": 724
},
{
"epoch": 5.313014827018122,
"grad_norm": 0.632264893798177,
"learning_rate": 6.68182187055127e-06,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13711237907409668,
"step": 3225,
"valid_targets_mean": 3425.3,
"valid_targets_min": 847
},
{
"epoch": 5.3212520593080725,
"grad_norm": 0.6416477054286873,
"learning_rate": 6.620644342240534e-06,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15817886590957642,
"step": 3230,
"valid_targets_mean": 3488.2,
"valid_targets_min": 585
},
{
"epoch": 5.329489291598023,
"grad_norm": 0.7253505491366616,
"learning_rate": 6.559692569551976e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18176016211509705,
"step": 3235,
"valid_targets_mean": 2424.8,
"valid_targets_min": 965
},
{
"epoch": 5.337726523887974,
"grad_norm": 0.7467293463976239,
"learning_rate": 6.498967580951099e-06,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1569557785987854,
"step": 3240,
"valid_targets_mean": 2483.9,
"valid_targets_min": 1182
},
{
"epoch": 5.345963756177924,
"grad_norm": 0.8565193699113087,
"learning_rate": 6.4384704010767284e-06,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18094724416732788,
"step": 3245,
"valid_targets_mean": 2141.0,
"valid_targets_min": 260
},
{
"epoch": 5.354200988467875,
"grad_norm": 0.7269022982597675,
"learning_rate": 6.37820205072381e-06,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.121427983045578,
"step": 3250,
"valid_targets_mean": 2299.0,
"valid_targets_min": 1207
},
{
"epoch": 5.362438220757825,
"grad_norm": 0.7414210784723774,
"learning_rate": 6.318163546826141e-06,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17040827870368958,
"step": 3255,
"valid_targets_mean": 2556.3,
"valid_targets_min": 265
},
{
"epoch": 5.370675453047776,
"grad_norm": 0.7458160033756344,
"learning_rate": 6.258355902439211e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14077043533325195,
"step": 3260,
"valid_targets_mean": 2237.4,
"valid_targets_min": 1025
},
{
"epoch": 5.378912685337727,
"grad_norm": 0.8342015753026745,
"learning_rate": 6.198780126723127e-06,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14754045009613037,
"step": 3265,
"valid_targets_mean": 1824.2,
"valid_targets_min": 402
},
{
"epoch": 5.387149917627677,
"grad_norm": 0.7694290384969541,
"learning_rate": 6.139437224925586e-06,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1629246175289154,
"step": 3270,
"valid_targets_mean": 2445.3,
"valid_targets_min": 845
},
{
"epoch": 5.395387149917628,
"grad_norm": 0.8433928744995592,
"learning_rate": 6.080328198364871e-06,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2084483504295349,
"step": 3275,
"valid_targets_mean": 2179.2,
"valid_targets_min": 633
},
{
"epoch": 5.403624382207578,
"grad_norm": 0.6765682861675392,
"learning_rate": 6.021454044413036e-06,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2180410623550415,
"step": 3280,
"valid_targets_mean": 3277.3,
"valid_targets_min": 1020
},
{
"epoch": 5.4118616144975284,
"grad_norm": 0.8357652595647097,
"learning_rate": 5.962815756478979e-06,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1691618412733078,
"step": 3285,
"valid_targets_mean": 2519.4,
"valid_targets_min": 878
},
{
"epoch": 5.4200988467874796,
"grad_norm": 0.7365400222373201,
"learning_rate": 5.904414323991758e-06,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17638184130191803,
"step": 3290,
"valid_targets_mean": 2686.8,
"valid_targets_min": 358
},
{
"epoch": 5.42833607907743,
"grad_norm": 0.7247240550977059,
"learning_rate": 5.846250732383869e-06,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24847513437271118,
"step": 3295,
"valid_targets_mean": 3847.8,
"valid_targets_min": 698
},
{
"epoch": 5.436573311367381,
"grad_norm": 0.7198196895329133,
"learning_rate": 5.788325963074594e-06,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17607322335243225,
"step": 3300,
"valid_targets_mean": 3049.2,
"valid_targets_min": 260
},
{
"epoch": 5.444810543657331,
"grad_norm": 0.8022615837890243,
"learning_rate": 5.7306409934534936e-06,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18957354128360748,
"step": 3305,
"valid_targets_mean": 2815.9,
"valid_targets_min": 796
},
{
"epoch": 5.453047775947281,
"grad_norm": 0.7703287318099119,
"learning_rate": 5.673196796863852e-06,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19865599274635315,
"step": 3310,
"valid_targets_mean": 3163.5,
"valid_targets_min": 1041
},
{
"epoch": 5.461285008237232,
"grad_norm": 0.6861868123941506,
"learning_rate": 5.615994342586313e-06,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.160249724984169,
"step": 3315,
"valid_targets_mean": 2706.8,
"valid_targets_min": 1026
},
{
"epoch": 5.469522240527183,
"grad_norm": 0.7519375725202005,
"learning_rate": 5.5590345958224875e-06,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19434326887130737,
"step": 3320,
"valid_targets_mean": 2473.9,
"valid_targets_min": 357
},
{
"epoch": 5.477759472817134,
"grad_norm": 0.7034008504710153,
"learning_rate": 5.502318517678682e-06,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13975057005882263,
"step": 3325,
"valid_targets_mean": 2624.3,
"valid_targets_min": 380
},
{
"epoch": 5.485996705107084,
"grad_norm": 0.8591217062074403,
"learning_rate": 5.445847065149679e-06,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19654160737991333,
"step": 3330,
"valid_targets_mean": 2530.1,
"valid_targets_min": 647
},
{
"epoch": 5.494233937397034,
"grad_norm": 0.8338393901784925,
"learning_rate": 5.389621191102574e-06,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19803670048713684,
"step": 3335,
"valid_targets_mean": 3171.4,
"valid_targets_min": 925
},
{
"epoch": 5.502471169686985,
"grad_norm": 0.8232013140154525,
"learning_rate": 5.333641844260726e-06,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21081340312957764,
"step": 3340,
"valid_targets_mean": 2620.4,
"valid_targets_min": 607
},
{
"epoch": 5.5107084019769355,
"grad_norm": 0.7263973632736029,
"learning_rate": 5.277909969187738e-06,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11975730210542679,
"step": 3345,
"valid_targets_mean": 2141.7,
"valid_targets_min": 552
},
{
"epoch": 5.518945634266887,
"grad_norm": 0.7175609162042647,
"learning_rate": 5.222426506271492e-06,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15939165651798248,
"step": 3350,
"valid_targets_mean": 3050.1,
"valid_targets_min": 746
},
{
"epoch": 5.527182866556837,
"grad_norm": 0.748834509252294,
"learning_rate": 5.1671923917083265e-06,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18665283918380737,
"step": 3355,
"valid_targets_mean": 2947.6,
"valid_targets_min": 927
},
{
"epoch": 5.535420098846787,
"grad_norm": 0.915756061799089,
"learning_rate": 5.112208557487215e-06,
"loss": 0.2002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17622342705726624,
"step": 3360,
"valid_targets_mean": 3114.1,
"valid_targets_min": 776
},
{
"epoch": 5.543657331136738,
"grad_norm": 0.6861044823588834,
"learning_rate": 5.057475931374043e-06,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15702880918979645,
"step": 3365,
"valid_targets_mean": 3333.8,
"valid_targets_min": 283
},
{
"epoch": 5.551894563426688,
"grad_norm": 0.5651714611404062,
"learning_rate": 5.002995436895939e-06,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19566282629966736,
"step": 3370,
"valid_targets_mean": 4441.9,
"valid_targets_min": 1039
},
{
"epoch": 5.560131795716639,
"grad_norm": 0.6967484805438395,
"learning_rate": 4.9487679933257225e-06,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17878486216068268,
"step": 3375,
"valid_targets_mean": 3512.9,
"valid_targets_min": 977
},
{
"epoch": 5.56836902800659,
"grad_norm": 0.8309410288700217,
"learning_rate": 4.894794515666379e-06,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1670929193496704,
"step": 3380,
"valid_targets_mean": 2985.6,
"valid_targets_min": 791
},
{
"epoch": 5.576606260296541,
"grad_norm": 0.8303611692984448,
"learning_rate": 4.8410759146355955e-06,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16505856812000275,
"step": 3385,
"valid_targets_mean": 2491.2,
"valid_targets_min": 940
},
{
"epoch": 5.584843492586491,
"grad_norm": 0.7021211702845122,
"learning_rate": 4.787613096650436e-06,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12547199428081512,
"step": 3390,
"valid_targets_mean": 3197.2,
"valid_targets_min": 706
},
{
"epoch": 5.593080724876441,
"grad_norm": 0.6982593083876117,
"learning_rate": 4.734406963812024e-06,
"loss": 0.146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16671398282051086,
"step": 3395,
"valid_targets_mean": 3031.1,
"valid_targets_min": 651
},
{
"epoch": 5.601317957166392,
"grad_norm": 0.7983795110267299,
"learning_rate": 4.68145841389032e-06,
"loss": 0.1836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2452123761177063,
"step": 3400,
"valid_targets_mean": 3621.4,
"valid_targets_min": 868
},
{
"epoch": 5.6095551894563425,
"grad_norm": 0.6939388117607412,
"learning_rate": 4.6287683403089845e-06,
"loss": 0.1965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1813758760690689,
"step": 3405,
"valid_targets_mean": 3380.9,
"valid_targets_min": 1276
},
{
"epoch": 5.617792421746294,
"grad_norm": 0.7353689335564925,
"learning_rate": 4.576337632130281e-06,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14547865092754364,
"step": 3410,
"valid_targets_mean": 2548.1,
"valid_targets_min": 750
},
{
"epoch": 5.626029654036244,
"grad_norm": 0.6926011113099905,
"learning_rate": 4.524167174040106e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14587116241455078,
"step": 3415,
"valid_targets_mean": 2785.8,
"valid_targets_min": 288
},
{
"epoch": 5.634266886326195,
"grad_norm": 0.7100090253616618,
"learning_rate": 4.472257846333028e-06,
"loss": 0.1419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12672248482704163,
"step": 3420,
"valid_targets_mean": 2911.2,
"valid_targets_min": 1017
},
{
"epoch": 5.642504118616145,
"grad_norm": 0.8387847090896776,
"learning_rate": 4.4206105248974595e-06,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17093172669410706,
"step": 3425,
"valid_targets_mean": 2210.1,
"valid_targets_min": 633
},
{
"epoch": 5.650741350906095,
"grad_norm": 0.8135873943654238,
"learning_rate": 4.3692260812008795e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1717970371246338,
"step": 3430,
"valid_targets_mean": 2176.8,
"valid_targets_min": 866
},
{
"epoch": 5.658978583196046,
"grad_norm": 0.7923907688849422,
"learning_rate": 4.318105382275084e-06,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2087642252445221,
"step": 3435,
"valid_targets_mean": 2451.8,
"valid_targets_min": 666
},
{
"epoch": 5.667215815485997,
"grad_norm": 0.6638888534023216,
"learning_rate": 4.267249290701636e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17858381569385529,
"step": 3440,
"valid_targets_mean": 3964.4,
"valid_targets_min": 307
},
{
"epoch": 5.675453047775948,
"grad_norm": 0.8617516970063258,
"learning_rate": 4.216658664597224e-06,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18910962343215942,
"step": 3445,
"valid_targets_mean": 2019.4,
"valid_targets_min": 506
},
{
"epoch": 5.683690280065898,
"grad_norm": 0.7634977977727311,
"learning_rate": 4.166334357599246e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1956837773323059,
"step": 3450,
"valid_targets_mean": 2368.8,
"valid_targets_min": 562
},
{
"epoch": 5.691927512355848,
"grad_norm": 0.7838029896349801,
"learning_rate": 4.116277218851383e-06,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17025712132453918,
"step": 3455,
"valid_targets_mean": 2937.7,
"valid_targets_min": 668
},
{
"epoch": 5.700164744645799,
"grad_norm": 0.7044949991777757,
"learning_rate": 4.066488092989256e-06,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2160659283399582,
"step": 3460,
"valid_targets_mean": 3333.1,
"valid_targets_min": 1031
},
{
"epoch": 5.7084019769357495,
"grad_norm": 0.9783577658970115,
"learning_rate": 4.016967820126205e-06,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18528926372528076,
"step": 3465,
"valid_targets_mean": 2410.6,
"valid_targets_min": 683
},
{
"epoch": 5.716639209225701,
"grad_norm": 0.7036357285381335,
"learning_rate": 3.967717235839086e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1655019372701645,
"step": 3470,
"valid_targets_mean": 2925.2,
"valid_targets_min": 834
},
{
"epoch": 5.724876441515651,
"grad_norm": 0.6713767526809996,
"learning_rate": 3.918737171154192e-06,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13649466633796692,
"step": 3475,
"valid_targets_mean": 2739.8,
"valid_targets_min": 230
},
{
"epoch": 5.733113673805601,
"grad_norm": 0.7714880924709924,
"learning_rate": 3.870028452533221e-06,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1947619915008545,
"step": 3480,
"valid_targets_mean": 2570.9,
"valid_targets_min": 708
},
{
"epoch": 5.741350906095552,
"grad_norm": 0.6732219111117853,
"learning_rate": 3.8215919018593295e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13189196586608887,
"step": 3485,
"valid_targets_mean": 3156.6,
"valid_targets_min": 1248
},
{
"epoch": 5.749588138385502,
"grad_norm": 0.7828985393778445,
"learning_rate": 3.7734283364232747e-06,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14875520765781403,
"step": 3490,
"valid_targets_mean": 2533.2,
"valid_targets_min": 685
},
{
"epoch": 5.757825370675453,
"grad_norm": 0.6734972968776775,
"learning_rate": 3.725538568909599e-06,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20598509907722473,
"step": 3495,
"valid_targets_mean": 3320.4,
"valid_targets_min": 327
},
{
"epoch": 5.766062602965404,
"grad_norm": 0.6820313312676656,
"learning_rate": 3.6779234073829528e-06,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16222935914993286,
"step": 3500,
"valid_targets_mean": 3013.1,
"valid_targets_min": 414
},
{
"epoch": 5.774299835255354,
"grad_norm": 0.6881508771610351,
"learning_rate": 3.63058365527444e-06,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17598870396614075,
"step": 3505,
"valid_targets_mean": 3021.1,
"valid_targets_min": 260
},
{
"epoch": 5.782537067545305,
"grad_norm": 0.9256567228616236,
"learning_rate": 3.5835201113680463e-06,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18399620056152344,
"step": 3510,
"valid_targets_mean": 3049.4,
"valid_targets_min": 780
},
{
"epoch": 5.790774299835255,
"grad_norm": 0.7127835516858468,
"learning_rate": 3.536733569787194e-06,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14168041944503784,
"step": 3515,
"valid_targets_mean": 2699.2,
"valid_targets_min": 1104
},
{
"epoch": 5.799011532125206,
"grad_norm": 0.7360005045380545,
"learning_rate": 3.4902248199813203e-06,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13892826437950134,
"step": 3520,
"valid_targets_mean": 2244.3,
"valid_targets_min": 602
},
{
"epoch": 5.8072487644151565,
"grad_norm": 0.7455487123063135,
"learning_rate": 3.443994646712567e-06,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16907833516597748,
"step": 3525,
"valid_targets_mean": 2390.0,
"valid_targets_min": 781
},
{
"epoch": 5.815485996705107,
"grad_norm": 0.7953720238270837,
"learning_rate": 3.3980438300425324e-06,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1514473408460617,
"step": 3530,
"valid_targets_mean": 2531.9,
"valid_targets_min": 838
},
{
"epoch": 5.823723228995058,
"grad_norm": 0.8642656461553999,
"learning_rate": 3.3523731453190987e-06,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16404001414775848,
"step": 3535,
"valid_targets_mean": 1984.9,
"valid_targets_min": 808
},
{
"epoch": 5.831960461285008,
"grad_norm": 0.7256800913138621,
"learning_rate": 3.306983363163381e-06,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12058289349079132,
"step": 3540,
"valid_targets_mean": 2846.2,
"valid_targets_min": 786
},
{
"epoch": 5.840197693574959,
"grad_norm": 0.8398559139673432,
"learning_rate": 3.2618752494566854e-06,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21678978204727173,
"step": 3545,
"valid_targets_mean": 2182.9,
"valid_targets_min": 807
},
{
"epoch": 5.848434925864909,
"grad_norm": 0.6879487573765043,
"learning_rate": 3.217049565327619e-06,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13484476506710052,
"step": 3550,
"valid_targets_mean": 2719.2,
"valid_targets_min": 688
},
{
"epoch": 5.8566721581548595,
"grad_norm": 0.8490732841663783,
"learning_rate": 3.17250706713923e-06,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21391984820365906,
"step": 3555,
"valid_targets_mean": 2457.4,
"valid_targets_min": 241
},
{
"epoch": 5.864909390444811,
"grad_norm": 0.7426460128321304,
"learning_rate": 3.128248506476246e-06,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14091576635837555,
"step": 3560,
"valid_targets_mean": 2596.6,
"valid_targets_min": 245
},
{
"epoch": 5.873146622734761,
"grad_norm": 0.7853668676403339,
"learning_rate": 3.0842746301324e-06,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17900870740413666,
"step": 3565,
"valid_targets_mean": 2629.8,
"valid_targets_min": 848
},
{
"epoch": 5.881383855024712,
"grad_norm": 0.6294725390125606,
"learning_rate": 3.040586180097811e-06,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14573122560977936,
"step": 3570,
"valid_targets_mean": 3388.9,
"valid_targets_min": 980
},
{
"epoch": 5.889621087314662,
"grad_norm": 0.635131125967507,
"learning_rate": 2.9971838935464915e-06,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18714481592178345,
"step": 3575,
"valid_targets_mean": 3639.6,
"valid_targets_min": 1601
},
{
"epoch": 5.897858319604612,
"grad_norm": 0.6935148132102796,
"learning_rate": 2.9540685028238925e-06,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18102405965328217,
"step": 3580,
"valid_targets_mean": 2775.3,
"valid_targets_min": 318
},
{
"epoch": 5.9060955518945635,
"grad_norm": 0.8574201407311213,
"learning_rate": 2.9112407354345375e-06,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605670988559723,
"step": 3585,
"valid_targets_mean": 2246.1,
"valid_targets_min": 327
},
{
"epoch": 5.914332784184514,
"grad_norm": 0.9115993171771825,
"learning_rate": 2.8687013140297695e-06,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1853502094745636,
"step": 3590,
"valid_targets_mean": 2516.3,
"valid_targets_min": 1178
},
{
"epoch": 5.922570016474465,
"grad_norm": 0.711616625135048,
"learning_rate": 2.826450956395532e-06,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21265952289104462,
"step": 3595,
"valid_targets_mean": 3306.9,
"valid_targets_min": 1654
},
{
"epoch": 5.930807248764415,
"grad_norm": 0.6932061364220065,
"learning_rate": 2.7844903754402963e-06,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19808021187782288,
"step": 3600,
"valid_targets_mean": 3391.8,
"valid_targets_min": 346
},
{
"epoch": 5.939044481054366,
"grad_norm": 0.7566426671217025,
"learning_rate": 2.7428202791829763e-06,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16674354672431946,
"step": 3605,
"valid_targets_mean": 2808.9,
"valid_targets_min": 287
},
{
"epoch": 5.947281713344316,
"grad_norm": 0.8418388087549749,
"learning_rate": 2.7014413707410357e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16913406550884247,
"step": 3610,
"valid_targets_mean": 2207.9,
"valid_targets_min": 644
},
{
"epoch": 5.9555189456342665,
"grad_norm": 0.7988681269945298,
"learning_rate": 2.6603543483185966e-06,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.159542053937912,
"step": 3615,
"valid_targets_mean": 2564.2,
"valid_targets_min": 687
},
{
"epoch": 5.963756177924218,
"grad_norm": 1.2032980721393542,
"learning_rate": 2.6195599051946465e-06,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19994597136974335,
"step": 3620,
"valid_targets_mean": 2516.3,
"valid_targets_min": 987
},
{
"epoch": 5.971993410214168,
"grad_norm": 0.7714977813745794,
"learning_rate": 2.579058729711379e-06,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1823139488697052,
"step": 3625,
"valid_targets_mean": 2836.2,
"valid_targets_min": 263
},
{
"epoch": 5.980230642504119,
"grad_norm": 0.8014540368577482,
"learning_rate": 2.538851505262545e-06,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15929174423217773,
"step": 3630,
"valid_targets_mean": 2114.4,
"valid_targets_min": 320
},
{
"epoch": 5.988467874794069,
"grad_norm": 0.7461862435721606,
"learning_rate": 2.498938910281927e-06,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1749926060438156,
"step": 3635,
"valid_targets_mean": 2477.5,
"valid_targets_min": 770
},
{
"epoch": 5.996705107084019,
"grad_norm": 0.7368517970426673,
"learning_rate": 2.4593216182319203e-06,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15466895699501038,
"step": 3640,
"valid_targets_mean": 2621.8,
"valid_targets_min": 245
},
{
"epoch": 6.0049423393739705,
"grad_norm": 1.1139077443534142,
"learning_rate": 2.42000029759212e-06,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14994430541992188,
"step": 3645,
"valid_targets_mean": 2619.9,
"valid_targets_min": 636
},
{
"epoch": 6.013179571663921,
"grad_norm": 0.7501461411955563,
"learning_rate": 2.3809756118480887e-06,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1623890995979309,
"step": 3650,
"valid_targets_mean": 2354.2,
"valid_targets_min": 614
},
{
"epoch": 6.021416803953872,
"grad_norm": 0.6157972732215693,
"learning_rate": 2.3422482194801257e-06,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15174467861652374,
"step": 3655,
"valid_targets_mean": 3239.4,
"valid_targets_min": 764
},
{
"epoch": 6.029654036243822,
"grad_norm": 0.7350556411709983,
"learning_rate": 2.30381877395218e-06,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17065928876399994,
"step": 3660,
"valid_targets_mean": 2507.8,
"valid_targets_min": 650
},
{
"epoch": 6.037891268533772,
"grad_norm": 0.6901704684540658,
"learning_rate": 2.265687923700821e-06,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16900062561035156,
"step": 3665,
"valid_targets_mean": 2752.2,
"valid_targets_min": 1188
},
{
"epoch": 6.046128500823723,
"grad_norm": 0.7086734284825671,
"learning_rate": 2.2278563121242722e-06,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20763811469078064,
"step": 3670,
"valid_targets_mean": 3084.0,
"valid_targets_min": 307
},
{
"epoch": 6.0543657331136735,
"grad_norm": 0.6385356293662908,
"learning_rate": 2.190324577571592e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14509770274162292,
"step": 3675,
"valid_targets_mean": 3518.7,
"valid_targets_min": 527
},
{
"epoch": 6.062602965403625,
"grad_norm": 0.7028174328512578,
"learning_rate": 2.153093353331881e-06,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15137967467308044,
"step": 3680,
"valid_targets_mean": 3283.1,
"valid_targets_min": 246
},
{
"epoch": 6.070840197693575,
"grad_norm": 0.7222091137953284,
"learning_rate": 2.1161632676235967e-06,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20794406533241272,
"step": 3685,
"valid_targets_mean": 3220.8,
"valid_targets_min": 219
},
{
"epoch": 6.079077429983526,
"grad_norm": 0.6855245337047342,
"learning_rate": 2.0795349435839606e-06,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12052720040082932,
"step": 3690,
"valid_targets_mean": 2771.8,
"valid_targets_min": 281
},
{
"epoch": 6.087314662273476,
"grad_norm": 0.707804572172083,
"learning_rate": 2.0432089992584326e-06,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15237155556678772,
"step": 3695,
"valid_targets_mean": 2842.4,
"valid_targets_min": 1123
},
{
"epoch": 6.095551894563426,
"grad_norm": 0.6707345478391269,
"learning_rate": 2.007186047590297e-06,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14419394731521606,
"step": 3700,
"valid_targets_mean": 3254.1,
"valid_targets_min": 849
},
{
"epoch": 6.1037891268533775,
"grad_norm": 0.7003141972567551,
"learning_rate": 1.971466696410309e-06,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1416216790676117,
"step": 3705,
"valid_targets_mean": 2684.4,
"valid_targets_min": 1045
},
{
"epoch": 6.112026359143328,
"grad_norm": 0.7825738433775659,
"learning_rate": 1.936051548426443e-06,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1420452892780304,
"step": 3710,
"valid_targets_mean": 2350.9,
"valid_targets_min": 338
},
{
"epoch": 6.120263591433279,
"grad_norm": 0.7115145095325718,
"learning_rate": 1.9009412012137218e-06,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1335878074169159,
"step": 3715,
"valid_targets_mean": 2756.2,
"valid_targets_min": 251
},
{
"epoch": 6.128500823723229,
"grad_norm": 0.6743967837978332,
"learning_rate": 1.8661362472041355e-06,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1492428481578827,
"step": 3720,
"valid_targets_mean": 2904.1,
"valid_targets_min": 725
},
{
"epoch": 6.136738056013179,
"grad_norm": 0.7703129690601694,
"learning_rate": 1.8316372736766452e-06,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20545321702957153,
"step": 3725,
"valid_targets_mean": 3010.5,
"valid_targets_min": 278
},
{
"epoch": 6.14497528830313,
"grad_norm": 0.7888666022596672,
"learning_rate": 1.7974448627472618e-06,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17078402638435364,
"step": 3730,
"valid_targets_mean": 2981.3,
"valid_targets_min": 766
},
{
"epoch": 6.1532125205930805,
"grad_norm": 0.7723578107116098,
"learning_rate": 1.763559591359243e-06,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1601790189743042,
"step": 3735,
"valid_targets_mean": 2846.0,
"valid_targets_min": 298
},
{
"epoch": 6.161449752883032,
"grad_norm": 0.6714966512844651,
"learning_rate": 1.7299820312733518e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19277028739452362,
"step": 3740,
"valid_targets_mean": 4139.1,
"valid_targets_min": 334
},
{
"epoch": 6.169686985172982,
"grad_norm": 0.6556105712174505,
"learning_rate": 1.6967127490581892e-06,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1665448248386383,
"step": 3745,
"valid_targets_mean": 3238.6,
"valid_targets_min": 747
},
{
"epoch": 6.177924217462932,
"grad_norm": 0.7965390505057974,
"learning_rate": 1.6637523060806749e-06,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16333314776420593,
"step": 3750,
"valid_targets_mean": 2388.4,
"valid_targets_min": 783
},
{
"epoch": 6.186161449752883,
"grad_norm": 0.66375569184018,
"learning_rate": 1.6311012584965257e-06,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21853406727313995,
"step": 3755,
"valid_targets_mean": 3801.9,
"valid_targets_min": 317
},
{
"epoch": 6.194398682042833,
"grad_norm": 0.669378716443229,
"learning_rate": 1.5987601572409195e-06,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1353456974029541,
"step": 3760,
"valid_targets_mean": 3566.6,
"valid_targets_min": 275
},
{
"epoch": 6.2026359143327845,
"grad_norm": 0.7658647113291661,
"learning_rate": 1.566729548019168e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1602291613817215,
"step": 3765,
"valid_targets_mean": 2423.1,
"valid_targets_min": 937
},
{
"epoch": 6.210873146622735,
"grad_norm": 0.6590955988866615,
"learning_rate": 1.5350099712975097e-06,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12900327146053314,
"step": 3770,
"valid_targets_mean": 3467.8,
"valid_targets_min": 789
},
{
"epoch": 6.219110378912685,
"grad_norm": 0.6919074917450025,
"learning_rate": 1.50360196229401e-06,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2072930634021759,
"step": 3775,
"valid_targets_mean": 3171.7,
"valid_targets_min": 969
},
{
"epoch": 6.227347611202636,
"grad_norm": 0.874989495696985,
"learning_rate": 1.4725060509695088e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21609821915626526,
"step": 3780,
"valid_targets_mean": 2349.0,
"valid_targets_min": 716
},
{
"epoch": 6.235584843492586,
"grad_norm": 0.7463878847371747,
"learning_rate": 1.4417227620186935e-06,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16198115050792694,
"step": 3785,
"valid_targets_mean": 2775.0,
"valid_targets_min": 299
},
{
"epoch": 6.243822075782537,
"grad_norm": 0.6615073957168196,
"learning_rate": 1.4112526148612381e-06,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12445035576820374,
"step": 3790,
"valid_targets_mean": 2758.4,
"valid_targets_min": 586
},
{
"epoch": 6.2520593080724876,
"grad_norm": 0.6921577907753451,
"learning_rate": 1.3810961236330345e-06,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1393837332725525,
"step": 3795,
"valid_targets_mean": 3353.4,
"valid_targets_min": 1125
},
{
"epoch": 6.260296540362438,
"grad_norm": 0.8382225209020714,
"learning_rate": 1.3512537971775407e-06,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19350308179855347,
"step": 3800,
"valid_targets_mean": 2176.9,
"valid_targets_min": 731
},
{
"epoch": 6.268533772652389,
"grad_norm": 0.6084781353758029,
"learning_rate": 1.321726139037156e-06,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1659453809261322,
"step": 3805,
"valid_targets_mean": 3997.4,
"valid_targets_min": 797
},
{
"epoch": 6.276771004942339,
"grad_norm": 0.7719108277276304,
"learning_rate": 1.2925136474447575e-06,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.155721515417099,
"step": 3810,
"valid_targets_mean": 2487.1,
"valid_targets_min": 219
},
{
"epoch": 6.28500823723229,
"grad_norm": 0.6385197418328769,
"learning_rate": 1.2636168153152828e-06,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13569995760917664,
"step": 3815,
"valid_targets_mean": 3099.1,
"valid_targets_min": 391
},
{
"epoch": 6.29324546952224,
"grad_norm": 0.7174793871853767,
"learning_rate": 1.2350361302374037e-06,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1641596257686615,
"step": 3820,
"valid_targets_mean": 2929.2,
"valid_targets_min": 760
},
{
"epoch": 6.3014827018121915,
"grad_norm": 0.651538874031102,
"learning_rate": 1.2067720744653167e-06,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12000978738069534,
"step": 3825,
"valid_targets_mean": 2685.2,
"valid_targets_min": 939
},
{
"epoch": 6.309719934102142,
"grad_norm": 0.8511093562682773,
"learning_rate": 1.178825124910583e-06,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23789116740226746,
"step": 3830,
"valid_targets_mean": 2482.9,
"valid_targets_min": 896
},
{
"epoch": 6.317957166392092,
"grad_norm": 0.6180405933314328,
"learning_rate": 1.1511957531341067e-06,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11477728188037872,
"step": 3835,
"valid_targets_mean": 3123.0,
"valid_targets_min": 811
},
{
"epoch": 6.326194398682043,
"grad_norm": 0.6803850559923774,
"learning_rate": 1.123884425338162e-06,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1466941237449646,
"step": 3840,
"valid_targets_mean": 3088.1,
"valid_targets_min": 944
},
{
"epoch": 6.334431630971993,
"grad_norm": 0.7546973039836182,
"learning_rate": 1.0968916023585252e-06,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14515511691570282,
"step": 3845,
"valid_targets_mean": 2963.4,
"valid_targets_min": 941
},
{
"epoch": 6.342668863261944,
"grad_norm": 0.8849963117408646,
"learning_rate": 1.0702177396567114e-06,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2112627923488617,
"step": 3850,
"valid_targets_mean": 1949.1,
"valid_targets_min": 345
},
{
"epoch": 6.350906095551895,
"grad_norm": 0.7459355712021345,
"learning_rate": 1.0438632873122746e-06,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15826204419136047,
"step": 3855,
"valid_targets_mean": 2619.4,
"valid_targets_min": 677
},
{
"epoch": 6.359143327841845,
"grad_norm": 0.7772343391993064,
"learning_rate": 1.0178286900152234e-06,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23661720752716064,
"step": 3860,
"valid_targets_mean": 2736.1,
"valid_targets_min": 836
},
{
"epoch": 6.367380560131796,
"grad_norm": 0.6357761439560725,
"learning_rate": 9.921143870585204e-07,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19213977456092834,
"step": 3865,
"valid_targets_mean": 3818.3,
"valid_targets_min": 618
},
{
"epoch": 6.375617792421746,
"grad_norm": 0.7752815261134633,
"learning_rate": 9.667208123306504e-07,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1300448477268219,
"step": 3870,
"valid_targets_mean": 2181.9,
"valid_targets_min": 335
},
{
"epoch": 6.383855024711697,
"grad_norm": 1.0569445961287538,
"learning_rate": 9.416483943083254e-07,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16549789905548096,
"step": 3875,
"valid_targets_mean": 3206.5,
"valid_targets_min": 1031
},
{
"epoch": 6.392092257001647,
"grad_norm": 0.7208101885756489,
"learning_rate": 9.168975560492365e-07,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14495733380317688,
"step": 3880,
"valid_targets_mean": 3358.2,
"valid_targets_min": 1197
},
{
"epoch": 6.400329489291598,
"grad_norm": 0.7429014255052777,
"learning_rate": 8.924687151849287e-07,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14917151629924774,
"step": 3885,
"valid_targets_mean": 2492.2,
"valid_targets_min": 890
},
{
"epoch": 6.408566721581549,
"grad_norm": 0.7462560187876585,
"learning_rate": 8.683622839137306e-07,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23635666072368622,
"step": 3890,
"valid_targets_mean": 2909.4,
"valid_targets_min": 923
},
{
"epoch": 6.416803953871499,
"grad_norm": 0.8102243606807108,
"learning_rate": 8.445786689938295e-07,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12910988926887512,
"step": 3895,
"valid_targets_mean": 2163.8,
"valid_targets_min": 429
},
{
"epoch": 6.42504118616145,
"grad_norm": 0.80398663184621,
"learning_rate": 8.211182717363897e-07,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19596856832504272,
"step": 3900,
"valid_targets_mean": 2539.6,
"valid_targets_min": 857
},
{
"epoch": 6.4332784184514,
"grad_norm": 0.7481982084445109,
"learning_rate": 7.979814879987824e-07,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17043043673038483,
"step": 3905,
"valid_targets_mean": 2694.1,
"valid_targets_min": 799
},
{
"epoch": 6.441515650741351,
"grad_norm": 0.6789946169423258,
"learning_rate": 7.751687081779091e-07,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19388365745544434,
"step": 3910,
"valid_targets_mean": 3303.7,
"valid_targets_min": 347
},
{
"epoch": 6.449752883031302,
"grad_norm": 0.6422614423127603,
"learning_rate": 7.526803172036157e-07,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11945605278015137,
"step": 3915,
"valid_targets_mean": 2707.4,
"valid_targets_min": 184
},
{
"epoch": 6.457990115321252,
"grad_norm": 0.7156633329528237,
"learning_rate": 7.305166945321973e-07,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19679643213748932,
"step": 3920,
"valid_targets_mean": 3079.4,
"valid_targets_min": 875
},
{
"epoch": 6.466227347611203,
"grad_norm": 0.7680662464415903,
"learning_rate": 7.086782141399906e-07,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1780366599559784,
"step": 3925,
"valid_targets_mean": 2651.0,
"valid_targets_min": 460
},
{
"epoch": 6.474464579901153,
"grad_norm": 1.0095018002402179,
"learning_rate": 6.871652445170651e-07,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1527692675590515,
"step": 3930,
"valid_targets_mean": 3270.0,
"valid_targets_min": 258
},
{
"epoch": 6.482701812191104,
"grad_norm": 0.8515545672589472,
"learning_rate": 6.659781486610129e-07,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22965921461582184,
"step": 3935,
"valid_targets_mean": 3471.1,
"valid_targets_min": 1364
},
{
"epoch": 6.490939044481054,
"grad_norm": 0.712226673890132,
"learning_rate": 6.451172840708087e-07,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16279277205467224,
"step": 3940,
"valid_targets_mean": 3104.0,
"valid_targets_min": 460
},
{
"epoch": 6.499176276771005,
"grad_norm": 0.7787226581803016,
"learning_rate": 6.245830027407973e-07,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16567203402519226,
"step": 3945,
"valid_targets_mean": 2723.2,
"valid_targets_min": 649
},
{
"epoch": 6.507413509060956,
"grad_norm": 0.7502856008513566,
"learning_rate": 6.043756511547427e-07,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16041092574596405,
"step": 3950,
"valid_targets_mean": 3132.1,
"valid_targets_min": 248
},
{
"epoch": 6.515650741350906,
"grad_norm": 0.675892844554783,
"learning_rate": 5.84495570279966e-07,
"loss": 0.1602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15754902362823486,
"step": 3955,
"valid_targets_mean": 3227.8,
"valid_targets_min": 304
},
{
"epoch": 6.523887973640857,
"grad_norm": 0.7664735528399342,
"learning_rate": 5.649430955616365e-07,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18401801586151123,
"step": 3960,
"valid_targets_mean": 2677.6,
"valid_targets_min": 821
},
{
"epoch": 6.532125205930807,
"grad_norm": 0.8538927050950035,
"learning_rate": 5.457185569170609e-07,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1640760451555252,
"step": 3965,
"valid_targets_mean": 2824.4,
"valid_targets_min": 319
},
{
"epoch": 6.5403624382207575,
"grad_norm": 0.7882400286252053,
"learning_rate": 5.268222787301502e-07,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17009207606315613,
"step": 3970,
"valid_targets_mean": 2632.1,
"valid_targets_min": 783
},
{
"epoch": 6.548599670510709,
"grad_norm": 0.7311404280782681,
"learning_rate": 5.082545798459348e-07,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18268424272537231,
"step": 3975,
"valid_targets_mean": 3112.3,
"valid_targets_min": 702
},
{
"epoch": 6.556836902800659,
"grad_norm": 0.7146800124090497,
"learning_rate": 4.900157735651779e-07,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.163301020860672,
"step": 3980,
"valid_targets_mean": 3048.5,
"valid_targets_min": 964
},
{
"epoch": 6.56507413509061,
"grad_norm": 0.7405738502525695,
"learning_rate": 4.721061676391081e-07,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14739716053009033,
"step": 3985,
"valid_targets_mean": 2616.9,
"valid_targets_min": 321
},
{
"epoch": 6.57331136738056,
"grad_norm": 0.7244028411140117,
"learning_rate": 4.5452606426420466e-07,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1695755273103714,
"step": 3990,
"valid_targets_mean": 3027.8,
"valid_targets_min": 257
},
{
"epoch": 6.58154859967051,
"grad_norm": 0.7322525481149665,
"learning_rate": 4.372757600771116e-07,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2116568684577942,
"step": 3995,
"valid_targets_mean": 3028.4,
"valid_targets_min": 917
},
{
"epoch": 6.589785831960461,
"grad_norm": 0.7470670386639713,
"learning_rate": 4.203555461496378e-07,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15893974900245667,
"step": 4000,
"valid_targets_mean": 3174.8,
"valid_targets_min": 731
},
{
"epoch": 6.598023064250412,
"grad_norm": 0.8075055424213986,
"learning_rate": 4.0376570798382084e-07,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15712273120880127,
"step": 4005,
"valid_targets_mean": 2127.1,
"valid_targets_min": 259
},
{
"epoch": 6.606260296540363,
"grad_norm": 0.7269307165713284,
"learning_rate": 3.875065255071442e-07,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24262076616287231,
"step": 4010,
"valid_targets_mean": 3033.4,
"valid_targets_min": 989
},
{
"epoch": 6.614497528830313,
"grad_norm": 0.9343679862401862,
"learning_rate": 3.715782730677786e-07,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1790003478527069,
"step": 4015,
"valid_targets_mean": 1810.2,
"valid_targets_min": 620
},
{
"epoch": 6.622734761120263,
"grad_norm": 0.7559108888626762,
"learning_rate": 3.559812194299794e-07,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2013910859823227,
"step": 4020,
"valid_targets_mean": 3094.5,
"valid_targets_min": 1049
},
{
"epoch": 6.630971993410214,
"grad_norm": 0.7245273592521206,
"learning_rate": 3.407156277695456e-07,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1565759778022766,
"step": 4025,
"valid_targets_mean": 4298.2,
"valid_targets_min": 935
},
{
"epoch": 6.6392092257001645,
"grad_norm": 0.6500329190512484,
"learning_rate": 3.257817556693654e-07,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11484387516975403,
"step": 4030,
"valid_targets_mean": 2797.9,
"valid_targets_min": 779
},
{
"epoch": 6.647446457990116,
"grad_norm": 0.7052895181792681,
"learning_rate": 3.1117985511508686e-07,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.132914736866951,
"step": 4035,
"valid_targets_mean": 2802.5,
"valid_targets_min": 438
},
{
"epoch": 6.655683690280066,
"grad_norm": 0.7468505902354071,
"learning_rate": 2.969101724908585e-07,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2299904227256775,
"step": 4040,
"valid_targets_mean": 3584.6,
"valid_targets_min": 978
},
{
"epoch": 6.663920922570016,
"grad_norm": 0.7150895108441544,
"learning_rate": 2.829729485751731e-07,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14426125586032867,
"step": 4045,
"valid_targets_mean": 2814.2,
"valid_targets_min": 382
},
{
"epoch": 6.672158154859967,
"grad_norm": 0.5991220098063653,
"learning_rate": 2.6936841853680397e-07,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12172479182481766,
"step": 4050,
"valid_targets_mean": 3342.2,
"valid_targets_min": 405
},
{
"epoch": 6.680395387149917,
"grad_norm": 0.6822342950062912,
"learning_rate": 2.560968119308349e-07,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19796040654182434,
"step": 4055,
"valid_targets_mean": 3490.1,
"valid_targets_min": 838
},
{
"epoch": 6.688632619439868,
"grad_norm": 0.6514055359914713,
"learning_rate": 2.4315835269479446e-07,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1311188042163849,
"step": 4060,
"valid_targets_mean": 3191.2,
"valid_targets_min": 380
},
{
"epoch": 6.696869851729819,
"grad_norm": 0.7294000714400222,
"learning_rate": 2.305532591448678e-07,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14557018876075745,
"step": 4065,
"valid_targets_mean": 2508.8,
"valid_targets_min": 724
},
{
"epoch": 6.70510708401977,
"grad_norm": 0.5934845642808244,
"learning_rate": 2.1828174397222179e-07,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12286630272865295,
"step": 4070,
"valid_targets_mean": 3624.8,
"valid_targets_min": 843
},
{
"epoch": 6.71334431630972,
"grad_norm": 0.7921124334514694,
"learning_rate": 2.0634401423940797e-07,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18661408126354218,
"step": 4075,
"valid_targets_mean": 2451.5,
"valid_targets_min": 717
},
{
"epoch": 6.72158154859967,
"grad_norm": 0.5932236802274212,
"learning_rate": 1.9474027137687425e-07,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.183675616979599,
"step": 4080,
"valid_targets_mean": 4072.7,
"valid_targets_min": 808
},
{
"epoch": 6.729818780889621,
"grad_norm": 0.793939849451655,
"learning_rate": 1.834707111795675e-07,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18774361908435822,
"step": 4085,
"valid_targets_mean": 2594.6,
"valid_targets_min": 743
},
{
"epoch": 6.7380560131795715,
"grad_norm": 0.7977767421315517,
"learning_rate": 1.725355238036208e-07,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23956944048404694,
"step": 4090,
"valid_targets_mean": 2484.7,
"valid_targets_min": 271
},
{
"epoch": 6.746293245469523,
"grad_norm": 0.8987888128978652,
"learning_rate": 1.6193489376315375e-07,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18341073393821716,
"step": 4095,
"valid_targets_mean": 1867.1,
"valid_targets_min": 346
},
{
"epoch": 6.754530477759473,
"grad_norm": 0.7775999067743287,
"learning_rate": 1.5166899992715922e-07,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15121757984161377,
"step": 4100,
"valid_targets_mean": 2914.3,
"valid_targets_min": 287
},
{
"epoch": 6.762767710049423,
"grad_norm": 0.8019192495560047,
"learning_rate": 1.417380155164727e-07,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22095879912376404,
"step": 4105,
"valid_targets_mean": 2675.8,
"valid_targets_min": 239
},
{
"epoch": 6.771004942339374,
"grad_norm": 0.8608991084693377,
"learning_rate": 1.3214210810087224e-07,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19388195872306824,
"step": 4110,
"valid_targets_mean": 2775.4,
"valid_targets_min": 915
},
{
"epoch": 6.779242174629324,
"grad_norm": 0.6496355441738153,
"learning_rate": 1.2288143959622523e-07,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1336159110069275,
"step": 4115,
"valid_targets_mean": 3077.2,
"valid_targets_min": 935
},
{
"epoch": 6.787479406919275,
"grad_norm": 0.9623189464394726,
"learning_rate": 1.1395616626177718e-07,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18686145544052124,
"step": 4120,
"valid_targets_mean": 1904.4,
"valid_targets_min": 377
},
{
"epoch": 6.795716639209226,
"grad_norm": 0.8506497654414124,
"learning_rate": 1.0536643869750508e-07,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23170790076255798,
"step": 4125,
"valid_targets_mean": 2162.9,
"valid_targets_min": 1039
},
{
"epoch": 6.803953871499177,
"grad_norm": 0.647365705379033,
"learning_rate": 9.711240184157255e-08,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19694972038269043,
"step": 4130,
"valid_targets_mean": 4015.7,
"valid_targets_min": 1299
},
{
"epoch": 6.812191103789127,
"grad_norm": 0.6899146547611903,
"learning_rate": 8.919419496789428e-08,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13986879587173462,
"step": 4135,
"valid_targets_mean": 3022.9,
"valid_targets_min": 1184
},
{
"epoch": 6.820428336079077,
"grad_norm": 0.6826690079265932,
"learning_rate": 8.161195168378211e-08,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13281051814556122,
"step": 4140,
"valid_targets_mean": 3272.3,
"valid_targets_min": 232
},
{
"epoch": 6.828665568369028,
"grad_norm": 0.6641391234585438,
"learning_rate": 7.4365799927687e-08,
"loss": 0.1595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14258205890655518,
"step": 4145,
"valid_targets_mean": 3228.8,
"valid_targets_min": 1676
},
{
"epoch": 6.8369028006589785,
"grad_norm": 0.6748162422562181,
"learning_rate": 6.745586196704512e-08,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14117348194122314,
"step": 4150,
"valid_targets_mean": 3223.8,
"valid_targets_min": 377
},
{
"epoch": 6.84514003294893,
"grad_norm": 0.8649156647091603,
"learning_rate": 6.088225439620621e-08,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.216533362865448,
"step": 4155,
"valid_targets_mean": 2923.2,
"valid_targets_min": 610
},
{
"epoch": 6.85337726523888,
"grad_norm": 0.9134316166153748,
"learning_rate": 5.464508813448621e-08,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17572906613349915,
"step": 4160,
"valid_targets_mean": 2606.5,
"valid_targets_min": 290
},
{
"epoch": 6.86161449752883,
"grad_norm": 0.6317158342753643,
"learning_rate": 4.874446842426883e-08,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13150852918624878,
"step": 4165,
"valid_targets_mean": 3455.3,
"valid_targets_min": 1075
},
{
"epoch": 6.869851729818781,
"grad_norm": 0.78925360032166,
"learning_rate": 4.318049482924913e-08,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1530526578426361,
"step": 4170,
"valid_targets_mean": 2389.6,
"valid_targets_min": 708
},
{
"epoch": 6.878088962108731,
"grad_norm": 0.6158559873310975,
"learning_rate": 3.7953261232743785e-08,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1563345193862915,
"step": 4175,
"valid_targets_mean": 3645.4,
"valid_targets_min": 848
},
{
"epoch": 6.886326194398682,
"grad_norm": 0.8168240860097061,
"learning_rate": 3.3062855836119014e-08,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15081787109375,
"step": 4180,
"valid_targets_mean": 2565.6,
"valid_targets_min": 1303
},
{
"epoch": 6.894563426688633,
"grad_norm": 0.6402154892970332,
"learning_rate": 2.8509361157285088e-08,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2066039741039276,
"step": 4185,
"valid_targets_mean": 4142.2,
"valid_targets_min": 326
},
{
"epoch": 6.902800658978583,
"grad_norm": 0.6139396948124894,
"learning_rate": 2.429285402931525e-08,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13339337706565857,
"step": 4190,
"valid_targets_mean": 3607.2,
"valid_targets_min": 776
},
{
"epoch": 6.911037891268534,
"grad_norm": 0.8049219522828062,
"learning_rate": 2.041340559914895e-08,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16743309795856476,
"step": 4195,
"valid_targets_mean": 2342.8,
"valid_targets_min": 611
},
{
"epoch": 6.919275123558484,
"grad_norm": 0.7235236484755135,
"learning_rate": 1.6871081326388372e-08,
"loss": 0.1475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1539749652147293,
"step": 4200,
"valid_targets_mean": 2721.6,
"valid_targets_min": 255
},
{
"epoch": 6.927512355848435,
"grad_norm": 0.6996590910363392,
"learning_rate": 1.366594098219487e-08,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14047235250473022,
"step": 4205,
"valid_targets_mean": 3126.0,
"valid_targets_min": 340
},
{
"epoch": 6.9357495881383855,
"grad_norm": 0.9081681836064551,
"learning_rate": 1.0798038648278664e-08,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15091955661773682,
"step": 4210,
"valid_targets_mean": 2809.3,
"valid_targets_min": 829
},
{
"epoch": 6.943986820428336,
"grad_norm": 0.6676226069756183,
"learning_rate": 8.26742271598846e-09,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17465578019618988,
"step": 4215,
"valid_targets_mean": 3463.6,
"valid_targets_min": 915
},
{
"epoch": 6.952224052718287,
"grad_norm": 0.7700986208930122,
"learning_rate": 6.074135885498767e-09,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17234516143798828,
"step": 4220,
"valid_targets_mean": 2481.6,
"valid_targets_min": 943
},
{
"epoch": 6.960461285008237,
"grad_norm": 0.679973114052915,
"learning_rate": 4.218215165077144e-09,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1480589061975479,
"step": 4225,
"valid_targets_mean": 3207.2,
"valid_targets_min": 287
},
{
"epoch": 6.968698517298188,
"grad_norm": 1.0661673612936513,
"learning_rate": 2.699691870473586e-09,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14552760124206543,
"step": 4230,
"valid_targets_mean": 2714.8,
"valid_targets_min": 832
},
{
"epoch": 6.976935749588138,
"grad_norm": 0.7275517602358317,
"learning_rate": 1.5185916243876108e-09,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17081902921199799,
"step": 4235,
"valid_targets_mean": 2979.4,
"valid_targets_min": 1228
},
{
"epoch": 6.9851729818780885,
"grad_norm": 0.8670521747754626,
"learning_rate": 6.749343560286114e-10,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18648138642311096,
"step": 4240,
"valid_targets_mean": 2214.1,
"valid_targets_min": 311
},
{
"epoch": 6.99341021416804,
"grad_norm": 0.8106614308590394,
"learning_rate": 1.6873430078945264e-10,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2821575999259949,
"step": 4245,
"valid_targets_mean": 3544.4,
"valid_targets_min": 980
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17179973423480988,
"step": 4249,
"total_flos": 835464024555520.0,
"train_loss": 0.2412474821612088,
"train_runtime": 18396.3609,
"train_samples_per_second": 3.695,
"train_steps_per_second": 0.231,
"valid_targets_mean": 2603.9,
"valid_targets_min": 249
}
],
"logging_steps": 5,
"max_steps": 4249,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 835464024555520.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}