penfever's picture
End of training
3560cbb verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 2814,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.012437810945273632,
"grad_norm": 13.380951406456147,
"learning_rate": 5.673758865248227e-07,
"loss": 0.7822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7657574415206909,
"step": 5,
"valid_targets_mean": 4010.9,
"valid_targets_min": 1767
},
{
"epoch": 0.024875621890547265,
"grad_norm": 12.545654526351226,
"learning_rate": 1.276595744680851e-06,
"loss": 0.8056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8114880919456482,
"step": 10,
"valid_targets_mean": 3892.8,
"valid_targets_min": 2200
},
{
"epoch": 0.03731343283582089,
"grad_norm": 9.667916880642556,
"learning_rate": 1.9858156028368797e-06,
"loss": 0.7418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6924527287483215,
"step": 15,
"valid_targets_mean": 4415.2,
"valid_targets_min": 1889
},
{
"epoch": 0.04975124378109453,
"grad_norm": 6.112913024339798,
"learning_rate": 2.695035460992908e-06,
"loss": 0.6973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.668594241142273,
"step": 20,
"valid_targets_mean": 3674.9,
"valid_targets_min": 191
},
{
"epoch": 0.06218905472636816,
"grad_norm": 4.866305911621686,
"learning_rate": 3.4042553191489363e-06,
"loss": 0.6624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.644311785697937,
"step": 25,
"valid_targets_mean": 3697.1,
"valid_targets_min": 355
},
{
"epoch": 0.07462686567164178,
"grad_norm": 4.31903460986635,
"learning_rate": 4.113475177304965e-06,
"loss": 0.6025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.569460391998291,
"step": 30,
"valid_targets_mean": 4055.9,
"valid_targets_min": 1675
},
{
"epoch": 0.08706467661691543,
"grad_norm": 1.8781712293982455,
"learning_rate": 4.822695035460993e-06,
"loss": 0.5493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5322237014770508,
"step": 35,
"valid_targets_mean": 3793.4,
"valid_targets_min": 1413
},
{
"epoch": 0.09950248756218906,
"grad_norm": 1.3648445070279718,
"learning_rate": 5.531914893617022e-06,
"loss": 0.5353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5094773769378662,
"step": 40,
"valid_targets_mean": 3781.3,
"valid_targets_min": 1421
},
{
"epoch": 0.11194029850746269,
"grad_norm": 0.9598535483295971,
"learning_rate": 6.24113475177305e-06,
"loss": 0.4963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4716443717479706,
"step": 45,
"valid_targets_mean": 4314.4,
"valid_targets_min": 1362
},
{
"epoch": 0.12437810945273632,
"grad_norm": 0.8095195355924959,
"learning_rate": 6.950354609929079e-06,
"loss": 0.4842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4684237241744995,
"step": 50,
"valid_targets_mean": 4619.2,
"valid_targets_min": 2128
},
{
"epoch": 0.13681592039800994,
"grad_norm": 0.9535042747879249,
"learning_rate": 7.659574468085107e-06,
"loss": 0.4799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.502250611782074,
"step": 55,
"valid_targets_mean": 3554.8,
"valid_targets_min": 2013
},
{
"epoch": 0.14925373134328357,
"grad_norm": 0.7738334376355982,
"learning_rate": 8.368794326241135e-06,
"loss": 0.4574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49030762910842896,
"step": 60,
"valid_targets_mean": 3948.2,
"valid_targets_min": 2060
},
{
"epoch": 0.16169154228855723,
"grad_norm": 0.7133304690095129,
"learning_rate": 9.078014184397164e-06,
"loss": 0.4319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41507917642593384,
"step": 65,
"valid_targets_mean": 4287.1,
"valid_targets_min": 2085
},
{
"epoch": 0.17412935323383086,
"grad_norm": 0.6718539217454166,
"learning_rate": 9.787234042553192e-06,
"loss": 0.4215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41251397132873535,
"step": 70,
"valid_targets_mean": 4147.2,
"valid_targets_min": 2291
},
{
"epoch": 0.1865671641791045,
"grad_norm": 0.6888672437166001,
"learning_rate": 1.049645390070922e-05,
"loss": 0.422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4331628978252411,
"step": 75,
"valid_targets_mean": 3984.5,
"valid_targets_min": 1357
},
{
"epoch": 0.19900497512437812,
"grad_norm": 0.7612883410877886,
"learning_rate": 1.120567375886525e-05,
"loss": 0.3944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3932691514492035,
"step": 80,
"valid_targets_mean": 3577.6,
"valid_targets_min": 1628
},
{
"epoch": 0.21144278606965175,
"grad_norm": 0.6889250639530377,
"learning_rate": 1.1914893617021277e-05,
"loss": 0.3975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4268104135990143,
"step": 85,
"valid_targets_mean": 4420.2,
"valid_targets_min": 2703
},
{
"epoch": 0.22388059701492538,
"grad_norm": 0.7389874437127749,
"learning_rate": 1.2624113475177307e-05,
"loss": 0.3817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38703107833862305,
"step": 90,
"valid_targets_mean": 3759.1,
"valid_targets_min": 2311
},
{
"epoch": 0.236318407960199,
"grad_norm": 0.6632832871080014,
"learning_rate": 1.3333333333333333e-05,
"loss": 0.3705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3471001982688904,
"step": 95,
"valid_targets_mean": 4546.7,
"valid_targets_min": 2457
},
{
"epoch": 0.24875621890547264,
"grad_norm": 0.6773454789521931,
"learning_rate": 1.4042553191489363e-05,
"loss": 0.3705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37445783615112305,
"step": 100,
"valid_targets_mean": 3990.8,
"valid_targets_min": 1875
},
{
"epoch": 0.26119402985074625,
"grad_norm": 0.5679953534246097,
"learning_rate": 1.475177304964539e-05,
"loss": 0.35,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3382793068885803,
"step": 105,
"valid_targets_mean": 5048.9,
"valid_targets_min": 1979
},
{
"epoch": 0.2736318407960199,
"grad_norm": 0.6335472342807328,
"learning_rate": 1.546099290780142e-05,
"loss": 0.3527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36811989545822144,
"step": 110,
"valid_targets_mean": 3544.6,
"valid_targets_min": 2019
},
{
"epoch": 0.2860696517412935,
"grad_norm": 0.5873605193729509,
"learning_rate": 1.6170212765957446e-05,
"loss": 0.35,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3602096438407898,
"step": 115,
"valid_targets_mean": 4335.9,
"valid_targets_min": 2097
},
{
"epoch": 0.29850746268656714,
"grad_norm": 0.6603180715772641,
"learning_rate": 1.6879432624113476e-05,
"loss": 0.3513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36116451025009155,
"step": 120,
"valid_targets_mean": 3368.5,
"valid_targets_min": 1322
},
{
"epoch": 0.31094527363184077,
"grad_norm": 0.6177290895347114,
"learning_rate": 1.7588652482269506e-05,
"loss": 0.3454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35631102323532104,
"step": 125,
"valid_targets_mean": 4271.0,
"valid_targets_min": 2572
},
{
"epoch": 0.32338308457711445,
"grad_norm": 0.5970279991046994,
"learning_rate": 1.8297872340425533e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3269408345222473,
"step": 130,
"valid_targets_mean": 4144.0,
"valid_targets_min": 2433
},
{
"epoch": 0.3358208955223881,
"grad_norm": 0.6988436544880555,
"learning_rate": 1.9007092198581563e-05,
"loss": 0.3462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3329390287399292,
"step": 135,
"valid_targets_mean": 3773.1,
"valid_targets_min": 1880
},
{
"epoch": 0.3482587064676617,
"grad_norm": 0.5663119370039671,
"learning_rate": 1.971631205673759e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33959251642227173,
"step": 140,
"valid_targets_mean": 5226.4,
"valid_targets_min": 1685
},
{
"epoch": 0.36069651741293535,
"grad_norm": 0.7382656927862868,
"learning_rate": 2.0425531914893616e-05,
"loss": 0.3288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2998434901237488,
"step": 145,
"valid_targets_mean": 3405.1,
"valid_targets_min": 1997
},
{
"epoch": 0.373134328358209,
"grad_norm": 0.6399598041440727,
"learning_rate": 2.113475177304965e-05,
"loss": 0.3285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3149760365486145,
"step": 150,
"valid_targets_mean": 4147.7,
"valid_targets_min": 1051
},
{
"epoch": 0.3855721393034826,
"grad_norm": 0.6190347784845001,
"learning_rate": 2.1843971631205676e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32194218039512634,
"step": 155,
"valid_targets_mean": 3982.0,
"valid_targets_min": 1776
},
{
"epoch": 0.39800995024875624,
"grad_norm": 0.6629989034109828,
"learning_rate": 2.2553191489361703e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29769569635391235,
"step": 160,
"valid_targets_mean": 3653.1,
"valid_targets_min": 2275
},
{
"epoch": 0.41044776119402987,
"grad_norm": 0.6705243113369573,
"learning_rate": 2.326241134751773e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31587380170822144,
"step": 165,
"valid_targets_mean": 4081.2,
"valid_targets_min": 2034
},
{
"epoch": 0.4228855721393035,
"grad_norm": 0.9424068832053736,
"learning_rate": 2.3971631205673763e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3107619285583496,
"step": 170,
"valid_targets_mean": 3648.3,
"valid_targets_min": 1597
},
{
"epoch": 0.43532338308457713,
"grad_norm": 0.6511358668082933,
"learning_rate": 2.468085106382979e-05,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34112197160720825,
"step": 175,
"valid_targets_mean": 3819.4,
"valid_targets_min": 1782
},
{
"epoch": 0.44776119402985076,
"grad_norm": 0.6476380044242603,
"learning_rate": 2.5390070921985816e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29842424392700195,
"step": 180,
"valid_targets_mean": 3789.5,
"valid_targets_min": 1876
},
{
"epoch": 0.4601990049751244,
"grad_norm": 0.627368462104055,
"learning_rate": 2.609929078014185e-05,
"loss": 0.3129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33267688751220703,
"step": 185,
"valid_targets_mean": 4517.8,
"valid_targets_min": 228
},
{
"epoch": 0.472636815920398,
"grad_norm": 0.6466632344322205,
"learning_rate": 2.6808510638297876e-05,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29927682876586914,
"step": 190,
"valid_targets_mean": 4185.9,
"valid_targets_min": 1492
},
{
"epoch": 0.48507462686567165,
"grad_norm": 0.6662800469045165,
"learning_rate": 2.7517730496453903e-05,
"loss": 0.3151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3514325022697449,
"step": 195,
"valid_targets_mean": 4175.0,
"valid_targets_min": 443
},
{
"epoch": 0.4975124378109453,
"grad_norm": 0.6517689188685865,
"learning_rate": 2.822695035460993e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3168841302394867,
"step": 200,
"valid_targets_mean": 4177.4,
"valid_targets_min": 853
},
{
"epoch": 0.5099502487562189,
"grad_norm": 0.6855031086226197,
"learning_rate": 2.8936170212765963e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2854161858558655,
"step": 205,
"valid_targets_mean": 3589.5,
"valid_targets_min": 1106
},
{
"epoch": 0.5223880597014925,
"grad_norm": 0.6720194490881026,
"learning_rate": 2.964539007092199e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2903139591217041,
"step": 210,
"valid_targets_mean": 3750.4,
"valid_targets_min": 1685
},
{
"epoch": 0.5348258706467661,
"grad_norm": 0.6995838272080971,
"learning_rate": 3.0354609929078016e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29320502281188965,
"step": 215,
"valid_targets_mean": 3562.6,
"valid_targets_min": 831
},
{
"epoch": 0.5472636815920398,
"grad_norm": 0.5930224509626889,
"learning_rate": 3.1063829787234046e-05,
"loss": 0.3155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33783021569252014,
"step": 220,
"valid_targets_mean": 4651.5,
"valid_targets_min": 2381
},
{
"epoch": 0.5597014925373134,
"grad_norm": 0.6173823876530793,
"learning_rate": 3.1773049645390076e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30158767104148865,
"step": 225,
"valid_targets_mean": 4075.6,
"valid_targets_min": 2042
},
{
"epoch": 0.572139303482587,
"grad_norm": 0.7805956934434903,
"learning_rate": 3.24822695035461e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31823039054870605,
"step": 230,
"valid_targets_mean": 3906.0,
"valid_targets_min": 1425
},
{
"epoch": 0.5845771144278606,
"grad_norm": 0.6419587125168111,
"learning_rate": 3.319148936170213e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31326407194137573,
"step": 235,
"valid_targets_mean": 3665.2,
"valid_targets_min": 1696
},
{
"epoch": 0.5970149253731343,
"grad_norm": 0.8679447185514305,
"learning_rate": 3.390070921985816e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29827624559402466,
"step": 240,
"valid_targets_mean": 3904.9,
"valid_targets_min": 2058
},
{
"epoch": 0.6094527363184079,
"grad_norm": 0.6810499039895173,
"learning_rate": 3.460992907801419e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2755545377731323,
"step": 245,
"valid_targets_mean": 3971.8,
"valid_targets_min": 2000
},
{
"epoch": 0.6218905472636815,
"grad_norm": 0.6597104835502321,
"learning_rate": 3.531914893617022e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2824779152870178,
"step": 250,
"valid_targets_mean": 3968.2,
"valid_targets_min": 1270
},
{
"epoch": 0.6343283582089553,
"grad_norm": 0.740278069571726,
"learning_rate": 3.602836879432624e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2923567593097687,
"step": 255,
"valid_targets_mean": 3380.2,
"valid_targets_min": 2111
},
{
"epoch": 0.6467661691542289,
"grad_norm": 0.6593440154558078,
"learning_rate": 3.673758865248227e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.315481960773468,
"step": 260,
"valid_targets_mean": 3845.1,
"valid_targets_min": 1793
},
{
"epoch": 0.6592039800995025,
"grad_norm": 0.5518441987402686,
"learning_rate": 3.74468085106383e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2802160084247589,
"step": 265,
"valid_targets_mean": 4580.6,
"valid_targets_min": 2473
},
{
"epoch": 0.6716417910447762,
"grad_norm": 0.8104837314241858,
"learning_rate": 3.815602836879433e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3234109878540039,
"step": 270,
"valid_targets_mean": 3906.8,
"valid_targets_min": 2167
},
{
"epoch": 0.6840796019900498,
"grad_norm": 0.574610630199438,
"learning_rate": 3.8865248226950355e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2707560956478119,
"step": 275,
"valid_targets_mean": 4401.9,
"valid_targets_min": 2550
},
{
"epoch": 0.6965174129353234,
"grad_norm": 0.6473677332767744,
"learning_rate": 3.9574468085106385e-05,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29438745975494385,
"step": 280,
"valid_targets_mean": 4070.2,
"valid_targets_min": 2058
},
{
"epoch": 0.7089552238805971,
"grad_norm": 0.6669914526756555,
"learning_rate": 3.999993842107385e-05,
"loss": 0.3014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29622241854667664,
"step": 285,
"valid_targets_mean": 3670.9,
"valid_targets_min": 1575
},
{
"epoch": 0.7213930348258707,
"grad_norm": 0.6040016655187556,
"learning_rate": 3.999924566250946e-05,
"loss": 0.2847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25055813789367676,
"step": 290,
"valid_targets_mean": 4318.6,
"valid_targets_min": 2013
},
{
"epoch": 0.7338308457711443,
"grad_norm": 0.6412537411386398,
"learning_rate": 3.999778319847388e-05,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2983705401420593,
"step": 295,
"valid_targets_mean": 4027.8,
"valid_targets_min": 1756
},
{
"epoch": 0.746268656716418,
"grad_norm": 0.7602229991895589,
"learning_rate": 3.999555108525255e-05,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2838355004787445,
"step": 300,
"valid_targets_mean": 4391.4,
"valid_targets_min": 1883
},
{
"epoch": 0.7587064676616916,
"grad_norm": 0.5443397707250325,
"learning_rate": 3.999254940875221e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30530381202697754,
"step": 305,
"valid_targets_mean": 4607.9,
"valid_targets_min": 1976
},
{
"epoch": 0.7711442786069652,
"grad_norm": 0.7644982978652062,
"learning_rate": 3.998877828449755e-05,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29389941692352295,
"step": 310,
"valid_targets_mean": 3338.8,
"valid_targets_min": 1997
},
{
"epoch": 0.7835820895522388,
"grad_norm": 0.6097921931378489,
"learning_rate": 3.99842378576268e-05,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2719549834728241,
"step": 315,
"valid_targets_mean": 4149.0,
"valid_targets_min": 2106
},
{
"epoch": 0.7960199004975125,
"grad_norm": 0.6026543056079762,
"learning_rate": 3.997892830288611e-05,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28515109419822693,
"step": 320,
"valid_targets_mean": 3764.9,
"valid_targets_min": 2243
},
{
"epoch": 0.8084577114427861,
"grad_norm": 0.7013246853914047,
"learning_rate": 3.997284982462286e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32851818203926086,
"step": 325,
"valid_targets_mean": 3250.0,
"valid_targets_min": 196
},
{
"epoch": 0.8208955223880597,
"grad_norm": 0.6272103188781436,
"learning_rate": 3.9966002656777775e-05,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2576582133769989,
"step": 330,
"valid_targets_mean": 3494.9,
"valid_targets_min": 471
},
{
"epoch": 0.8333333333333334,
"grad_norm": 0.6106794281804707,
"learning_rate": 3.9958387062875924e-05,
"loss": 0.2803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28204280138015747,
"step": 335,
"valid_targets_mean": 3829.8,
"valid_targets_min": 1935
},
{
"epoch": 0.845771144278607,
"grad_norm": 0.5489443050050972,
"learning_rate": 3.9950003336016564e-05,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2528287172317505,
"step": 340,
"valid_targets_mean": 4614.7,
"valid_targets_min": 2051
},
{
"epoch": 0.8582089552238806,
"grad_norm": 0.5465751723442666,
"learning_rate": 3.99408517988619e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26588577032089233,
"step": 345,
"valid_targets_mean": 4694.1,
"valid_targets_min": 2446
},
{
"epoch": 0.8706467661691543,
"grad_norm": 0.5320142976407558,
"learning_rate": 3.993093280362462e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25479674339294434,
"step": 350,
"valid_targets_mean": 4793.0,
"valid_targets_min": 2890
},
{
"epoch": 0.8830845771144279,
"grad_norm": 0.643787133545081,
"learning_rate": 3.9920246732054374e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2818455398082733,
"step": 355,
"valid_targets_mean": 4366.5,
"valid_targets_min": 1670
},
{
"epoch": 0.8955223880597015,
"grad_norm": 0.6844127977814671,
"learning_rate": 3.990879399542305e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2798788845539093,
"step": 360,
"valid_targets_mean": 3420.6,
"valid_targets_min": 1241
},
{
"epoch": 0.9079601990049752,
"grad_norm": 0.5798388818266013,
"learning_rate": 3.989657503450898e-05,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28030702471733093,
"step": 365,
"valid_targets_mean": 4205.9,
"valid_targets_min": 2328
},
{
"epoch": 0.9203980099502488,
"grad_norm": 0.5693045180329982,
"learning_rate": 3.9883590319579966e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3048206567764282,
"step": 370,
"valid_targets_mean": 4680.9,
"valid_targets_min": 2049
},
{
"epoch": 0.9328358208955224,
"grad_norm": 0.77488630073332,
"learning_rate": 3.986984035037514e-05,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2770192325115204,
"step": 375,
"valid_targets_mean": 3701.6,
"valid_targets_min": 374
},
{
"epoch": 0.945273631840796,
"grad_norm": 0.5726365998589211,
"learning_rate": 3.9855325656085815e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29798316955566406,
"step": 380,
"valid_targets_mean": 4057.5,
"valid_targets_min": 1639
},
{
"epoch": 0.9577114427860697,
"grad_norm": 0.5794218327334973,
"learning_rate": 3.984004679533502e-05,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2974611520767212,
"step": 385,
"valid_targets_mean": 4386.4,
"valid_targets_min": 1244
},
{
"epoch": 0.9701492537313433,
"grad_norm": 0.6200804315597975,
"learning_rate": 3.982400435615608e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26094967126846313,
"step": 390,
"valid_targets_mean": 3871.4,
"valid_targets_min": 2061
},
{
"epoch": 0.9825870646766169,
"grad_norm": 0.5663415236256595,
"learning_rate": 3.980719895596994e-05,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2790575921535492,
"step": 395,
"valid_targets_mean": 4268.0,
"valid_targets_min": 819
},
{
"epoch": 0.9950248756218906,
"grad_norm": 0.5335095669700068,
"learning_rate": 3.978963124156141e-05,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25512856245040894,
"step": 400,
"valid_targets_mean": 4742.2,
"valid_targets_min": 2403
},
{
"epoch": 1.007462686567164,
"grad_norm": 0.6706949371800399,
"learning_rate": 3.977130188905429e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25862938165664673,
"step": 405,
"valid_targets_mean": 3975.2,
"valid_targets_min": 1886
},
{
"epoch": 1.0199004975124377,
"grad_norm": 0.6198638973234687,
"learning_rate": 3.975221160388535e-05,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2816004753112793,
"step": 410,
"valid_targets_mean": 4115.3,
"valid_targets_min": 1240
},
{
"epoch": 1.0323383084577114,
"grad_norm": 0.5477295121301582,
"learning_rate": 3.973236112077712e-05,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2588885724544525,
"step": 415,
"valid_targets_mean": 4426.1,
"valid_targets_min": 2062
},
{
"epoch": 1.044776119402985,
"grad_norm": 0.6101761931142692,
"learning_rate": 3.971175120370971e-05,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26513034105300903,
"step": 420,
"valid_targets_mean": 4070.8,
"valid_targets_min": 1988
},
{
"epoch": 1.0572139303482586,
"grad_norm": 0.5897683101564732,
"learning_rate": 3.969038264589132e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25092267990112305,
"step": 425,
"valid_targets_mean": 4073.1,
"valid_targets_min": 443
},
{
"epoch": 1.0696517412935322,
"grad_norm": 0.5625409270111561,
"learning_rate": 3.966825626972777e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2630409002304077,
"step": 430,
"valid_targets_mean": 4102.7,
"valid_targets_min": 1379
},
{
"epoch": 1.0820895522388059,
"grad_norm": 0.565867121844965,
"learning_rate": 3.964537292679081e-05,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2534593641757965,
"step": 435,
"valid_targets_mean": 4240.8,
"valid_targets_min": 1908
},
{
"epoch": 1.0945273631840795,
"grad_norm": 0.6406440477946179,
"learning_rate": 3.962173349778538e-05,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28820428252220154,
"step": 440,
"valid_targets_mean": 3382.1,
"valid_targets_min": 1769
},
{
"epoch": 1.1069651741293531,
"grad_norm": 0.5787142049618801,
"learning_rate": 3.959733889251569e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2697809636592865,
"step": 445,
"valid_targets_mean": 4141.3,
"valid_targets_min": 1130
},
{
"epoch": 1.1194029850746268,
"grad_norm": 0.5835970548274867,
"learning_rate": 3.9572190049850186e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2650759518146515,
"step": 450,
"valid_targets_mean": 3681.7,
"valid_targets_min": 1929
},
{
"epoch": 1.1318407960199006,
"grad_norm": 0.6578060953434757,
"learning_rate": 3.9546287937685485e-05,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2592794895172119,
"step": 455,
"valid_targets_mean": 3309.7,
"valid_targets_min": 1400
},
{
"epoch": 1.144278606965174,
"grad_norm": 0.5127241563740503,
"learning_rate": 3.9519633552909054e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23262007534503937,
"step": 460,
"valid_targets_mean": 5108.5,
"valid_targets_min": 2353
},
{
"epoch": 1.1567164179104479,
"grad_norm": 0.6164622352052561,
"learning_rate": 3.949222792136087e-05,
"loss": 0.2472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23169252276420593,
"step": 465,
"valid_targets_mean": 4548.3,
"valid_targets_min": 1282
},
{
"epoch": 1.1691542288557213,
"grad_norm": 0.6496210536118021,
"learning_rate": 3.946407209779395e-05,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2703050374984741,
"step": 470,
"valid_targets_mean": 3854.2,
"valid_targets_min": 2534
},
{
"epoch": 1.1815920398009951,
"grad_norm": 0.6983143179255165,
"learning_rate": 3.9435167165833724e-05,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26550132036209106,
"step": 475,
"valid_targets_mean": 3896.3,
"valid_targets_min": 2130
},
{
"epoch": 1.1940298507462686,
"grad_norm": 0.5555184412354105,
"learning_rate": 3.940551423793638e-05,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535971403121948,
"step": 480,
"valid_targets_mean": 4125.7,
"valid_targets_min": 1715
},
{
"epoch": 1.2064676616915424,
"grad_norm": 0.5704921624189617,
"learning_rate": 3.937511445534599e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26805728673934937,
"step": 485,
"valid_targets_mean": 3877.7,
"valid_targets_min": 2189
},
{
"epoch": 1.2189054726368158,
"grad_norm": 0.6495765923740222,
"learning_rate": 3.934396898805064e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24718452990055084,
"step": 490,
"valid_targets_mean": 3588.3,
"valid_targets_min": 1692
},
{
"epoch": 1.2313432835820897,
"grad_norm": 0.5876505289888774,
"learning_rate": 3.931207903473737e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2569234371185303,
"step": 495,
"valid_targets_mean": 4021.1,
"valid_targets_min": 1943
},
{
"epoch": 1.243781094527363,
"grad_norm": 0.5703559162652219,
"learning_rate": 3.9279445822746045e-05,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23905381560325623,
"step": 500,
"valid_targets_mean": 3682.4,
"valid_targets_min": 1850
},
{
"epoch": 1.256218905472637,
"grad_norm": 0.6506750265611713,
"learning_rate": 3.9246070608022125e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26591765880584717,
"step": 505,
"valid_targets_mean": 3393.1,
"valid_targets_min": 2128
},
{
"epoch": 1.2686567164179103,
"grad_norm": 0.5787258957804087,
"learning_rate": 3.921195467506833e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2495618611574173,
"step": 510,
"valid_targets_mean": 3888.8,
"valid_targets_min": 1134
},
{
"epoch": 1.2810945273631842,
"grad_norm": 0.519436549423975,
"learning_rate": 3.917709933689519e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26761433482170105,
"step": 515,
"valid_targets_mean": 4347.1,
"valid_targets_min": 1773
},
{
"epoch": 1.2935323383084576,
"grad_norm": 0.6076968588802545,
"learning_rate": 3.914150593497054e-05,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2475341260433197,
"step": 520,
"valid_targets_mean": 3474.6,
"valid_targets_min": 777
},
{
"epoch": 1.3059701492537314,
"grad_norm": 0.6306744703358103,
"learning_rate": 3.910517583916783e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28335511684417725,
"step": 525,
"valid_targets_mean": 3507.3,
"valid_targets_min": 1850
},
{
"epoch": 1.3184079601990049,
"grad_norm": 0.5110706633146148,
"learning_rate": 3.90681104477135e-05,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23450972139835358,
"step": 530,
"valid_targets_mean": 4537.1,
"valid_targets_min": 1051
},
{
"epoch": 1.3308457711442787,
"grad_norm": 0.6389986218399706,
"learning_rate": 3.903031118713307e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26319772005081177,
"step": 535,
"valid_targets_mean": 3198.9,
"valid_targets_min": 1306
},
{
"epoch": 1.3432835820895521,
"grad_norm": 0.6465328887813366,
"learning_rate": 3.8991779512196294e-05,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25991159677505493,
"step": 540,
"valid_targets_mean": 3375.8,
"valid_targets_min": 1682
},
{
"epoch": 1.355721393034826,
"grad_norm": 0.5736019923931159,
"learning_rate": 3.8952516905861155e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2686164379119873,
"step": 545,
"valid_targets_mean": 4258.2,
"valid_targets_min": 1889
},
{
"epoch": 1.3681592039800994,
"grad_norm": 0.5067100499995646,
"learning_rate": 3.89125248792168e-05,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23678192496299744,
"step": 550,
"valid_targets_mean": 4387.9,
"valid_targets_min": 1724
},
{
"epoch": 1.3805970149253732,
"grad_norm": 0.5477380240295115,
"learning_rate": 3.8871804971425353e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2501421570777893,
"step": 555,
"valid_targets_mean": 3848.6,
"valid_targets_min": 1156
},
{
"epoch": 1.3930348258706466,
"grad_norm": 0.5863449356154877,
"learning_rate": 3.883035874966273e-05,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24096009135246277,
"step": 560,
"valid_targets_mean": 3734.2,
"valid_targets_min": 1872
},
{
"epoch": 1.4054726368159205,
"grad_norm": 0.5379477926228984,
"learning_rate": 3.878818780905826e-05,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23347872495651245,
"step": 565,
"valid_targets_mean": 4070.9,
"valid_targets_min": 2509
},
{
"epoch": 1.417910447761194,
"grad_norm": 0.5419932690009873,
"learning_rate": 3.874529377263335e-05,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25849100947380066,
"step": 570,
"valid_targets_mean": 4307.4,
"valid_targets_min": 1746
},
{
"epoch": 1.4303482587064678,
"grad_norm": 0.5729702092975528,
"learning_rate": 3.870167829123899e-05,
"loss": 0.262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2920796871185303,
"step": 575,
"valid_targets_mean": 4220.1,
"valid_targets_min": 1363
},
{
"epoch": 1.4427860696517412,
"grad_norm": 0.5205776739120929,
"learning_rate": 3.865734304349224e-05,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23339340090751648,
"step": 580,
"valid_targets_mean": 4367.3,
"valid_targets_min": 1685
},
{
"epoch": 1.455223880597015,
"grad_norm": 0.5536951564209288,
"learning_rate": 3.861228973571158e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24707631766796112,
"step": 585,
"valid_targets_mean": 4527.9,
"valid_targets_min": 1406
},
{
"epoch": 1.4676616915422884,
"grad_norm": 0.564511967740949,
"learning_rate": 3.856652010185128e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2429649531841278,
"step": 590,
"valid_targets_mean": 3914.8,
"valid_targets_min": 2402
},
{
"epoch": 1.4800995024875623,
"grad_norm": 0.5579953289935093,
"learning_rate": 3.852003590343467e-05,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21945007145404816,
"step": 595,
"valid_targets_mean": 4183.3,
"valid_targets_min": 1280
},
{
"epoch": 1.4925373134328357,
"grad_norm": 0.5631837154917557,
"learning_rate": 3.847283892948631e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27015361189842224,
"step": 600,
"valid_targets_mean": 3908.9,
"valid_targets_min": 1638
},
{
"epoch": 1.5049751243781095,
"grad_norm": 0.5901864513013043,
"learning_rate": 3.8424930996463173e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25428202748298645,
"step": 605,
"valid_targets_mean": 4185.3,
"valid_targets_min": 1322
},
{
"epoch": 1.517412935323383,
"grad_norm": 0.5161889221577463,
"learning_rate": 3.837631394818471e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2310006320476532,
"step": 610,
"valid_targets_mean": 4516.8,
"valid_targets_min": 1988
},
{
"epoch": 1.5298507462686568,
"grad_norm": 0.5359807008019226,
"learning_rate": 3.832698965576189e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2637181878089905,
"step": 615,
"valid_targets_mean": 3867.1,
"valid_targets_min": 2465
},
{
"epoch": 1.5422885572139302,
"grad_norm": 0.5674145217928909,
"learning_rate": 3.8276960017525197e-05,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22988495230674744,
"step": 620,
"valid_targets_mean": 4242.8,
"valid_targets_min": 1588
},
{
"epoch": 1.554726368159204,
"grad_norm": 0.5723411242257961,
"learning_rate": 3.822622695895157e-05,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25821536779403687,
"step": 625,
"valid_targets_mean": 4392.1,
"valid_targets_min": 1765
},
{
"epoch": 1.5671641791044775,
"grad_norm": 0.5376996090192159,
"learning_rate": 3.8174792432590294e-05,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23149748146533966,
"step": 630,
"valid_targets_mean": 4030.4,
"valid_targets_min": 1742
},
{
"epoch": 1.5796019900497513,
"grad_norm": 0.5681703694899468,
"learning_rate": 3.8122658417987854e-05,
"loss": 0.2472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24532127380371094,
"step": 635,
"valid_targets_mean": 3592.2,
"valid_targets_min": 963
},
{
"epoch": 1.5920398009950247,
"grad_norm": 0.5672170181926013,
"learning_rate": 3.8069826921611736e-05,
"loss": 0.2527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25750595331192017,
"step": 640,
"valid_targets_mean": 3691.6,
"valid_targets_min": 2389
},
{
"epoch": 1.6044776119402986,
"grad_norm": 0.5840248420927169,
"learning_rate": 3.8016299976773215e-05,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24948638677597046,
"step": 645,
"valid_targets_mean": 3554.7,
"valid_targets_min": 2311
},
{
"epoch": 1.616915422885572,
"grad_norm": 0.5359793017604382,
"learning_rate": 3.796207964354911e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.236485093832016,
"step": 650,
"valid_targets_mean": 4295.7,
"valid_targets_min": 2176
},
{
"epoch": 1.6293532338308458,
"grad_norm": 0.5407696413708218,
"learning_rate": 3.7907168008702485e-05,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24842476844787598,
"step": 655,
"valid_targets_mean": 4364.2,
"valid_targets_min": 1789
},
{
"epoch": 1.6417910447761193,
"grad_norm": 0.5209593522870282,
"learning_rate": 3.785156718560234e-05,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23498183488845825,
"step": 660,
"valid_targets_mean": 4318.7,
"valid_targets_min": 2193
},
{
"epoch": 1.654228855721393,
"grad_norm": 0.550433073135447,
"learning_rate": 3.779527931414227e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22987571358680725,
"step": 665,
"valid_targets_mean": 4133.3,
"valid_targets_min": 1619
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.5574429313585283,
"learning_rate": 3.773830656065811e-05,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2494204193353653,
"step": 670,
"valid_targets_mean": 4016.2,
"valid_targets_min": 2044
},
{
"epoch": 1.6791044776119404,
"grad_norm": 0.6329586119901996,
"learning_rate": 3.768065111784457e-05,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2279907613992691,
"step": 675,
"valid_targets_mean": 3598.1,
"valid_targets_min": 819
},
{
"epoch": 1.6915422885572138,
"grad_norm": 0.5334914217295829,
"learning_rate": 3.762231520467082e-05,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2509036362171173,
"step": 680,
"valid_targets_mean": 3799.6,
"valid_targets_min": 1225
},
{
"epoch": 1.7039800995024876,
"grad_norm": 0.5489580465491168,
"learning_rate": 3.7563301066295144e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2305251657962799,
"step": 685,
"valid_targets_mean": 3473.2,
"valid_targets_min": 992
},
{
"epoch": 1.716417910447761,
"grad_norm": 0.5288516281459692,
"learning_rate": 3.750361097397844e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23850487172603607,
"step": 690,
"valid_targets_mean": 4001.9,
"valid_targets_min": 1741
},
{
"epoch": 1.728855721393035,
"grad_norm": 0.5800907388120042,
"learning_rate": 3.74432472249969e-05,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25247111916542053,
"step": 695,
"valid_targets_mean": 3964.8,
"valid_targets_min": 1725
},
{
"epoch": 1.7412935323383083,
"grad_norm": 0.5153130568766624,
"learning_rate": 3.7382212142553526e-05,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23832815885543823,
"step": 700,
"valid_targets_mean": 5047.1,
"valid_targets_min": 2105
},
{
"epoch": 1.7537313432835822,
"grad_norm": 0.4775135414376218,
"learning_rate": 3.732050807568878e-05,
"loss": 0.2472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2324645072221756,
"step": 705,
"valid_targets_mean": 5206.6,
"valid_targets_min": 2405
},
{
"epoch": 1.7661691542288556,
"grad_norm": 0.6038057766815212,
"learning_rate": 3.7258137399190104e-05,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23930123448371887,
"step": 710,
"valid_targets_mean": 4152.9,
"valid_targets_min": 1787
},
{
"epoch": 1.7786069651741294,
"grad_norm": 0.5565167118827314,
"learning_rate": 3.71951025135006e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2660183310508728,
"step": 715,
"valid_targets_mean": 3864.9,
"valid_targets_min": 1404
},
{
"epoch": 1.7910447761194028,
"grad_norm": 0.6001026329663603,
"learning_rate": 3.713140584462659e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2475225031375885,
"step": 720,
"valid_targets_mean": 3926.4,
"valid_targets_min": 196
},
{
"epoch": 1.8034825870646767,
"grad_norm": 0.5652238036041524,
"learning_rate": 3.7067049844044246e-05,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24355122447013855,
"step": 725,
"valid_targets_mean": 4200.6,
"valid_targets_min": 2117
},
{
"epoch": 1.81592039800995,
"grad_norm": 0.5488019914228596,
"learning_rate": 3.700203698860528e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2313595861196518,
"step": 730,
"valid_targets_mean": 3598.3,
"valid_targets_min": 2223
},
{
"epoch": 1.828358208955224,
"grad_norm": 0.51796472681004,
"learning_rate": 3.6936369780441605e-05,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24363797903060913,
"step": 735,
"valid_targets_mean": 4339.6,
"valid_targets_min": 2214
},
{
"epoch": 1.8407960199004973,
"grad_norm": 0.5659545424872905,
"learning_rate": 3.6870050746869e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24636013805866241,
"step": 740,
"valid_targets_mean": 4091.0,
"valid_targets_min": 1926
},
{
"epoch": 1.8532338308457712,
"grad_norm": 0.5096718996130041,
"learning_rate": 3.680308244028988e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21994280815124512,
"step": 745,
"valid_targets_mean": 4172.7,
"valid_targets_min": 1149
},
{
"epoch": 1.8656716417910446,
"grad_norm": 0.5065361527427243,
"learning_rate": 3.673546743809507e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23863369226455688,
"step": 750,
"valid_targets_mean": 4798.6,
"valid_targets_min": 2111
},
{
"epoch": 1.8781094527363185,
"grad_norm": 0.5931017170469689,
"learning_rate": 3.666720834256456e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788572311401367,
"step": 755,
"valid_targets_mean": 4347.8,
"valid_targets_min": 2099
},
{
"epoch": 1.890547263681592,
"grad_norm": 0.5455237703990018,
"learning_rate": 3.659830778076741e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23518797755241394,
"step": 760,
"valid_targets_mean": 4198.4,
"valid_targets_min": 2807
},
{
"epoch": 1.9029850746268657,
"grad_norm": 0.5393054024523214,
"learning_rate": 3.65287684044606e-05,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2718955874443054,
"step": 765,
"valid_targets_mean": 3854.9,
"valid_targets_min": 2330
},
{
"epoch": 1.9154228855721394,
"grad_norm": 0.8356397481562335,
"learning_rate": 3.6458592889986986e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25400418043136597,
"step": 770,
"valid_targets_mean": 4668.4,
"valid_targets_min": 2281
},
{
"epoch": 1.927860696517413,
"grad_norm": 0.5065732254922442,
"learning_rate": 3.638778393817233e-05,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2371484339237213,
"step": 775,
"valid_targets_mean": 4130.5,
"valid_targets_min": 2548
},
{
"epoch": 1.9402985074626866,
"grad_norm": 0.5421381515387088,
"learning_rate": 3.6316344274221276e-05,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25802528858184814,
"step": 780,
"valid_targets_mean": 4095.2,
"valid_targets_min": 2527
},
{
"epoch": 1.9527363184079602,
"grad_norm": 0.5365802561261709,
"learning_rate": 3.624427664761254e-05,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23089924454689026,
"step": 785,
"valid_targets_mean": 3962.5,
"valid_targets_min": 2058
},
{
"epoch": 1.9651741293532339,
"grad_norm": 0.5643291821086128,
"learning_rate": 3.6171583831993076e-05,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25705310702323914,
"step": 790,
"valid_targets_mean": 4278.8,
"valid_targets_min": 2126
},
{
"epoch": 1.9776119402985075,
"grad_norm": 0.5790941804858589,
"learning_rate": 3.609826862507128e-05,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2411389946937561,
"step": 795,
"valid_targets_mean": 3969.7,
"valid_targets_min": 2089
},
{
"epoch": 1.9900497512437811,
"grad_norm": 0.48846796864819103,
"learning_rate": 3.6024333848509384e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23043224215507507,
"step": 800,
"valid_targets_mean": 4327.9,
"valid_targets_min": 1962
},
{
"epoch": 2.0024875621890548,
"grad_norm": 0.5849877152700085,
"learning_rate": 3.594978234781481e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23692670464515686,
"step": 805,
"valid_targets_mean": 3665.8,
"valid_targets_min": 2020
},
{
"epoch": 2.014925373134328,
"grad_norm": 0.538247528051884,
"learning_rate": 3.587461699223067e-05,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2252245843410492,
"step": 810,
"valid_targets_mean": 4359.8,
"valid_targets_min": 1739
},
{
"epoch": 2.027363184079602,
"grad_norm": 0.5381268521719818,
"learning_rate": 3.579884067462535e-05,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2488606870174408,
"step": 815,
"valid_targets_mean": 4062.9,
"valid_targets_min": 2410
},
{
"epoch": 2.0398009950248754,
"grad_norm": 0.6115694003336873,
"learning_rate": 3.572245631138116e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2483055591583252,
"step": 820,
"valid_targets_mean": 3527.8,
"valid_targets_min": 1282
},
{
"epoch": 2.0522388059701493,
"grad_norm": 0.5094263989797099,
"learning_rate": 3.564546684228209e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1991591900587082,
"step": 825,
"valid_targets_mean": 4397.8,
"valid_targets_min": 1706
},
{
"epoch": 2.0646766169154227,
"grad_norm": 0.5601385200195886,
"learning_rate": 3.556787523040069e-05,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2520599961280823,
"step": 830,
"valid_targets_mean": 3847.5,
"valid_targets_min": 1319
},
{
"epoch": 2.0771144278606966,
"grad_norm": 0.5380726404824564,
"learning_rate": 3.548968446198398e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21053871512413025,
"step": 835,
"valid_targets_mean": 4242.5,
"valid_targets_min": 973
},
{
"epoch": 2.08955223880597,
"grad_norm": 0.5025117595976427,
"learning_rate": 3.54108975463386e-05,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2069125920534134,
"step": 840,
"valid_targets_mean": 4396.9,
"valid_targets_min": 2427
},
{
"epoch": 2.101990049751244,
"grad_norm": 0.5354301465480238,
"learning_rate": 3.533151751571489e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2244517207145691,
"step": 845,
"valid_targets_mean": 3890.4,
"valid_targets_min": 1859
},
{
"epoch": 2.1144278606965172,
"grad_norm": 0.5610413426394177,
"learning_rate": 3.5251547425190294e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24040347337722778,
"step": 850,
"valid_targets_mean": 4252.7,
"valid_targets_min": 1379
},
{
"epoch": 2.126865671641791,
"grad_norm": 0.7445240143199634,
"learning_rate": 3.51709903525517e-05,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22202104330062866,
"step": 855,
"valid_targets_mean": 3389.6,
"valid_targets_min": 1472
},
{
"epoch": 2.1393034825870645,
"grad_norm": 0.5584087371143899,
"learning_rate": 3.5089849398177013e-05,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25943320989608765,
"step": 860,
"valid_targets_mean": 4247.4,
"valid_targets_min": 1713
},
{
"epoch": 2.1517412935323383,
"grad_norm": 0.5832938350626173,
"learning_rate": 3.500812768491586e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2365805208683014,
"step": 865,
"valid_targets_mean": 4043.2,
"valid_targets_min": 1548
},
{
"epoch": 2.1641791044776117,
"grad_norm": 0.5400590413107126,
"learning_rate": 3.4925828357969344e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21506357192993164,
"step": 870,
"valid_targets_mean": 3890.4,
"valid_targets_min": 2165
},
{
"epoch": 2.1766169154228856,
"grad_norm": 0.5408725543370927,
"learning_rate": 3.484295458476905e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2199130356311798,
"step": 875,
"valid_targets_mean": 3965.0,
"valid_targets_min": 1830
},
{
"epoch": 2.189054726368159,
"grad_norm": 0.5544609623772936,
"learning_rate": 3.475950955485511e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2255849838256836,
"step": 880,
"valid_targets_mean": 3941.9,
"valid_targets_min": 1907
},
{
"epoch": 2.201492537313433,
"grad_norm": 0.5335810864251953,
"learning_rate": 3.467549647975346e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2269669473171234,
"step": 885,
"valid_targets_mean": 3739.8,
"valid_targets_min": 1409
},
{
"epoch": 2.2139303482587063,
"grad_norm": 0.544212423789675,
"learning_rate": 3.4590918592852214e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22404810786247253,
"step": 890,
"valid_targets_mean": 3947.4,
"valid_targets_min": 2505
},
{
"epoch": 2.22636815920398,
"grad_norm": 0.48777043633608497,
"learning_rate": 3.450577914927728e-05,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2288726568222046,
"step": 895,
"valid_targets_mean": 4936.0,
"valid_targets_min": 1097
},
{
"epoch": 2.2388059701492535,
"grad_norm": 0.5375629176173219,
"learning_rate": 3.442008142576701e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21632421016693115,
"step": 900,
"valid_targets_mean": 4131.2,
"valid_targets_min": 2105
},
{
"epoch": 2.2512437810945274,
"grad_norm": 0.5159769756167506,
"learning_rate": 3.433382872054614e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24016112089157104,
"step": 905,
"valid_targets_mean": 4466.8,
"valid_targets_min": 2033
},
{
"epoch": 2.2636815920398012,
"grad_norm": 0.5464064642346769,
"learning_rate": 3.4247024353198826e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23476913571357727,
"step": 910,
"valid_targets_mean": 4390.9,
"valid_targets_min": 1993
},
{
"epoch": 2.2761194029850746,
"grad_norm": 0.5493349140412681,
"learning_rate": 3.415967166454091e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21979095041751862,
"step": 915,
"valid_targets_mean": 3712.5,
"valid_targets_min": 853
},
{
"epoch": 2.288557213930348,
"grad_norm": 0.5988218138371607,
"learning_rate": 3.4071774016491295e-05,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22979789972305298,
"step": 920,
"valid_targets_mean": 3520.1,
"valid_targets_min": 1018
},
{
"epoch": 2.300995024875622,
"grad_norm": 0.6119392010234547,
"learning_rate": 3.398333479194261e-05,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2250669300556183,
"step": 925,
"valid_targets_mean": 3029.0,
"valid_targets_min": 1741
},
{
"epoch": 2.3134328358208958,
"grad_norm": 0.5738059500201181,
"learning_rate": 3.389435739463099e-05,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22356033325195312,
"step": 930,
"valid_targets_mean": 3890.4,
"valid_targets_min": 1947
},
{
"epoch": 2.325870646766169,
"grad_norm": 0.5200786239469339,
"learning_rate": 3.380484524900506e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.217308908700943,
"step": 935,
"valid_targets_mean": 4040.2,
"valid_targets_min": 1742
},
{
"epoch": 2.3383084577114426,
"grad_norm": 0.5347052584780078,
"learning_rate": 3.371480180009418e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21474695205688477,
"step": 940,
"valid_targets_mean": 3967.4,
"valid_targets_min": 1804
},
{
"epoch": 2.3507462686567164,
"grad_norm": 0.6357404551408977,
"learning_rate": 3.362423051337581e-05,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2433660328388214,
"step": 945,
"valid_targets_mean": 3678.4,
"valid_targets_min": 1041
},
{
"epoch": 2.3631840796019903,
"grad_norm": 0.5200162752679304,
"learning_rate": 3.353313487464217e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21824005246162415,
"step": 950,
"valid_targets_mean": 4523.8,
"valid_targets_min": 2556
},
{
"epoch": 2.3756218905472637,
"grad_norm": 0.5521210931060869,
"learning_rate": 3.3441518389866075e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2285742461681366,
"step": 955,
"valid_targets_mean": 4061.0,
"valid_targets_min": 933
},
{
"epoch": 2.388059701492537,
"grad_norm": 0.5509197209245766,
"learning_rate": 3.334938458506599e-05,
"loss": 0.2261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24184472858905792,
"step": 960,
"valid_targets_mean": 4080.4,
"valid_targets_min": 1530
},
{
"epoch": 2.400497512437811,
"grad_norm": 0.5236287052530746,
"learning_rate": 3.325673700617035e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20668141543865204,
"step": 965,
"valid_targets_mean": 4257.0,
"valid_targets_min": 1666
},
{
"epoch": 2.412935323383085,
"grad_norm": 0.6083605097982535,
"learning_rate": 3.316357921888104e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2471916675567627,
"step": 970,
"valid_targets_mean": 3378.9,
"valid_targets_min": 1597
},
{
"epoch": 2.425373134328358,
"grad_norm": 0.5335881223915271,
"learning_rate": 3.306991480853624e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20531508326530457,
"step": 975,
"valid_targets_mean": 4332.2,
"valid_targets_min": 1927
},
{
"epoch": 2.4378109452736316,
"grad_norm": 0.491874909775028,
"learning_rate": 3.2975747379972345e-05,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21635055541992188,
"step": 980,
"valid_targets_mean": 4316.7,
"valid_targets_min": 1860
},
{
"epoch": 2.4502487562189055,
"grad_norm": 0.5761426750570783,
"learning_rate": 3.288108055738531e-05,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2470484972000122,
"step": 985,
"valid_targets_mean": 3830.1,
"valid_targets_min": 1418
},
{
"epoch": 2.4626865671641793,
"grad_norm": 0.5320370757070529,
"learning_rate": 3.278591798419112e-05,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2289409041404724,
"step": 990,
"valid_targets_mean": 4497.8,
"valid_targets_min": 1957
},
{
"epoch": 2.4751243781094527,
"grad_norm": 0.5771119980643729,
"learning_rate": 3.2690263322885564e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23160231113433838,
"step": 995,
"valid_targets_mean": 3809.6,
"valid_targets_min": 1732
},
{
"epoch": 2.487562189054726,
"grad_norm": 0.5428978241749973,
"learning_rate": 3.259412025490331e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22234313189983368,
"step": 1000,
"valid_targets_mean": 3825.9,
"valid_targets_min": 2537
},
{
"epoch": 2.5,
"grad_norm": 0.4988498596419294,
"learning_rate": 3.249749248047619e-05,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2289588749408722,
"step": 1005,
"valid_targets_mean": 4525.5,
"valid_targets_min": 2281
},
{
"epoch": 2.512437810945274,
"grad_norm": 0.5359144087715436,
"learning_rate": 3.24003837184908e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.221797913312912,
"step": 1010,
"valid_targets_mean": 3942.2,
"valid_targets_min": 1802
},
{
"epoch": 2.5248756218905473,
"grad_norm": 0.5568260899912753,
"learning_rate": 3.230279770634538e-05,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21767503023147583,
"step": 1015,
"valid_targets_mean": 4057.7,
"valid_targets_min": 2287
},
{
"epoch": 2.5373134328358207,
"grad_norm": 0.6004807280832435,
"learning_rate": 3.220473819980594e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23624536395072937,
"step": 1020,
"valid_targets_mean": 3945.8,
"valid_targets_min": 1124
},
{
"epoch": 2.5497512437810945,
"grad_norm": 0.5323221469131362,
"learning_rate": 3.2106208972861775e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22079509496688843,
"step": 1025,
"valid_targets_mean": 4226.3,
"valid_targets_min": 2281
},
{
"epoch": 2.5621890547263684,
"grad_norm": 0.5648978978257522,
"learning_rate": 3.2007213817580165e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22475269436836243,
"step": 1030,
"valid_targets_mean": 4073.6,
"valid_targets_min": 2117
},
{
"epoch": 2.574626865671642,
"grad_norm": 0.5796358749507854,
"learning_rate": 3.1907756543960425e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23154105246067047,
"step": 1035,
"valid_targets_mean": 3477.8,
"valid_targets_min": 1170
},
{
"epoch": 2.587064676616915,
"grad_norm": 0.5229192190104138,
"learning_rate": 3.180784097978732e-05,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20573227107524872,
"step": 1040,
"valid_targets_mean": 4331.4,
"valid_targets_min": 2708
},
{
"epoch": 2.599502487562189,
"grad_norm": 0.8210781641217509,
"learning_rate": 3.1707470970483716e-05,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21882575750350952,
"step": 1045,
"valid_targets_mean": 4022.0,
"valid_targets_min": 1396
},
{
"epoch": 2.611940298507463,
"grad_norm": 0.4797756242590163,
"learning_rate": 3.160665037896256e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21537092328071594,
"step": 1050,
"valid_targets_mean": 5050.7,
"valid_targets_min": 2642
},
{
"epoch": 2.6243781094527363,
"grad_norm": 0.5768753494873544,
"learning_rate": 3.150538308547826e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2303762435913086,
"step": 1055,
"valid_targets_mean": 3295.4,
"valid_targets_min": 840
},
{
"epoch": 2.6368159203980097,
"grad_norm": 0.5551715330405659,
"learning_rate": 3.14036729874773e-05,
"loss": 0.2281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2432781457901001,
"step": 1060,
"valid_targets_mean": 3878.2,
"valid_targets_min": 1155
},
{
"epoch": 2.6492537313432836,
"grad_norm": 0.5533747207127068,
"learning_rate": 3.130152399944827e-05,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21668297052383423,
"step": 1065,
"valid_targets_mean": 3560.9,
"valid_targets_min": 1236
},
{
"epoch": 2.6616915422885574,
"grad_norm": 0.6091887065700332,
"learning_rate": 3.1198940052771196e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22194230556488037,
"step": 1070,
"valid_targets_mean": 3523.8,
"valid_targets_min": 1943
},
{
"epoch": 2.674129353233831,
"grad_norm": 0.5217859543197857,
"learning_rate": 3.109592509556625e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19868099689483643,
"step": 1075,
"valid_targets_mean": 3734.4,
"valid_targets_min": 1771
},
{
"epoch": 2.6865671641791042,
"grad_norm": 0.5907560446630902,
"learning_rate": 3.0992483092541757e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22035574913024902,
"step": 1080,
"valid_targets_mean": 4186.8,
"valid_targets_min": 1370
},
{
"epoch": 2.699004975124378,
"grad_norm": 0.5354879248422757,
"learning_rate": 3.088861802484168e-05,
"loss": 0.2178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22888147830963135,
"step": 1085,
"valid_targets_mean": 4406.8,
"valid_targets_min": 1937
},
{
"epoch": 2.711442786069652,
"grad_norm": 0.5354309571052726,
"learning_rate": 3.078433388989232e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23584789037704468,
"step": 1090,
"valid_targets_mean": 4082.8,
"valid_targets_min": 2016
},
{
"epoch": 2.7238805970149254,
"grad_norm": 0.5230105200073858,
"learning_rate": 3.067963470124852e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21761374175548553,
"step": 1095,
"valid_targets_mean": 4048.8,
"valid_targets_min": 1515
},
{
"epoch": 2.7363184079601988,
"grad_norm": 0.5254789832854005,
"learning_rate": 3.0574524488439166e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21649402379989624,
"step": 1100,
"valid_targets_mean": 3900.8,
"valid_targets_min": 1840
},
{
"epoch": 2.7487562189054726,
"grad_norm": 0.5512516143404952,
"learning_rate": 3.046900729681215e-05,
"loss": 0.2148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2197253406047821,
"step": 1105,
"valid_targets_mean": 3859.6,
"valid_targets_min": 1241
},
{
"epoch": 2.7611940298507465,
"grad_norm": 0.4780381184240064,
"learning_rate": 3.0363087187378618e-05,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21492695808410645,
"step": 1110,
"valid_targets_mean": 4405.6,
"valid_targets_min": 2322
},
{
"epoch": 2.77363184079602,
"grad_norm": 0.6383173460840905,
"learning_rate": 3.025676823665671e-05,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23645994067192078,
"step": 1115,
"valid_targets_mean": 3986.8,
"valid_targets_min": 2007
},
{
"epoch": 2.7860696517412933,
"grad_norm": 0.5606483903400612,
"learning_rate": 3.0150054536514655e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2141602337360382,
"step": 1120,
"valid_targets_mean": 3552.6,
"valid_targets_min": 196
},
{
"epoch": 2.798507462686567,
"grad_norm": 0.5372938232844723,
"learning_rate": 3.0042950194013313e-05,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22424790263175964,
"step": 1125,
"valid_targets_mean": 4286.3,
"valid_targets_min": 2746
},
{
"epoch": 2.810945273631841,
"grad_norm": 0.647264121448103,
"learning_rate": 2.993545933124807e-05,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2541235089302063,
"step": 1130,
"valid_targets_mean": 3984.4,
"valid_targets_min": 1033
},
{
"epoch": 2.8233830845771144,
"grad_norm": 0.5395140967298383,
"learning_rate": 2.9827586085190217e-05,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20689839124679565,
"step": 1135,
"valid_targets_mean": 3842.4,
"valid_targets_min": 1140
},
{
"epoch": 2.835820895522388,
"grad_norm": 0.5132101606150065,
"learning_rate": 2.971933460752773e-05,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2214384526014328,
"step": 1140,
"valid_targets_mean": 4829.9,
"valid_targets_min": 1793
},
{
"epoch": 2.8482587064676617,
"grad_norm": 0.545837953147779,
"learning_rate": 2.961070906450548e-05,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24275824427604675,
"step": 1145,
"valid_targets_mean": 4090.0,
"valid_targets_min": 1876
},
{
"epoch": 2.8606965174129355,
"grad_norm": 0.545483447551859,
"learning_rate": 2.950171363676488e-05,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21436379849910736,
"step": 1150,
"valid_targets_mean": 3576.0,
"valid_targets_min": 1297
},
{
"epoch": 2.873134328358209,
"grad_norm": 0.5046264457103875,
"learning_rate": 2.9392352519183003e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2066916823387146,
"step": 1155,
"valid_targets_mean": 4762.8,
"valid_targets_min": 2454
},
{
"epoch": 2.8855721393034823,
"grad_norm": 0.5186125948476298,
"learning_rate": 2.928262992071113e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2164272964000702,
"step": 1160,
"valid_targets_mean": 3770.9,
"valid_targets_min": 1244
},
{
"epoch": 2.898009950248756,
"grad_norm": 0.5004644338207715,
"learning_rate": 2.9172550064212747e-05,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1974021941423416,
"step": 1165,
"valid_targets_mean": 4147.8,
"valid_targets_min": 2450
},
{
"epoch": 2.91044776119403,
"grad_norm": 0.5284009585202385,
"learning_rate": 2.906211718630104e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23019076883792877,
"step": 1170,
"valid_targets_mean": 3926.6,
"valid_targets_min": 2084
},
{
"epoch": 2.9228855721393034,
"grad_norm": 0.5437530454710895,
"learning_rate": 2.895133553717582e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22214023768901825,
"step": 1175,
"valid_targets_mean": 3957.7,
"valid_targets_min": 1130
},
{
"epoch": 2.935323383084577,
"grad_norm": 0.5309034940862213,
"learning_rate": 2.8840209380459983e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2027333378791809,
"step": 1180,
"valid_targets_mean": 3732.1,
"valid_targets_min": 1670
},
{
"epoch": 2.9477611940298507,
"grad_norm": 0.502018444365329,
"learning_rate": 2.8728742993035376e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20462360978126526,
"step": 1185,
"valid_targets_mean": 3885.9,
"valid_targets_min": 2023
},
{
"epoch": 2.9601990049751246,
"grad_norm": 0.5097178679874955,
"learning_rate": 2.8616940664878217e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21697774529457092,
"step": 1190,
"valid_targets_mean": 4445.0,
"valid_targets_min": 1363
},
{
"epoch": 2.972636815920398,
"grad_norm": 0.568255587186467,
"learning_rate": 2.850480669889397e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2217128425836563,
"step": 1195,
"valid_targets_mean": 3645.9,
"valid_targets_min": 2013
},
{
"epoch": 2.9850746268656714,
"grad_norm": 0.5435581128114583,
"learning_rate": 2.839234541075178e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23033751547336578,
"step": 1200,
"valid_targets_mean": 3913.1,
"valid_targets_min": 428
},
{
"epoch": 2.9975124378109452,
"grad_norm": 0.5344645879564283,
"learning_rate": 2.8279561128718324e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1959632784128189,
"step": 1205,
"valid_targets_mean": 3608.3,
"valid_targets_min": 2089
},
{
"epoch": 3.009950248756219,
"grad_norm": 0.49623627025746214,
"learning_rate": 2.8166458193491287e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20732742547988892,
"step": 1210,
"valid_targets_mean": 4868.1,
"valid_targets_min": 2028
},
{
"epoch": 3.0223880597014925,
"grad_norm": 0.5737814175353435,
"learning_rate": 2.805304095803222e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21487167477607727,
"step": 1215,
"valid_targets_mean": 4191.0,
"valid_targets_min": 1524
},
{
"epoch": 3.0348258706467663,
"grad_norm": 0.5106023876957765,
"learning_rate": 2.7939313787399118e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2161100208759308,
"step": 1220,
"valid_targets_mean": 4569.1,
"valid_targets_min": 2916
},
{
"epoch": 3.0472636815920398,
"grad_norm": 0.5564896880436795,
"learning_rate": 2.7825281058578326e-05,
"loss": 0.2061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2229604572057724,
"step": 1225,
"valid_targets_mean": 4257.8,
"valid_targets_min": 1109
},
{
"epoch": 3.0597014925373136,
"grad_norm": 0.557147418201146,
"learning_rate": 2.7710947160316145e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20052112638950348,
"step": 1230,
"valid_targets_mean": 4028.7,
"valid_targets_min": 1645
},
{
"epoch": 3.072139303482587,
"grad_norm": 0.5878465938206581,
"learning_rate": 2.759631649294989e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22095069289207458,
"step": 1235,
"valid_targets_mean": 4023.8,
"valid_targets_min": 1998
},
{
"epoch": 3.084577114427861,
"grad_norm": 0.5194814837667161,
"learning_rate": 2.7481393468238558e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19190478324890137,
"step": 1240,
"valid_targets_mean": 4377.2,
"valid_targets_min": 2378
},
{
"epoch": 3.0970149253731343,
"grad_norm": 0.5898646554241795,
"learning_rate": 2.7366182509193e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20672670006752014,
"step": 1245,
"valid_targets_mean": 3683.2,
"valid_targets_min": 1530
},
{
"epoch": 3.109452736318408,
"grad_norm": 0.5408382733969814,
"learning_rate": 2.725068804990575e-05,
"loss": 0.2145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22049081325531006,
"step": 1250,
"valid_targets_mean": 4423.6,
"valid_targets_min": 1725
},
{
"epoch": 3.1218905472636815,
"grad_norm": 0.5240915497470742,
"learning_rate": 2.7134914535380305e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19481924176216125,
"step": 1255,
"valid_targets_mean": 4028.4,
"valid_targets_min": 831
},
{
"epoch": 3.1343283582089554,
"grad_norm": 0.586082749576896,
"learning_rate": 2.7018866421360114e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22566986083984375,
"step": 1260,
"valid_targets_mean": 3726.2,
"valid_targets_min": 844
},
{
"epoch": 3.146766169154229,
"grad_norm": 0.5224048615979382,
"learning_rate": 2.6902548174157028e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.219328373670578,
"step": 1265,
"valid_targets_mean": 4112.4,
"valid_targets_min": 1498
},
{
"epoch": 3.1592039800995027,
"grad_norm": 0.501751299595383,
"learning_rate": 2.6785964270479472e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1844957172870636,
"step": 1270,
"valid_targets_mean": 4384.2,
"valid_targets_min": 2813
},
{
"epoch": 3.171641791044776,
"grad_norm": 0.5831574633686978,
"learning_rate": 2.66691191972601e-05,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2090991735458374,
"step": 1275,
"valid_targets_mean": 3494.6,
"valid_targets_min": 1780
},
{
"epoch": 3.18407960199005,
"grad_norm": 0.5850385454163992,
"learning_rate": 2.6552017451483136e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21853281557559967,
"step": 1280,
"valid_targets_mean": 4045.5,
"valid_targets_min": 1823
},
{
"epoch": 3.1965174129353233,
"grad_norm": 0.5599684535438738,
"learning_rate": 2.6434663540011278e-05,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.219620943069458,
"step": 1285,
"valid_targets_mean": 4112.5,
"valid_targets_min": 2313
},
{
"epoch": 3.208955223880597,
"grad_norm": 0.9513235022639203,
"learning_rate": 2.631706197941227e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1958315670490265,
"step": 1290,
"valid_targets_mean": 4007.0,
"valid_targets_min": 1381
},
{
"epoch": 3.2213930348258706,
"grad_norm": 0.548449991410438,
"learning_rate": 2.619921729578504e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20220553874969482,
"step": 1295,
"valid_targets_mean": 3707.1,
"valid_targets_min": 1997
},
{
"epoch": 3.2338308457711444,
"grad_norm": 0.5435395454910702,
"learning_rate": 2.6081134024585558e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19983190298080444,
"step": 1300,
"valid_targets_mean": 3682.4,
"valid_targets_min": 1533
},
{
"epoch": 3.246268656716418,
"grad_norm": 0.5396400851922742,
"learning_rate": 2.5962816710452217e-05,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19172373414039612,
"step": 1305,
"valid_targets_mean": 4202.8,
"valid_targets_min": 1828
},
{
"epoch": 3.2587064676616917,
"grad_norm": 0.5528015303255912,
"learning_rate": 2.5844269907030972e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21026234328746796,
"step": 1310,
"valid_targets_mean": 3956.2,
"valid_targets_min": 2237
},
{
"epoch": 3.271144278606965,
"grad_norm": 0.6555416969802464,
"learning_rate": 2.5725498176800053e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20781803131103516,
"step": 1315,
"valid_targets_mean": 3484.7,
"valid_targets_min": 1823
},
{
"epoch": 3.283582089552239,
"grad_norm": 0.5520065160976478,
"learning_rate": 2.560650609089441e-05,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21545690298080444,
"step": 1320,
"valid_targets_mean": 3796.1,
"valid_targets_min": 2150
},
{
"epoch": 3.2960199004975124,
"grad_norm": 0.5594356265872277,
"learning_rate": 2.5487298228929746e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19716203212738037,
"step": 1325,
"valid_targets_mean": 4177.7,
"valid_targets_min": 2666
},
{
"epoch": 3.308457711442786,
"grad_norm": 0.5673243925575643,
"learning_rate": 2.5367879178826278e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21999700367450714,
"step": 1330,
"valid_targets_mean": 3577.8,
"valid_targets_min": 1379
},
{
"epoch": 3.3208955223880596,
"grad_norm": 0.5112451211401966,
"learning_rate": 2.5248253536632176e-05,
"loss": 0.2055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20441888272762299,
"step": 1335,
"valid_targets_mean": 4252.4,
"valid_targets_min": 1758
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.5701315285018725,
"learning_rate": 2.512842590634664e-05,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.228561133146286,
"step": 1340,
"valid_targets_mean": 3937.6,
"valid_targets_min": 1865
},
{
"epoch": 3.345771144278607,
"grad_norm": 0.5421666508199918,
"learning_rate": 2.5008400899742757e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20633219182491302,
"step": 1345,
"valid_targets_mean": 4439.9,
"valid_targets_min": 3260
},
{
"epoch": 3.3582089552238807,
"grad_norm": 0.49279685109536914,
"learning_rate": 2.4888183136189952e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1922161877155304,
"step": 1350,
"valid_targets_mean": 4147.8,
"valid_targets_min": 2538
},
{
"epoch": 3.370646766169154,
"grad_norm": 0.4688762074597621,
"learning_rate": 2.4767777242476263e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19103196263313293,
"step": 1355,
"valid_targets_mean": 5005.8,
"valid_targets_min": 2533
},
{
"epoch": 3.383084577114428,
"grad_norm": 0.5500017320569016,
"learning_rate": 2.4647187852630227e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20763391256332397,
"step": 1360,
"valid_targets_mean": 3853.6,
"valid_targets_min": 1548
},
{
"epoch": 3.3955223880597014,
"grad_norm": 0.5872147896176038,
"learning_rate": 2.4526419607742543e-05,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22904819250106812,
"step": 1365,
"valid_targets_mean": 3977.2,
"valid_targets_min": 2209
},
{
"epoch": 3.4079601990049753,
"grad_norm": 0.5155674931487689,
"learning_rate": 2.4405477155787457e-05,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21794819831848145,
"step": 1370,
"valid_targets_mean": 4300.1,
"valid_targets_min": 1567
},
{
"epoch": 3.4203980099502487,
"grad_norm": 0.5958084420992633,
"learning_rate": 2.4284365151443892e-05,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21897193789482117,
"step": 1375,
"valid_targets_mean": 3848.8,
"valid_targets_min": 1201
},
{
"epoch": 3.4328358208955225,
"grad_norm": 0.5269624601178255,
"learning_rate": 2.416308825591626e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1867186725139618,
"step": 1380,
"valid_targets_mean": 4206.9,
"valid_targets_min": 1330
},
{
"epoch": 3.445273631840796,
"grad_norm": 0.5745335400755156,
"learning_rate": 2.4041651136755112e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21894606947898865,
"step": 1385,
"valid_targets_mean": 4212.0,
"valid_targets_min": 1793
},
{
"epoch": 3.45771144278607,
"grad_norm": 0.5062989296925714,
"learning_rate": 2.3920058467677475e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19788777828216553,
"step": 1390,
"valid_targets_mean": 4500.6,
"valid_targets_min": 1771
},
{
"epoch": 3.470149253731343,
"grad_norm": 0.5291231334084273,
"learning_rate": 2.3798314928386986e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19889307022094727,
"step": 1395,
"valid_targets_mean": 4059.6,
"valid_targets_min": 1629
},
{
"epoch": 3.482587064676617,
"grad_norm": 0.6204408757812566,
"learning_rate": 2.367642520439378e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2038464993238449,
"step": 1400,
"valid_targets_mean": 3189.2,
"valid_targets_min": 941
},
{
"epoch": 3.4950248756218905,
"grad_norm": 0.5860309965160757,
"learning_rate": 2.3554393986834173e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18992196023464203,
"step": 1405,
"valid_targets_mean": 4013.2,
"valid_targets_min": 777
},
{
"epoch": 3.5074626865671643,
"grad_norm": 0.5323469940034676,
"learning_rate": 2.3432225972290086e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1906590759754181,
"step": 1410,
"valid_targets_mean": 4144.9,
"valid_targets_min": 1661
},
{
"epoch": 3.5199004975124377,
"grad_norm": 0.5720751778006824,
"learning_rate": 2.3309925862608318e-05,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1970103681087494,
"step": 1415,
"valid_targets_mean": 3570.9,
"valid_targets_min": 1244
},
{
"epoch": 3.5323383084577116,
"grad_norm": 0.5077487997895391,
"learning_rate": 2.3187498364719576e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1936759650707245,
"step": 1420,
"valid_targets_mean": 4038.2,
"valid_targets_min": 2313
},
{
"epoch": 3.544776119402985,
"grad_norm": 0.5828341436838554,
"learning_rate": 2.3064948190457335e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18977367877960205,
"step": 1425,
"valid_targets_mean": 3396.9,
"valid_targets_min": 2106
},
{
"epoch": 3.557213930348259,
"grad_norm": 0.5735838721354387,
"learning_rate": 2.2942280056376457e-05,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20034313201904297,
"step": 1430,
"valid_targets_mean": 3937.6,
"valid_targets_min": 1627
},
{
"epoch": 3.5696517412935322,
"grad_norm": 0.5234257291474523,
"learning_rate": 2.2819498683571718e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20040658116340637,
"step": 1435,
"valid_targets_mean": 4346.8,
"valid_targets_min": 2323
},
{
"epoch": 3.582089552238806,
"grad_norm": 0.5271233727171688,
"learning_rate": 2.2696608797496045e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1866839975118637,
"step": 1440,
"valid_targets_mean": 3945.6,
"valid_targets_min": 1378
},
{
"epoch": 3.5945273631840795,
"grad_norm": 0.5242920703023999,
"learning_rate": 2.2573615127778733e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19095249474048615,
"step": 1445,
"valid_targets_mean": 3907.6,
"valid_targets_min": 1780
},
{
"epoch": 3.6069651741293534,
"grad_norm": 0.6005933256936844,
"learning_rate": 2.2450522408043324e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2235599309206009,
"step": 1450,
"valid_targets_mean": 3177.5,
"valid_targets_min": 992
},
{
"epoch": 3.6194029850746268,
"grad_norm": 0.5536958757152657,
"learning_rate": 2.232733537572551e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20974500477313995,
"step": 1455,
"valid_targets_mean": 3999.3,
"valid_targets_min": 1643
},
{
"epoch": 3.6318407960199006,
"grad_norm": 0.45147835839349537,
"learning_rate": 2.2204058771890735e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19078528881072998,
"step": 1460,
"valid_targets_mean": 4792.8,
"valid_targets_min": 1685
},
{
"epoch": 3.644278606965174,
"grad_norm": 0.6125570787690607,
"learning_rate": 2.2080697341051777e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21356597542762756,
"step": 1465,
"valid_targets_mean": 3559.8,
"valid_targets_min": 2038
},
{
"epoch": 3.656716417910448,
"grad_norm": 0.5118359172048365,
"learning_rate": 2.195725583098611e-05,
"loss": 0.2055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20302622020244598,
"step": 1470,
"valid_targets_mean": 4243.6,
"valid_targets_min": 2620
},
{
"epoch": 3.6691542288557213,
"grad_norm": 0.5524385866849025,
"learning_rate": 2.183373899255321e-05,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1972339153289795,
"step": 1475,
"valid_targets_mean": 3786.9,
"valid_targets_min": 2602
},
{
"epoch": 3.681592039800995,
"grad_norm": 0.5519280039906248,
"learning_rate": 2.171015157951169e-05,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23621603846549988,
"step": 1480,
"valid_targets_mean": 4710.5,
"valid_targets_min": 2121
},
{
"epoch": 3.6940298507462686,
"grad_norm": 0.4961853443443449,
"learning_rate": 2.158649834833636e-05,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21436795592308044,
"step": 1485,
"valid_targets_mean": 4526.8,
"valid_targets_min": 2490
},
{
"epoch": 3.7064676616915424,
"grad_norm": 0.5544971340683077,
"learning_rate": 2.146278405803512e-05,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20669138431549072,
"step": 1490,
"valid_targets_mean": 3391.8,
"valid_targets_min": 228
},
{
"epoch": 3.718905472636816,
"grad_norm": 0.5059854792152241,
"learning_rate": 2.133901346996588e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2086849957704544,
"step": 1495,
"valid_targets_mean": 4446.4,
"valid_targets_min": 2480
},
{
"epoch": 3.7313432835820897,
"grad_norm": 0.5008031450948552,
"learning_rate": 2.1215191347653227e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20051947236061096,
"step": 1500,
"valid_targets_mean": 4183.6,
"valid_targets_min": 1422
},
{
"epoch": 3.743781094527363,
"grad_norm": 0.5016740412477303,
"learning_rate": 2.109132245660517e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2014276683330536,
"step": 1505,
"valid_targets_mean": 4293.1,
"valid_targets_min": 2065
},
{
"epoch": 3.756218905472637,
"grad_norm": 0.5773401034416584,
"learning_rate": 2.096741156412967e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24956290423870087,
"step": 1510,
"valid_targets_mean": 4016.8,
"valid_targets_min": 2328
},
{
"epoch": 3.7686567164179103,
"grad_norm": 0.5557509017649421,
"learning_rate": 2.084346343915118e-05,
"loss": 0.2061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21007095277309418,
"step": 1515,
"valid_targets_mean": 4184.1,
"valid_targets_min": 2042
},
{
"epoch": 3.781094527363184,
"grad_norm": 0.5069995725105243,
"learning_rate": 2.0719482852027122e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19801217317581177,
"step": 1520,
"valid_targets_mean": 4527.2,
"valid_targets_min": 2586
},
{
"epoch": 3.7935323383084576,
"grad_norm": 0.5072359725349612,
"learning_rate": 2.059547457436429e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21030068397521973,
"step": 1525,
"valid_targets_mean": 4119.2,
"valid_targets_min": 1876
},
{
"epoch": 3.8059701492537314,
"grad_norm": 0.5809162860083377,
"learning_rate": 2.0471443378835173e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20429758727550507,
"step": 1530,
"valid_targets_mean": 3375.6,
"valid_targets_min": 423
},
{
"epoch": 3.818407960199005,
"grad_norm": 0.6146168591855865,
"learning_rate": 2.0347394038994305e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20681461691856384,
"step": 1535,
"valid_targets_mean": 3487.4,
"valid_targets_min": 1170
},
{
"epoch": 3.8308457711442787,
"grad_norm": 0.5243852804360046,
"learning_rate": 2.0223331329094534e-05,
"loss": 0.2002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20334434509277344,
"step": 1540,
"valid_targets_mean": 3998.9,
"valid_targets_min": 1988
},
{
"epoch": 3.843283582089552,
"grad_norm": 0.5291633419029611,
"learning_rate": 2.0099260023903286e-05,
"loss": 0.211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18365240097045898,
"step": 1545,
"valid_targets_mean": 4010.1,
"valid_targets_min": 1927
},
{
"epoch": 3.855721393034826,
"grad_norm": 0.5121951623491455,
"learning_rate": 1.997518489851878e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20143933594226837,
"step": 1550,
"valid_targets_mean": 4428.3,
"valid_targets_min": 2098
},
{
"epoch": 3.8681592039800994,
"grad_norm": 0.5327816071630699,
"learning_rate": 1.985111072818626e-05,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2264530062675476,
"step": 1555,
"valid_targets_mean": 4157.4,
"valid_targets_min": 1472
},
{
"epoch": 3.8805970149253732,
"grad_norm": 0.5872325233516333,
"learning_rate": 1.9727042288114223e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21333108842372894,
"step": 1560,
"valid_targets_mean": 3713.8,
"valid_targets_min": 1874
},
{
"epoch": 3.8930348258706466,
"grad_norm": 0.5465903196708187,
"learning_rate": 1.9602984353290627e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20426753163337708,
"step": 1565,
"valid_targets_mean": 3976.4,
"valid_targets_min": 1752
},
{
"epoch": 3.9054726368159205,
"grad_norm": 0.48170818915584446,
"learning_rate": 1.9478941698299108e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19036681950092316,
"step": 1570,
"valid_targets_mean": 5013.6,
"valid_targets_min": 1987
},
{
"epoch": 3.917910447761194,
"grad_norm": 0.5470516146085361,
"learning_rate": 1.9354919097135233e-05,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20237231254577637,
"step": 1575,
"valid_targets_mean": 3921.6,
"valid_targets_min": 2194
},
{
"epoch": 3.9303482587064678,
"grad_norm": 0.49608737593410446,
"learning_rate": 1.9230921323022777e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19408315420150757,
"step": 1580,
"valid_targets_mean": 4462.3,
"valid_targets_min": 2876
},
{
"epoch": 3.942786069651741,
"grad_norm": 0.5215118271002951,
"learning_rate": 1.9106953148229986e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20697835087776184,
"step": 1585,
"valid_targets_mean": 4175.0,
"valid_targets_min": 2020
},
{
"epoch": 3.955223880597015,
"grad_norm": 0.5461860904207121,
"learning_rate": 1.8983019343885937e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2104094922542572,
"step": 1590,
"valid_targets_mean": 3759.0,
"valid_targets_min": 1717
},
{
"epoch": 3.9676616915422884,
"grad_norm": 0.5231042143924045,
"learning_rate": 1.8859124679796893e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21831703186035156,
"step": 1595,
"valid_targets_mean": 4261.8,
"valid_targets_min": 2399
},
{
"epoch": 3.9800995024875623,
"grad_norm": 0.5222686881020943,
"learning_rate": 1.8735273924262727e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2033132016658783,
"step": 1600,
"valid_targets_mean": 4387.1,
"valid_targets_min": 2804
},
{
"epoch": 3.9925373134328357,
"grad_norm": 0.6234021033332222,
"learning_rate": 1.8611471843893447e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19351506233215332,
"step": 1605,
"valid_targets_mean": 3928.3,
"valid_targets_min": 1828
},
{
"epoch": 4.0049751243781095,
"grad_norm": 0.5228099382124228,
"learning_rate": 1.848772320342568e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1864427924156189,
"step": 1610,
"valid_targets_mean": 4102.9,
"valid_targets_min": 2681
},
{
"epoch": 4.017412935323383,
"grad_norm": 0.5441470808752659,
"learning_rate": 1.8364032765539355e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2033585011959076,
"step": 1615,
"valid_targets_mean": 4462.2,
"valid_targets_min": 2005
},
{
"epoch": 4.029850746268656,
"grad_norm": 0.5740596060113697,
"learning_rate": 1.8240405290674348e-05,
"loss": 0.1899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1972273290157318,
"step": 1620,
"valid_targets_mean": 3756.9,
"valid_targets_min": 1255
},
{
"epoch": 4.04228855721393,
"grad_norm": 0.5719711729617718,
"learning_rate": 1.8116845536847306e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19884632527828217,
"step": 1625,
"valid_targets_mean": 4049.6,
"valid_targets_min": 374
},
{
"epoch": 4.054726368159204,
"grad_norm": 0.4974824417143702,
"learning_rate": 1.799335825946853e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18048778176307678,
"step": 1630,
"valid_targets_mean": 4554.6,
"valid_targets_min": 2925
},
{
"epoch": 4.067164179104478,
"grad_norm": 0.544654409825013,
"learning_rate": 1.7869948211158898e-05,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17982539534568787,
"step": 1635,
"valid_targets_mean": 4247.0,
"valid_targets_min": 1548
},
{
"epoch": 4.079601990049751,
"grad_norm": 0.5337906477339353,
"learning_rate": 1.774662014156705e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1838865578174591,
"step": 1640,
"valid_targets_mean": 3586.6,
"valid_targets_min": 1801
},
{
"epoch": 4.092039800995025,
"grad_norm": 0.5334091034891687,
"learning_rate": 1.762337879718649e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20184041559696198,
"step": 1645,
"valid_targets_mean": 4037.2,
"valid_targets_min": 2085
},
{
"epoch": 4.104477611940299,
"grad_norm": 0.48859337981552636,
"learning_rate": 1.750022892117296e-05,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17627070844173431,
"step": 1650,
"valid_targets_mean": 4640.4,
"valid_targets_min": 2534
},
{
"epoch": 4.116915422885572,
"grad_norm": 0.5661329566773484,
"learning_rate": 1.7377175253161907e-05,
"loss": 0.1851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17362037301063538,
"step": 1655,
"valid_targets_mean": 4436.4,
"valid_targets_min": 2446
},
{
"epoch": 4.129353233830845,
"grad_norm": 0.5703288632207718,
"learning_rate": 1.7254222529086024e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19699379801750183,
"step": 1660,
"valid_targets_mean": 4017.1,
"valid_targets_min": 2457
},
{
"epoch": 4.141791044776119,
"grad_norm": 0.681732512062585,
"learning_rate": 1.7131375480993014e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18208718299865723,
"step": 1665,
"valid_targets_mean": 4043.7,
"valid_targets_min": 960
},
{
"epoch": 4.154228855721393,
"grad_norm": 0.4723457137036097,
"learning_rate": 1.7008638836863455e-05,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17454874515533447,
"step": 1670,
"valid_targets_mean": 4918.2,
"valid_targets_min": 2042
},
{
"epoch": 4.166666666666667,
"grad_norm": 0.5581086668881344,
"learning_rate": 1.6886017320428817e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18187645077705383,
"step": 1675,
"valid_targets_mean": 3673.4,
"valid_targets_min": 2213
},
{
"epoch": 4.17910447761194,
"grad_norm": 0.6292356323245095,
"learning_rate": 1.676351565098973e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19597412645816803,
"step": 1680,
"valid_targets_mean": 3223.8,
"valid_targets_min": 1178
},
{
"epoch": 4.191542288557214,
"grad_norm": 0.5771443261900594,
"learning_rate": 1.6641138543234253e-05,
"loss": 0.2058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23651202023029327,
"step": 1685,
"valid_targets_mean": 3848.0,
"valid_targets_min": 443
},
{
"epoch": 4.203980099502488,
"grad_norm": 0.5522616677962544,
"learning_rate": 1.6518890707056522e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1811617612838745,
"step": 1690,
"valid_targets_mean": 4084.1,
"valid_targets_min": 1696
},
{
"epoch": 4.2164179104477615,
"grad_norm": 0.5796056383907187,
"learning_rate": 1.639677684737539e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18784770369529724,
"step": 1695,
"valid_targets_mean": 3328.5,
"valid_targets_min": 1507
},
{
"epoch": 4.2288557213930345,
"grad_norm": 0.622905968717353,
"learning_rate": 1.6274801663953415e-05,
"loss": 0.1836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1970984935760498,
"step": 1700,
"valid_targets_mean": 3623.7,
"valid_targets_min": 1520
},
{
"epoch": 4.241293532338308,
"grad_norm": 0.5349694808917531,
"learning_rate": 1.6152969851215966e-05,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17795711755752563,
"step": 1705,
"valid_targets_mean": 4193.2,
"valid_targets_min": 1270
},
{
"epoch": 4.253731343283582,
"grad_norm": 0.6065208601441333,
"learning_rate": 1.6031286098070523e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19792214035987854,
"step": 1710,
"valid_targets_mean": 3305.4,
"valid_targets_min": 1130
},
{
"epoch": 4.266169154228856,
"grad_norm": 0.6573570535633596,
"learning_rate": 1.5909755087726265e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19432350993156433,
"step": 1715,
"valid_targets_mean": 4008.4,
"valid_targets_min": 200
},
{
"epoch": 4.278606965174129,
"grad_norm": 0.561968603462814,
"learning_rate": 1.5788381497513784e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1960953325033188,
"step": 1720,
"valid_targets_mean": 4200.1,
"valid_targets_min": 1752
},
{
"epoch": 4.291044776119403,
"grad_norm": 0.5705642184565684,
"learning_rate": 1.5667169998705065e-05,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19628682732582092,
"step": 1725,
"valid_targets_mean": 4268.7,
"valid_targets_min": 2160
},
{
"epoch": 4.303482587064677,
"grad_norm": 0.5543526015290202,
"learning_rate": 1.5546125256333778e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20755350589752197,
"step": 1730,
"valid_targets_mean": 4264.7,
"valid_targets_min": 1388
},
{
"epoch": 4.3159203980099505,
"grad_norm": 0.5131024835801369,
"learning_rate": 1.5425251929015635e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1865994930267334,
"step": 1735,
"valid_targets_mean": 4723.0,
"valid_targets_min": 2825
},
{
"epoch": 4.3283582089552235,
"grad_norm": 0.5369465865720151,
"learning_rate": 1.5304554668769175e-05,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16630160808563232,
"step": 1740,
"valid_targets_mean": 4633.6,
"valid_targets_min": 1557
},
{
"epoch": 4.340796019900497,
"grad_norm": 0.5488638067704708,
"learning_rate": 1.5184038120836678e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19109171628952026,
"step": 1745,
"valid_targets_mean": 4214.2,
"valid_targets_min": 1109
},
{
"epoch": 4.353233830845771,
"grad_norm": 0.6194076089336067,
"learning_rate": 1.5063706923505392e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2046584188938141,
"step": 1750,
"valid_targets_mean": 3853.9,
"valid_targets_min": 2765
},
{
"epoch": 4.365671641791045,
"grad_norm": 0.5294295584701465,
"learning_rate": 1.494356570792905e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18276120722293854,
"step": 1755,
"valid_targets_mean": 4236.4,
"valid_targets_min": 1666
},
{
"epoch": 4.378109452736318,
"grad_norm": 0.585302204807222,
"learning_rate": 1.4823619097949584e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19066128134727478,
"step": 1760,
"valid_targets_mean": 3614.5,
"valid_targets_min": 2120
},
{
"epoch": 4.390547263681592,
"grad_norm": 0.5450990664960823,
"learning_rate": 1.4703871709919217e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1853064000606537,
"step": 1765,
"valid_targets_mean": 4034.2,
"valid_targets_min": 1155
},
{
"epoch": 4.402985074626866,
"grad_norm": 0.5070494966282225,
"learning_rate": 1.4584328152522762e-05,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19450125098228455,
"step": 1770,
"valid_targets_mean": 4716.2,
"valid_targets_min": 970
},
{
"epoch": 4.41542288557214,
"grad_norm": 0.5501844594868129,
"learning_rate": 1.446499302660024e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17513319849967957,
"step": 1775,
"valid_targets_mean": 3711.8,
"valid_targets_min": 2079
},
{
"epoch": 4.4278606965174125,
"grad_norm": 0.591362418900047,
"learning_rate": 1.4345870924969862e-05,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20799198746681213,
"step": 1780,
"valid_targets_mean": 4011.0,
"valid_targets_min": 2539
},
{
"epoch": 4.440298507462686,
"grad_norm": 0.5193747556433063,
"learning_rate": 1.4226966432251201e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19595052301883698,
"step": 1785,
"valid_targets_mean": 4659.1,
"valid_targets_min": 2807
},
{
"epoch": 4.45273631840796,
"grad_norm": 0.5569115821469196,
"learning_rate": 1.4108284124688796e-05,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19918416440486908,
"step": 1790,
"valid_targets_mean": 4438.2,
"valid_targets_min": 1874
},
{
"epoch": 4.465174129353234,
"grad_norm": 0.5283360905638507,
"learning_rate": 1.3989828569976003e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1961868703365326,
"step": 1795,
"valid_targets_mean": 4511.8,
"valid_targets_min": 1407
},
{
"epoch": 4.477611940298507,
"grad_norm": 0.5532204571218482,
"learning_rate": 1.3871604327079184e-05,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1693786382675171,
"step": 1800,
"valid_targets_mean": 3788.8,
"valid_targets_min": 1567
},
{
"epoch": 4.490049751243781,
"grad_norm": 0.5359674168093468,
"learning_rate": 1.37536159460623e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.183126300573349,
"step": 1805,
"valid_targets_mean": 4236.6,
"valid_targets_min": 1831
},
{
"epoch": 4.502487562189055,
"grad_norm": 0.5263751071985473,
"learning_rate": 1.3635867967911734e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18391427397727966,
"step": 1810,
"valid_targets_mean": 4034.3,
"valid_targets_min": 2682
},
{
"epoch": 4.514925373134329,
"grad_norm": 0.6145126374437491,
"learning_rate": 1.3518364924361564e-05,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18755874037742615,
"step": 1815,
"valid_targets_mean": 3663.2,
"valid_targets_min": 941
},
{
"epoch": 4.5273631840796025,
"grad_norm": 0.5461908468497769,
"learning_rate": 1.340111133771913e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19034013152122498,
"step": 1820,
"valid_targets_mean": 4258.0,
"valid_targets_min": 2231
},
{
"epoch": 4.539800995024875,
"grad_norm": 0.5437588969087739,
"learning_rate": 1.3284111720690987e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18442508578300476,
"step": 1825,
"valid_targets_mean": 3990.9,
"valid_targets_min": 2466
},
{
"epoch": 4.552238805970149,
"grad_norm": 0.5315792588743522,
"learning_rate": 1.3167370576209253e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18224917352199554,
"step": 1830,
"valid_targets_mean": 4163.6,
"valid_targets_min": 2181
},
{
"epoch": 4.564676616915423,
"grad_norm": 0.5757247651612372,
"learning_rate": 1.305089239725826e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20078767836093903,
"step": 1835,
"valid_targets_mean": 4150.7,
"valid_targets_min": 1840
},
{
"epoch": 4.577114427860696,
"grad_norm": 0.5938129394057137,
"learning_rate": 1.2934681666701674e-05,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18216751515865326,
"step": 1840,
"valid_targets_mean": 4025.4,
"valid_targets_min": 2013
},
{
"epoch": 4.58955223880597,
"grad_norm": 0.6028091843290723,
"learning_rate": 1.2818742857109947e-05,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19109377264976501,
"step": 1845,
"valid_targets_mean": 3510.1,
"valid_targets_min": 228
},
{
"epoch": 4.601990049751244,
"grad_norm": 0.5776897498789417,
"learning_rate": 1.270308043058816e-05,
"loss": 0.1905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18680351972579956,
"step": 1850,
"valid_targets_mean": 3375.8,
"valid_targets_min": 1071
},
{
"epoch": 4.614427860696518,
"grad_norm": 0.5240221774849542,
"learning_rate": 1.2587698838604357e-05,
"loss": 0.1925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1797061264514923,
"step": 1855,
"valid_targets_mean": 4271.2,
"valid_targets_min": 1977
},
{
"epoch": 4.6268656716417915,
"grad_norm": 0.5639717377124501,
"learning_rate": 1.2472602521818136e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21001404523849487,
"step": 1860,
"valid_targets_mean": 3991.2,
"valid_targets_min": 1970
},
{
"epoch": 4.6393034825870645,
"grad_norm": 0.5205449157527914,
"learning_rate": 1.2357795909909831e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21091000735759735,
"step": 1865,
"valid_targets_mean": 4543.5,
"valid_targets_min": 1236
},
{
"epoch": 4.651741293532338,
"grad_norm": 0.5642643394569002,
"learning_rate": 1.2243283421409944e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19856856763362885,
"step": 1870,
"valid_targets_mean": 4086.1,
"valid_targets_min": 2486
},
{
"epoch": 4.664179104477612,
"grad_norm": 0.5328298872378295,
"learning_rate": 1.2129069463529147e-05,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1959315538406372,
"step": 1875,
"valid_targets_mean": 4242.9,
"valid_targets_min": 2666
},
{
"epoch": 4.676616915422885,
"grad_norm": 0.553203140113736,
"learning_rate": 1.2015158431988656e-05,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1867968738079071,
"step": 1880,
"valid_targets_mean": 4032.2,
"valid_targets_min": 1997
},
{
"epoch": 4.689054726368159,
"grad_norm": 0.579092184466775,
"learning_rate": 1.1901554710851022e-05,
"loss": 0.2058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20128527283668518,
"step": 1885,
"valid_targets_mean": 3413.8,
"valid_targets_min": 973
},
{
"epoch": 4.701492537313433,
"grad_norm": 0.6107118718654273,
"learning_rate": 1.1788262672351451e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19431200623512268,
"step": 1890,
"valid_targets_mean": 3529.1,
"valid_targets_min": 1539
},
{
"epoch": 4.713930348258707,
"grad_norm": 0.5389866374015265,
"learning_rate": 1.1675286676729489e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19274672865867615,
"step": 1895,
"valid_targets_mean": 4071.8,
"valid_targets_min": 2330
},
{
"epoch": 4.726368159203981,
"grad_norm": 0.5466037683250415,
"learning_rate": 1.1562631072061214e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1851121038198471,
"step": 1900,
"valid_targets_mean": 4066.6,
"valid_targets_min": 2216
},
{
"epoch": 4.7388059701492535,
"grad_norm": 0.5172604730124416,
"learning_rate": 1.1450300194091936e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18047800660133362,
"step": 1905,
"valid_targets_mean": 4594.6,
"valid_targets_min": 852
},
{
"epoch": 4.751243781094527,
"grad_norm": 0.5097432319490798,
"learning_rate": 1.1338298366069282e-05,
"loss": 0.1899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17912769317626953,
"step": 1910,
"valid_targets_mean": 4337.2,
"valid_targets_min": 921
},
{
"epoch": 4.763681592039801,
"grad_norm": 0.527120343823522,
"learning_rate": 1.1226629898576818e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22057533264160156,
"step": 1915,
"valid_targets_mean": 4766.2,
"valid_targets_min": 2509
},
{
"epoch": 4.776119402985074,
"grad_norm": 0.5341316468563161,
"learning_rate": 1.1115299089368163e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18534281849861145,
"step": 1920,
"valid_targets_mean": 3921.1,
"valid_targets_min": 2193
},
{
"epoch": 4.788557213930348,
"grad_norm": 0.5460035866192121,
"learning_rate": 1.1004310223201567e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20613934099674225,
"step": 1925,
"valid_targets_mean": 4485.4,
"valid_targets_min": 2111
},
{
"epoch": 4.800995024875622,
"grad_norm": 0.5517532913974614,
"learning_rate": 1.089366757167504e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1839025318622589,
"step": 1930,
"valid_targets_mean": 3908.1,
"valid_targets_min": 2332
},
{
"epoch": 4.813432835820896,
"grad_norm": 0.529510753958286,
"learning_rate": 1.0783375393061867e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19102586805820465,
"step": 1935,
"valid_targets_mean": 4116.6,
"valid_targets_min": 2062
},
{
"epoch": 4.82587064676617,
"grad_norm": 0.5194175454337181,
"learning_rate": 1.0673437932146844e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1900445818901062,
"step": 1940,
"valid_targets_mean": 5161.1,
"valid_targets_min": 2400
},
{
"epoch": 4.838308457711443,
"grad_norm": 0.5563197452474851,
"learning_rate": 1.05638594200628e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1914559304714203,
"step": 1945,
"valid_targets_mean": 3629.1,
"valid_targets_min": 1381
},
{
"epoch": 4.850746268656716,
"grad_norm": 0.5125531536441792,
"learning_rate": 1.0454644074127818e-05,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17317280173301697,
"step": 1950,
"valid_targets_mean": 4402.2,
"valid_targets_min": 1409
},
{
"epoch": 4.86318407960199,
"grad_norm": 0.5514274931255213,
"learning_rate": 1.0345796097682896e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1964603066444397,
"step": 1955,
"valid_targets_mean": 4132.4,
"valid_targets_min": 2369
},
{
"epoch": 4.875621890547263,
"grad_norm": 0.542246915785968,
"learning_rate": 1.023731967993018e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19377470016479492,
"step": 1960,
"valid_targets_mean": 4014.6,
"valid_targets_min": 2105
},
{
"epoch": 4.888059701492537,
"grad_norm": 0.5081914366033573,
"learning_rate": 1.0129218995771766e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17151615023612976,
"step": 1965,
"valid_targets_mean": 3851.6,
"valid_targets_min": 196
},
{
"epoch": 4.900497512437811,
"grad_norm": 0.5987169529933362,
"learning_rate": 1.002149820564897e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2023550570011139,
"step": 1970,
"valid_targets_mean": 3578.8,
"valid_targets_min": 1055
},
{
"epoch": 4.912935323383085,
"grad_norm": 0.5582434934098669,
"learning_rate": 9.914161455382215e-06,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1893100142478943,
"step": 1975,
"valid_targets_mean": 3755.3,
"valid_targets_min": 1619
},
{
"epoch": 4.925373134328359,
"grad_norm": 0.524299212994188,
"learning_rate": 9.807212876011528e-06,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19495365023612976,
"step": 1980,
"valid_targets_mean": 4259.8,
"valid_targets_min": 317
},
{
"epoch": 4.937810945273632,
"grad_norm": 0.5458717305766948,
"learning_rate": 9.700656583637484e-06,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18475620448589325,
"step": 1985,
"valid_targets_mean": 3955.7,
"valid_targets_min": 1312
},
{
"epoch": 4.9502487562189055,
"grad_norm": 0.5988339564997255,
"learning_rate": 9.594496679262822e-06,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20608876645565033,
"step": 1990,
"valid_targets_mean": 3641.8,
"valid_targets_min": 1811
},
{
"epoch": 4.962686567164179,
"grad_norm": 0.5140756054780553,
"learning_rate": 9.488737248634603e-06,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21765117347240448,
"step": 1995,
"valid_targets_mean": 5012.4,
"valid_targets_min": 2130
},
{
"epoch": 4.975124378109452,
"grad_norm": 0.5750911579001797,
"learning_rate": 9.383382362086959e-06,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19809523224830627,
"step": 2000,
"valid_targets_mean": 3847.8,
"valid_targets_min": 1889
},
{
"epoch": 4.987562189054726,
"grad_norm": 0.5469643211901647,
"learning_rate": 9.27843607438447e-06,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19203123450279236,
"step": 2005,
"valid_targets_mean": 3831.5,
"valid_targets_min": 1988
},
{
"epoch": 5.0,
"grad_norm": 0.5145051979175338,
"learning_rate": 9.173902424566057e-06,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19573429226875305,
"step": 2010,
"valid_targets_mean": 4327.5,
"valid_targets_min": 2066
},
{
"epoch": 5.012437810945274,
"grad_norm": 0.48975408551998934,
"learning_rate": 9.06978543578957e-06,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17476843297481537,
"step": 2015,
"valid_targets_mean": 4369.6,
"valid_targets_min": 1170
},
{
"epoch": 5.024875621890548,
"grad_norm": 1.1782763959202165,
"learning_rate": 8.966089115176945e-06,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17875716090202332,
"step": 2020,
"valid_targets_mean": 4059.2,
"valid_targets_min": 1149
},
{
"epoch": 5.037313432835821,
"grad_norm": 0.5373043390636772,
"learning_rate": 8.862817453659968e-06,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1860535442829132,
"step": 2025,
"valid_targets_mean": 4277.5,
"valid_targets_min": 2642
},
{
"epoch": 5.0497512437810945,
"grad_norm": 0.5331643182583649,
"learning_rate": 8.759974425826696e-06,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16362561285495758,
"step": 2030,
"valid_targets_mean": 3765.5,
"valid_targets_min": 2097
},
{
"epoch": 5.062189054726368,
"grad_norm": 0.544019833677962,
"learning_rate": 8.657563989768467e-06,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2051907181739807,
"step": 2035,
"valid_targets_mean": 4519.1,
"valid_targets_min": 2674
},
{
"epoch": 5.074626865671641,
"grad_norm": 0.62327450747123,
"learning_rate": 8.555590086927602e-06,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19175231456756592,
"step": 2040,
"valid_targets_mean": 3685.4,
"valid_targets_min": 853
},
{
"epoch": 5.087064676616915,
"grad_norm": 0.5308764481118281,
"learning_rate": 8.454056641945665e-06,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1750047206878662,
"step": 2045,
"valid_targets_mean": 4141.5,
"valid_targets_min": 2422
},
{
"epoch": 5.099502487562189,
"grad_norm": 0.5185262701369572,
"learning_rate": 8.352967562512448e-06,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1702880859375,
"step": 2050,
"valid_targets_mean": 4598.6,
"valid_targets_min": 1330
},
{
"epoch": 5.111940298507463,
"grad_norm": 0.5829644925735894,
"learning_rate": 8.252326739215568e-06,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1757672280073166,
"step": 2055,
"valid_targets_mean": 3722.4,
"valid_targets_min": 1948
},
{
"epoch": 5.124378109452737,
"grad_norm": 0.5984769834446014,
"learning_rate": 8.152138045390725e-06,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19725893437862396,
"step": 2060,
"valid_targets_mean": 3535.5,
"valid_targets_min": 1839
},
{
"epoch": 5.13681592039801,
"grad_norm": 0.4884187116919498,
"learning_rate": 8.052405336972659e-06,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16476622223854065,
"step": 2065,
"valid_targets_mean": 4477.9,
"valid_targets_min": 1939
},
{
"epoch": 5.149253731343284,
"grad_norm": 0.8229280153452522,
"learning_rate": 7.953132452346693e-06,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16132110357284546,
"step": 2070,
"valid_targets_mean": 3924.3,
"valid_targets_min": 1278
},
{
"epoch": 5.161691542288557,
"grad_norm": 0.4724798431111937,
"learning_rate": 7.854323212201047e-06,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17464956641197205,
"step": 2075,
"valid_targets_mean": 5130.9,
"valid_targets_min": 3182
},
{
"epoch": 5.174129353233831,
"grad_norm": 0.6676453133494172,
"learning_rate": 7.75598141937981e-06,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17902524769306183,
"step": 2080,
"valid_targets_mean": 3899.2,
"valid_targets_min": 1769
},
{
"epoch": 5.186567164179104,
"grad_norm": 0.581722657791125,
"learning_rate": 7.658110858736523e-06,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1738991141319275,
"step": 2085,
"valid_targets_mean": 4717.8,
"valid_targets_min": 1597
},
{
"epoch": 5.199004975124378,
"grad_norm": 0.6119229068009544,
"learning_rate": 7.560715296988554e-06,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16843843460083008,
"step": 2090,
"valid_targets_mean": 3586.2,
"valid_targets_min": 1305
},
{
"epoch": 5.211442786069652,
"grad_norm": 0.6296917134765727,
"learning_rate": 7.463798482572122e-06,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17999431490898132,
"step": 2095,
"valid_targets_mean": 3528.2,
"valid_targets_min": 1513
},
{
"epoch": 5.223880597014926,
"grad_norm": 0.545873150726275,
"learning_rate": 7.36736414549802e-06,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18782277405261993,
"step": 2100,
"valid_targets_mean": 4359.8,
"valid_targets_min": 2033
},
{
"epoch": 5.236318407960199,
"grad_norm": 0.5785180015454172,
"learning_rate": 7.271415997208093e-06,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1869148463010788,
"step": 2105,
"valid_targets_mean": 3707.5,
"valid_targets_min": 2328
},
{
"epoch": 5.248756218905473,
"grad_norm": 0.5764954136094295,
"learning_rate": 7.17595773043233e-06,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18479612469673157,
"step": 2110,
"valid_targets_mean": 4026.6,
"valid_targets_min": 2210
},
{
"epoch": 5.2611940298507465,
"grad_norm": 0.5204559401076309,
"learning_rate": 7.080993019046827e-06,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17545653879642487,
"step": 2115,
"valid_targets_mean": 4619.4,
"valid_targets_min": 2520
},
{
"epoch": 5.273631840796019,
"grad_norm": 0.5629684650741945,
"learning_rate": 6.986525517932321e-06,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16429266333580017,
"step": 2120,
"valid_targets_mean": 3826.1,
"valid_targets_min": 1140
},
{
"epoch": 5.286069651741293,
"grad_norm": 0.5207487254296341,
"learning_rate": 6.892558862833569e-06,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17473994195461273,
"step": 2125,
"valid_targets_mean": 4406.2,
"valid_targets_min": 2004
},
{
"epoch": 5.298507462686567,
"grad_norm": 0.6137205942170112,
"learning_rate": 6.799096670219396e-06,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18868446350097656,
"step": 2130,
"valid_targets_mean": 4076.2,
"valid_targets_min": 1472
},
{
"epoch": 5.310945273631841,
"grad_norm": 0.4900273933795682,
"learning_rate": 6.706142537143518e-06,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17624013125896454,
"step": 2135,
"valid_targets_mean": 5214.7,
"valid_targets_min": 1883
},
{
"epoch": 5.323383084577115,
"grad_norm": 0.5288471175274457,
"learning_rate": 6.613700041106119e-06,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18341976404190063,
"step": 2140,
"valid_targets_mean": 4289.6,
"valid_targets_min": 1156
},
{
"epoch": 5.335820895522388,
"grad_norm": 0.5519799885784733,
"learning_rate": 6.521772739916137e-06,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16220718622207642,
"step": 2145,
"valid_targets_mean": 4097.6,
"valid_targets_min": 1881
},
{
"epoch": 5.348258706467662,
"grad_norm": 0.641394208147078,
"learning_rate": 6.430364171554329e-06,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1815165877342224,
"step": 2150,
"valid_targets_mean": 3265.1,
"valid_targets_min": 222
},
{
"epoch": 5.3606965174129355,
"grad_norm": 0.5017060911996063,
"learning_rate": 6.33947785403716e-06,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15326166152954102,
"step": 2155,
"valid_targets_mean": 4282.4,
"valid_targets_min": 1306
},
{
"epoch": 5.373134328358209,
"grad_norm": 0.5629109675071312,
"learning_rate": 6.249117285281348e-06,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19157464802265167,
"step": 2160,
"valid_targets_mean": 4362.0,
"valid_targets_min": 1910
},
{
"epoch": 5.385572139303482,
"grad_norm": 0.5573924452067587,
"learning_rate": 6.159285942969266e-06,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18228746950626373,
"step": 2165,
"valid_targets_mean": 3975.6,
"valid_targets_min": 2189
},
{
"epoch": 5.398009950248756,
"grad_norm": 0.5588862231529654,
"learning_rate": 6.0699872844151e-06,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20605233311653137,
"step": 2170,
"valid_targets_mean": 4185.6,
"valid_targets_min": 1682
},
{
"epoch": 5.41044776119403,
"grad_norm": 0.5819160509013732,
"learning_rate": 5.9812247464317685e-06,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1820629984140396,
"step": 2175,
"valid_targets_mean": 3783.1,
"valid_targets_min": 941
},
{
"epoch": 5.422885572139304,
"grad_norm": 0.5625161894644168,
"learning_rate": 5.893001745198692e-06,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17581865191459656,
"step": 2180,
"valid_targets_mean": 3561.9,
"valid_targets_min": 2275
},
{
"epoch": 5.435323383084577,
"grad_norm": 0.5946540446785107,
"learning_rate": 5.805321676130262e-06,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1829841583967209,
"step": 2185,
"valid_targets_mean": 3860.6,
"valid_targets_min": 2281
},
{
"epoch": 5.447761194029851,
"grad_norm": 0.5531530928449198,
"learning_rate": 5.718187913745199e-06,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1640455424785614,
"step": 2190,
"valid_targets_mean": 4010.9,
"valid_targets_min": 1509
},
{
"epoch": 5.460199004975125,
"grad_norm": 0.5893338522051409,
"learning_rate": 5.631603811536668e-06,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1882874071598053,
"step": 2195,
"valid_targets_mean": 3535.2,
"valid_targets_min": 1706
},
{
"epoch": 5.472636815920398,
"grad_norm": 0.6073509265616175,
"learning_rate": 5.545572701843216e-06,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18738335371017456,
"step": 2200,
"valid_targets_mean": 4425.8,
"valid_targets_min": 2013
},
{
"epoch": 5.485074626865671,
"grad_norm": 0.5310642730413633,
"learning_rate": 5.4600978957205135e-06,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.168120339512825,
"step": 2205,
"valid_targets_mean": 3844.4,
"valid_targets_min": 1734
},
{
"epoch": 5.497512437810945,
"grad_norm": 0.555820405124083,
"learning_rate": 5.375182682813929e-06,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1976512372493744,
"step": 2210,
"valid_targets_mean": 3939.1,
"valid_targets_min": 1724
},
{
"epoch": 5.509950248756219,
"grad_norm": 0.5509023684550313,
"learning_rate": 5.290830331231933e-06,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1776900589466095,
"step": 2215,
"valid_targets_mean": 4289.1,
"valid_targets_min": 1658
},
{
"epoch": 5.522388059701493,
"grad_norm": 0.5113496796090481,
"learning_rate": 5.2070440874202925e-06,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17290140688419342,
"step": 2220,
"valid_targets_mean": 4486.5,
"valid_targets_min": 1644
},
{
"epoch": 5.534825870646766,
"grad_norm": 0.5419706723077836,
"learning_rate": 5.123827176037146e-06,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18113742768764496,
"step": 2225,
"valid_targets_mean": 4176.4,
"valid_targets_min": 1097
},
{
"epoch": 5.54726368159204,
"grad_norm": 0.5714071952278112,
"learning_rate": 5.041182799828888e-06,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16627778112888336,
"step": 2230,
"valid_targets_mean": 3533.5,
"valid_targets_min": 1673
},
{
"epoch": 5.559701492537314,
"grad_norm": 0.5631880598259031,
"learning_rate": 4.959114139506909e-06,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16612115502357483,
"step": 2235,
"valid_targets_mean": 3968.1,
"valid_targets_min": 2003
},
{
"epoch": 5.572139303482587,
"grad_norm": 0.5954530663996263,
"learning_rate": 4.877624353625197e-06,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18126454949378967,
"step": 2240,
"valid_targets_mean": 3962.8,
"valid_targets_min": 2013
},
{
"epoch": 5.58457711442786,
"grad_norm": 0.5504249794441187,
"learning_rate": 4.7967165784587284e-06,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19141951203346252,
"step": 2245,
"valid_targets_mean": 4483.5,
"valid_targets_min": 1041
},
{
"epoch": 5.597014925373134,
"grad_norm": 0.6159216942243276,
"learning_rate": 4.71639392788281e-06,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18392285704612732,
"step": 2250,
"valid_targets_mean": 3742.2,
"valid_targets_min": 1851
},
{
"epoch": 5.609452736318408,
"grad_norm": 0.6025337544936586,
"learning_rate": 4.6366594932532285e-06,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19583985209465027,
"step": 2255,
"valid_targets_mean": 3859.6,
"valid_targets_min": 1696
},
{
"epoch": 5.621890547263682,
"grad_norm": 0.5398477942967179,
"learning_rate": 4.557516343287251e-06,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1676681786775589,
"step": 2260,
"valid_targets_mean": 3899.4,
"valid_targets_min": 448
},
{
"epoch": 5.634328358208955,
"grad_norm": 0.5503845662196336,
"learning_rate": 4.4789675239455385e-06,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17880871891975403,
"step": 2265,
"valid_targets_mean": 3832.9,
"valid_targets_min": 1595
},
{
"epoch": 5.646766169154229,
"grad_norm": 0.5103257331663372,
"learning_rate": 4.401016058314913e-06,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17229273915290833,
"step": 2270,
"valid_targets_mean": 4335.1,
"valid_targets_min": 1417
},
{
"epoch": 5.659203980099503,
"grad_norm": 0.5094018756134759,
"learning_rate": 4.3236649464919986e-06,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16803838312625885,
"step": 2275,
"valid_targets_mean": 4230.3,
"valid_targets_min": 2119
},
{
"epoch": 5.6716417910447765,
"grad_norm": 0.5319736807745282,
"learning_rate": 4.246917165467799e-06,
"loss": 0.1816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19026246666908264,
"step": 2280,
"valid_targets_mean": 4721.9,
"valid_targets_min": 2278
},
{
"epoch": 5.6840796019900495,
"grad_norm": 0.5869835916274105,
"learning_rate": 4.170775669013041e-06,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18648019433021545,
"step": 2285,
"valid_targets_mean": 3507.3,
"valid_targets_min": 2093
},
{
"epoch": 5.696517412935323,
"grad_norm": 0.5334102609956934,
"learning_rate": 4.095243387564593e-06,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18063801527023315,
"step": 2290,
"valid_targets_mean": 4553.8,
"valid_targets_min": 2042
},
{
"epoch": 5.708955223880597,
"grad_norm": 0.5694193724204722,
"learning_rate": 4.020323228112604e-06,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1846069097518921,
"step": 2295,
"valid_targets_mean": 4064.2,
"valid_targets_min": 1370
},
{
"epoch": 5.721393034825871,
"grad_norm": 0.5452728006991922,
"learning_rate": 3.9460180740886625e-06,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17648135125637054,
"step": 2300,
"valid_targets_mean": 4065.1,
"valid_targets_min": 2102
},
{
"epoch": 5.733830845771144,
"grad_norm": 0.5669921219625754,
"learning_rate": 3.872330785254803e-06,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18603132665157318,
"step": 2305,
"valid_targets_mean": 3896.8,
"valid_targets_min": 1993
},
{
"epoch": 5.746268656716418,
"grad_norm": 0.5623459293769465,
"learning_rate": 3.7992641975934595e-06,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1948518455028534,
"step": 2310,
"valid_targets_mean": 4391.6,
"valid_targets_min": 1950
},
{
"epoch": 5.758706467661692,
"grad_norm": 0.5330298017777138,
"learning_rate": 3.7268211231983185e-06,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1722792387008667,
"step": 2315,
"valid_targets_mean": 4296.8,
"valid_targets_min": 2070
},
{
"epoch": 5.7711442786069655,
"grad_norm": 0.6779738524621803,
"learning_rate": 3.6550043501660736e-06,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17438241839408875,
"step": 2320,
"valid_targets_mean": 3621.8,
"valid_targets_min": 1850
},
{
"epoch": 5.7835820895522385,
"grad_norm": 0.6308227572737273,
"learning_rate": 3.583816642489113e-06,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18285539746284485,
"step": 2325,
"valid_targets_mean": 3364.1,
"valid_targets_min": 1441
},
{
"epoch": 5.796019900497512,
"grad_norm": 0.5466656922264711,
"learning_rate": 3.513260739949196e-06,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.160654678940773,
"step": 2330,
"valid_targets_mean": 3844.6,
"valid_targets_min": 2190
},
{
"epoch": 5.808457711442786,
"grad_norm": 0.5473761351277354,
"learning_rate": 3.4433393580119436e-06,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17680670320987701,
"step": 2335,
"valid_targets_mean": 3974.6,
"valid_targets_min": 1692
},
{
"epoch": 5.82089552238806,
"grad_norm": 0.549317498826441,
"learning_rate": 3.3740551877223647e-06,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17757967114448547,
"step": 2340,
"valid_targets_mean": 3935.1,
"valid_targets_min": 2554
},
{
"epoch": 5.833333333333333,
"grad_norm": 0.5224545749951351,
"learning_rate": 3.30541089560128e-06,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16635212302207947,
"step": 2345,
"valid_targets_mean": 4472.9,
"valid_targets_min": 2049
},
{
"epoch": 5.845771144278607,
"grad_norm": 0.5477440996260752,
"learning_rate": 3.2374091235426918e-06,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16781067848205566,
"step": 2350,
"valid_targets_mean": 3725.6,
"valid_targets_min": 2020
},
{
"epoch": 5.858208955223881,
"grad_norm": 0.6293176391340207,
"learning_rate": 3.1700524887121188e-06,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.193925142288208,
"step": 2355,
"valid_targets_mean": 3524.7,
"valid_targets_min": 1801
},
{
"epoch": 5.870646766169155,
"grad_norm": 0.5849523473688234,
"learning_rate": 3.103343583445848e-06,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18686872720718384,
"step": 2360,
"valid_targets_mean": 3800.3,
"valid_targets_min": 2279
},
{
"epoch": 5.883084577114428,
"grad_norm": 0.546446441498615,
"learning_rate": 3.037284975151182e-06,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.174645334482193,
"step": 2365,
"valid_targets_mean": 4354.5,
"valid_targets_min": 2242
},
{
"epoch": 5.895522388059701,
"grad_norm": 0.6294684870590153,
"learning_rate": 2.9718792062076264e-06,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16901081800460815,
"step": 2370,
"valid_targets_mean": 3182.9,
"valid_targets_min": 960
},
{
"epoch": 5.907960199004975,
"grad_norm": 0.545529756238248,
"learning_rate": 2.9071287938690298e-06,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19544681906700134,
"step": 2375,
"valid_targets_mean": 4001.1,
"valid_targets_min": 915
},
{
"epoch": 5.920398009950249,
"grad_norm": 0.5761291485378018,
"learning_rate": 2.843036230166718e-06,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17292159795761108,
"step": 2380,
"valid_targets_mean": 3945.6,
"valid_targets_min": 1765
},
{
"epoch": 5.932835820895522,
"grad_norm": 0.5200481295816748,
"learning_rate": 2.779603981813568e-06,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1651022732257843,
"step": 2385,
"valid_targets_mean": 4494.5,
"valid_targets_min": 860
},
{
"epoch": 5.945273631840796,
"grad_norm": 0.5690349697582774,
"learning_rate": 2.7168344901091016e-06,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17301228642463684,
"step": 2390,
"valid_targets_mean": 4024.2,
"valid_targets_min": 2194
},
{
"epoch": 5.95771144278607,
"grad_norm": 0.5426341756011361,
"learning_rate": 2.6547301708454877e-06,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19446370005607605,
"step": 2395,
"valid_targets_mean": 4282.0,
"valid_targets_min": 1255
},
{
"epoch": 5.970149253731344,
"grad_norm": 0.6008319137622877,
"learning_rate": 2.5932934142145906e-06,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17186178267002106,
"step": 2400,
"valid_targets_mean": 4482.7,
"valid_targets_min": 1574
},
{
"epoch": 5.982587064676617,
"grad_norm": 0.5514765334050616,
"learning_rate": 2.5325265847159798e-06,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.167934849858284,
"step": 2405,
"valid_targets_mean": 3971.0,
"valid_targets_min": 1741
},
{
"epoch": 5.9950248756218905,
"grad_norm": 0.5743859815483373,
"learning_rate": 2.472432021065918e-06,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17497491836547852,
"step": 2410,
"valid_targets_mean": 4070.7,
"valid_targets_min": 1109
},
{
"epoch": 6.007462686567164,
"grad_norm": 0.5125255425588743,
"learning_rate": 2.4130120361073716e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1637192666530609,
"step": 2415,
"valid_targets_mean": 4396.6,
"valid_targets_min": 1850
},
{
"epoch": 6.019900497512438,
"grad_norm": 0.5724876553676014,
"learning_rate": 2.3542689167209563e-06,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17785580456256866,
"step": 2420,
"valid_targets_mean": 3476.4,
"valid_targets_min": 1979
},
{
"epoch": 6.032338308457711,
"grad_norm": 0.5879062795130893,
"learning_rate": 2.2962049237369643e-06,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16875743865966797,
"step": 2425,
"valid_targets_mean": 3416.4,
"valid_targets_min": 1696
},
{
"epoch": 6.044776119402985,
"grad_norm": 0.5588828300455307,
"learning_rate": 2.238822291848344e-06,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17179271578788757,
"step": 2430,
"valid_targets_mean": 3605.9,
"valid_targets_min": 1418
},
{
"epoch": 6.057213930348259,
"grad_norm": 0.5295142510715316,
"learning_rate": 2.182123229524673e-06,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1968148648738861,
"step": 2435,
"valid_targets_mean": 4323.1,
"valid_targets_min": 2235
},
{
"epoch": 6.069651741293533,
"grad_norm": 0.6168460567108859,
"learning_rate": 2.1261099189271792e-06,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1779354065656662,
"step": 2440,
"valid_targets_mean": 3457.3,
"valid_targets_min": 1629
},
{
"epoch": 6.082089552238806,
"grad_norm": 0.5621656463077643,
"learning_rate": 2.070784515824753e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.159359872341156,
"step": 2445,
"valid_targets_mean": 4689.1,
"valid_targets_min": 2366
},
{
"epoch": 6.0945273631840795,
"grad_norm": 0.5487542240351966,
"learning_rate": 2.016149149510975e-06,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16500002145767212,
"step": 2450,
"valid_targets_mean": 4167.4,
"valid_targets_min": 2067
},
{
"epoch": 6.106965174129353,
"grad_norm": 0.5686330625834844,
"learning_rate": 1.9622059227221825e-06,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17375610768795013,
"step": 2455,
"valid_targets_mean": 3917.0,
"valid_targets_min": 1876
},
{
"epoch": 6.119402985074627,
"grad_norm": 0.5233617770605969,
"learning_rate": 1.9089569115565052e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16628089547157288,
"step": 2460,
"valid_targets_mean": 4445.4,
"valid_targets_min": 2398
},
{
"epoch": 6.1318407960199,
"grad_norm": 0.5914278966941198,
"learning_rate": 1.8564041653940123e-06,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16870436072349548,
"step": 2465,
"valid_targets_mean": 4021.4,
"valid_targets_min": 2352
},
{
"epoch": 6.144278606965174,
"grad_norm": 0.5693055333467447,
"learning_rate": 1.8045497068177975e-06,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1836708039045334,
"step": 2470,
"valid_targets_mean": 3719.6,
"valid_targets_min": 1833
},
{
"epoch": 6.156716417910448,
"grad_norm": 0.652372737993125,
"learning_rate": 1.7533955315361551e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1608482003211975,
"step": 2475,
"valid_targets_mean": 3182.6,
"valid_targets_min": 2079
},
{
"epoch": 6.169154228855722,
"grad_norm": 0.533482071857129,
"learning_rate": 1.7029436083057715e-06,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16928087174892426,
"step": 2480,
"valid_targets_mean": 4331.8,
"valid_targets_min": 1303
},
{
"epoch": 6.181592039800995,
"grad_norm": 0.5464490007192712,
"learning_rate": 1.6531958788559465e-06,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16682176291942596,
"step": 2485,
"valid_targets_mean": 3949.8,
"valid_targets_min": 1289
},
{
"epoch": 6.1940298507462686,
"grad_norm": 0.5623683876558216,
"learning_rate": 1.6041542578138746e-06,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18091854453086853,
"step": 2490,
"valid_targets_mean": 4234.9,
"valid_targets_min": 1575
},
{
"epoch": 6.206467661691542,
"grad_norm": 0.5238269588411919,
"learning_rate": 1.5558206326309511e-06,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16900426149368286,
"step": 2495,
"valid_targets_mean": 4697.7,
"valid_targets_min": 1876
},
{
"epoch": 6.218905472636816,
"grad_norm": 0.5716740018491285,
"learning_rate": 1.5081968635101097e-06,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18251916766166687,
"step": 2500,
"valid_targets_mean": 3668.0,
"valid_targets_min": 1509
},
{
"epoch": 6.231343283582089,
"grad_norm": 0.5363180031909048,
"learning_rate": 1.4612847833342759e-06,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1818065345287323,
"step": 2505,
"valid_targets_mean": 4083.4,
"valid_targets_min": 1806
},
{
"epoch": 6.243781094527363,
"grad_norm": 0.6429529839019501,
"learning_rate": 1.4150861975957786e-06,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18589231371879578,
"step": 2510,
"valid_targets_mean": 3552.3,
"valid_targets_min": 1876
},
{
"epoch": 6.256218905472637,
"grad_norm": 0.4975492608341589,
"learning_rate": 1.3696028843268993e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15583984553813934,
"step": 2515,
"valid_targets_mean": 4623.1,
"valid_targets_min": 1947
},
{
"epoch": 6.268656716417911,
"grad_norm": 0.5345304367276562,
"learning_rate": 1.3248365940314067e-06,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1705108880996704,
"step": 2520,
"valid_targets_mean": 4393.9,
"valid_targets_min": 1990
},
{
"epoch": 6.281094527363184,
"grad_norm": 0.5373113443994114,
"learning_rate": 1.2807890496172103e-06,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1581442952156067,
"step": 2525,
"valid_targets_mean": 4299.2,
"valid_targets_min": 1423
},
{
"epoch": 6.293532338308458,
"grad_norm": 0.514081511794592,
"learning_rate": 1.237461946330054e-06,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15877807140350342,
"step": 2530,
"valid_targets_mean": 4525.9,
"valid_targets_min": 2502
},
{
"epoch": 6.3059701492537314,
"grad_norm": 0.560992308158361,
"learning_rate": 1.1948569516882503e-06,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16327780485153198,
"step": 2535,
"valid_targets_mean": 4197.6,
"valid_targets_min": 2315
},
{
"epoch": 6.318407960199005,
"grad_norm": 0.5265783790926104,
"learning_rate": 1.1529757054185176e-06,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17675918340682983,
"step": 2540,
"valid_targets_mean": 4462.6,
"valid_targets_min": 1880
},
{
"epoch": 6.330845771144278,
"grad_norm": 0.5416867779723658,
"learning_rate": 1.111819819392872e-06,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17835187911987305,
"step": 2545,
"valid_targets_mean": 4455.2,
"valid_targets_min": 1971
},
{
"epoch": 6.343283582089552,
"grad_norm": 0.5881401941231864,
"learning_rate": 1.0713908775665827e-06,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16701434552669525,
"step": 2550,
"valid_targets_mean": 3613.5,
"valid_targets_min": 1130
},
{
"epoch": 6.355721393034826,
"grad_norm": 0.5504035044096116,
"learning_rate": 1.0316904359172297e-06,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16181015968322754,
"step": 2555,
"valid_targets_mean": 3846.8,
"valid_targets_min": 1976
},
{
"epoch": 6.3681592039801,
"grad_norm": 0.566462536612002,
"learning_rate": 9.92720022384792e-07,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1657314896583557,
"step": 2560,
"valid_targets_mean": 4052.9,
"valid_targets_min": 2216
},
{
"epoch": 6.380597014925373,
"grad_norm": 0.5700973608301066,
"learning_rate": 9.544811368128703e-07,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17204223573207855,
"step": 2565,
"valid_targets_mean": 4212.5,
"valid_targets_min": 1450
},
{
"epoch": 6.393034825870647,
"grad_norm": 0.5934427501781491,
"learning_rate": 9.169752508909413e-07,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17751480638980865,
"step": 2570,
"valid_targets_mean": 3961.2,
"valid_targets_min": 2303
},
{
"epoch": 6.4054726368159205,
"grad_norm": 0.5691373349683894,
"learning_rate": 8.802038080977305e-07,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17300844192504883,
"step": 2575,
"valid_targets_mean": 3961.4,
"valid_targets_min": 2205
},
{
"epoch": 6.417910447761194,
"grad_norm": 0.6340863357974218,
"learning_rate": 8.441682236456472e-07,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17821021378040314,
"step": 2580,
"valid_targets_mean": 3086.1,
"valid_targets_min": 963
},
{
"epoch": 6.430348258706467,
"grad_norm": 0.579617792634382,
"learning_rate": 8.088698844263243e-07,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16770654916763306,
"step": 2585,
"valid_targets_mean": 3542.5,
"valid_targets_min": 2121
},
{
"epoch": 6.442786069651741,
"grad_norm": 0.5395856283137651,
"learning_rate": 7.743101489572491e-07,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19851364195346832,
"step": 2590,
"valid_targets_mean": 4706.3,
"valid_targets_min": 1763
},
{
"epoch": 6.455223880597015,
"grad_norm": 0.5238594468934492,
"learning_rate": 7.404903473294612e-07,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15577292442321777,
"step": 2595,
"valid_targets_mean": 4178.8,
"valid_targets_min": 1773
},
{
"epoch": 6.467661691542289,
"grad_norm": 0.632754230583396,
"learning_rate": 7.074117811563619e-07,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17483484745025635,
"step": 2600,
"valid_targets_mean": 3031.8,
"valid_targets_min": 344
},
{
"epoch": 6.480099502487562,
"grad_norm": 0.5671291151476788,
"learning_rate": 6.750757235236461e-07,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17332680523395538,
"step": 2605,
"valid_targets_mean": 3747.0,
"valid_targets_min": 1149
},
{
"epoch": 6.492537313432836,
"grad_norm": 0.6093460900077653,
"learning_rate": 6.434834189402716e-07,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18352875113487244,
"step": 2610,
"valid_targets_mean": 3692.0,
"valid_targets_min": 1907
},
{
"epoch": 6.5049751243781095,
"grad_norm": 0.574114276787967,
"learning_rate": 6.126360832905831e-07,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18569818139076233,
"step": 2615,
"valid_targets_mean": 3639.9,
"valid_targets_min": 1544
},
{
"epoch": 6.517412935323383,
"grad_norm": 0.5146553892569846,
"learning_rate": 5.825349037875106e-07,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16424797475337982,
"step": 2620,
"valid_targets_mean": 4595.1,
"valid_targets_min": 1975
},
{
"epoch": 6.529850746268656,
"grad_norm": 0.5252261416414551,
"learning_rate": 5.531810389268732e-07,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15995575487613678,
"step": 2625,
"valid_targets_mean": 4328.8,
"valid_targets_min": 1661
},
{
"epoch": 6.54228855721393,
"grad_norm": 0.5685319838301356,
"learning_rate": 5.245756184428041e-07,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18082097172737122,
"step": 2630,
"valid_targets_mean": 4233.4,
"valid_targets_min": 1916
},
{
"epoch": 6.554726368159204,
"grad_norm": 0.5341982017596594,
"learning_rate": 4.967197432642579e-07,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17173001170158386,
"step": 2635,
"valid_targets_mean": 4326.6,
"valid_targets_min": 2650
},
{
"epoch": 6.567164179104478,
"grad_norm": 0.6401995160355601,
"learning_rate": 4.69614485472647e-07,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17902860045433044,
"step": 2640,
"valid_targets_mean": 3158.5,
"valid_targets_min": 191
},
{
"epoch": 6.579601990049751,
"grad_norm": 0.5667151478749745,
"learning_rate": 4.432608882605771e-07,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17057490348815918,
"step": 2645,
"valid_targets_mean": 3628.1,
"valid_targets_min": 2236
},
{
"epoch": 6.592039800995025,
"grad_norm": 0.5485021773091285,
"learning_rate": 4.1765996589170353e-07,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.179216206073761,
"step": 2650,
"valid_targets_mean": 4233.1,
"valid_targets_min": 1682
},
{
"epoch": 6.604477611940299,
"grad_norm": 0.519072304817314,
"learning_rate": 3.928127036616869e-07,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18321016430854797,
"step": 2655,
"valid_targets_mean": 4888.4,
"valid_targets_min": 1732
},
{
"epoch": 6.616915422885572,
"grad_norm": 0.5786793950538549,
"learning_rate": 3.687200578602812e-07,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17171373963356018,
"step": 2660,
"valid_targets_mean": 4240.3,
"valid_targets_min": 1550
},
{
"epoch": 6.629353233830845,
"grad_norm": 0.5589571697627682,
"learning_rate": 3.453829557345212e-07,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1652020364999771,
"step": 2665,
"valid_targets_mean": 3949.5,
"valid_targets_min": 222
},
{
"epoch": 6.641791044776119,
"grad_norm": 0.5511197102525519,
"learning_rate": 3.228022954530463e-07,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1774759292602539,
"step": 2670,
"valid_targets_mean": 4197.3,
"valid_targets_min": 428
},
{
"epoch": 6.654228855721393,
"grad_norm": 0.5864879776585974,
"learning_rate": 3.009789460715218e-07,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16247567534446716,
"step": 2675,
"valid_targets_mean": 3430.1,
"valid_targets_min": 926
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.5572934258361881,
"learning_rate": 2.799137474991942e-07,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18331031501293182,
"step": 2680,
"valid_targets_mean": 3912.9,
"valid_targets_min": 1883
},
{
"epoch": 6.67910447761194,
"grad_norm": 0.5559560602699174,
"learning_rate": 2.5960751046657296e-07,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17147520184516907,
"step": 2685,
"valid_targets_mean": 4053.0,
"valid_targets_min": 1895
},
{
"epoch": 6.691542288557214,
"grad_norm": 0.5575426373568327,
"learning_rate": 2.400610164942241e-07,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16202571988105774,
"step": 2690,
"valid_targets_mean": 4100.9,
"valid_targets_min": 2530
},
{
"epoch": 6.703980099502488,
"grad_norm": 0.5562136135591627,
"learning_rate": 2.2127501786268546e-07,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15551359951496124,
"step": 2695,
"valid_targets_mean": 4108.9,
"valid_targets_min": 2029
},
{
"epoch": 6.7164179104477615,
"grad_norm": 0.5198839932899565,
"learning_rate": 2.0325023758352545e-07,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17046837508678436,
"step": 2700,
"valid_targets_mean": 4698.8,
"valid_targets_min": 443
},
{
"epoch": 6.7288557213930345,
"grad_norm": 0.5938343168062021,
"learning_rate": 1.859873693715075e-07,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1763916015625,
"step": 2705,
"valid_targets_mean": 4298.5,
"valid_targets_min": 1533
},
{
"epoch": 6.741293532338308,
"grad_norm": 0.5495808847371538,
"learning_rate": 1.6948707761789807e-07,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17928853631019592,
"step": 2710,
"valid_targets_mean": 4255.4,
"valid_targets_min": 1937
},
{
"epoch": 6.753731343283582,
"grad_norm": 0.6045663915002609,
"learning_rate": 1.5374999736488927e-07,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1754097044467926,
"step": 2715,
"valid_targets_mean": 3834.8,
"valid_targets_min": 1388
},
{
"epoch": 6.766169154228856,
"grad_norm": 0.5553708025379133,
"learning_rate": 1.3877673428116302e-07,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19348856806755066,
"step": 2720,
"valid_targets_mean": 4249.7,
"valid_targets_min": 3032
},
{
"epoch": 6.778606965174129,
"grad_norm": 0.629594904612257,
"learning_rate": 1.245678646385784e-07,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17597973346710205,
"step": 2725,
"valid_targets_mean": 3250.0,
"valid_targets_min": 941
},
{
"epoch": 6.791044776119403,
"grad_norm": 0.5963075561787823,
"learning_rate": 1.1112393529000288e-07,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1901685893535614,
"step": 2730,
"valid_targets_mean": 3795.7,
"valid_targets_min": 2540
},
{
"epoch": 6.803482587064677,
"grad_norm": 0.5609315377417177,
"learning_rate": 9.844546364824459e-08,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17084071040153503,
"step": 2735,
"valid_targets_mean": 3876.4,
"valid_targets_min": 1109
},
{
"epoch": 6.8159203980099505,
"grad_norm": 0.5043275099355118,
"learning_rate": 8.653293766615945e-08,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16672548651695251,
"step": 2740,
"valid_targets_mean": 4784.5,
"valid_targets_min": 1905
},
{
"epoch": 6.8283582089552235,
"grad_norm": 0.6108276462294715,
"learning_rate": 7.538681581785945e-08,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18459632992744446,
"step": 2745,
"valid_targets_mean": 3379.5,
"valid_targets_min": 852
},
{
"epoch": 6.840796019900497,
"grad_norm": 0.5499395587166259,
"learning_rate": 6.50075270810735e-08,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16682520508766174,
"step": 2750,
"valid_targets_mean": 4087.9,
"valid_targets_min": 1786
},
{
"epoch": 6.853233830845771,
"grad_norm": 0.5762377369105647,
"learning_rate": 5.539547092063391e-08,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16152673959732056,
"step": 2755,
"valid_targets_mean": 3740.1,
"valid_targets_min": 862
},
{
"epoch": 6.865671641791045,
"grad_norm": 0.6162665248042457,
"learning_rate": 4.655101727310651e-08,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17481867969036102,
"step": 2760,
"valid_targets_mean": 3653.2,
"valid_targets_min": 2037
},
{
"epoch": 6.878109452736318,
"grad_norm": 0.5537138349691514,
"learning_rate": 3.847450653254425e-08,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19818416237831116,
"step": 2765,
"valid_targets_mean": 4187.0,
"valid_targets_min": 2037
},
{
"epoch": 6.890547263681592,
"grad_norm": 0.5538646057123637,
"learning_rate": 3.1166249537402104e-08,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1677202731370926,
"step": 2770,
"valid_targets_mean": 4246.5,
"valid_targets_min": 1887
},
{
"epoch": 6.902985074626866,
"grad_norm": 0.5458989012174927,
"learning_rate": 2.4626527558551106e-08,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16506440937519073,
"step": 2775,
"valid_targets_mean": 4147.2,
"valid_targets_min": 1054
},
{
"epoch": 6.91542288557214,
"grad_norm": 0.5428319526484747,
"learning_rate": 1.885559228847811e-08,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16628624498844147,
"step": 2780,
"valid_targets_mean": 4325.8,
"valid_targets_min": 2837
},
{
"epoch": 6.927860696517413,
"grad_norm": 0.5215809087161279,
"learning_rate": 1.385366583158243e-08,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19465038180351257,
"step": 2785,
"valid_targets_mean": 4546.7,
"valid_targets_min": 2100
},
{
"epoch": 6.940298507462686,
"grad_norm": 0.5104612235616637,
"learning_rate": 9.620940695633797e-09,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1838764250278473,
"step": 2790,
"valid_targets_mean": 4532.4,
"valid_targets_min": 2044
},
{
"epoch": 6.95273631840796,
"grad_norm": 0.5508437850202684,
"learning_rate": 6.15757978435827e-09,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17743362486362457,
"step": 2795,
"valid_targets_mean": 4273.7,
"valid_targets_min": 2596
},
{
"epoch": 6.965174129353234,
"grad_norm": 0.5364623622959384,
"learning_rate": 3.463716391176597e-09,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2021486759185791,
"step": 2800,
"valid_targets_mean": 4783.9,
"valid_targets_min": 1910
},
{
"epoch": 6.977611940298507,
"grad_norm": 0.5071144651033146,
"learning_rate": 1.5394541940705332e-09,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16921557486057281,
"step": 2805,
"valid_targets_mean": 4896.3,
"valid_targets_min": 1519
},
{
"epoch": 6.990049751243781,
"grad_norm": 0.5760603012343628,
"learning_rate": 3.848672515882612e-10,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16937696933746338,
"step": 2810,
"valid_targets_mean": 3735.2,
"valid_targets_min": 2097
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17162613570690155,
"step": 2814,
"total_flos": 1157609273950208.0,
"train_loss": 0.22598929736066897,
"train_runtime": 20554.2284,
"train_samples_per_second": 2.189,
"train_steps_per_second": 0.137,
"valid_targets_mean": 3578.4,
"valid_targets_min": 1983
}
],
"logging_steps": 5,
"max_steps": 2814,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1157609273950208.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}