stack-nl2bashseq / trainer_state.json
hf-reset
Reset repository without checkpoints directories
c70cd67
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 6664,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.005252100840336135,
"grad_norm": 11.793528240093083,
"learning_rate": 2.39880059970015e-07,
"loss": 0.7356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.750144362449646,
"step": 5,
"valid_targets_mean": 3398.8,
"valid_targets_min": 746
},
{
"epoch": 0.01050420168067227,
"grad_norm": 9.544117410382237,
"learning_rate": 5.397301349325338e-07,
"loss": 0.6877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5979838371276855,
"step": 10,
"valid_targets_mean": 4347.4,
"valid_targets_min": 1651
},
{
"epoch": 0.015756302521008403,
"grad_norm": 8.563267976325044,
"learning_rate": 8.395802098950526e-07,
"loss": 0.6892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.607923150062561,
"step": 15,
"valid_targets_mean": 4633.2,
"valid_targets_min": 1560
},
{
"epoch": 0.02100840336134454,
"grad_norm": 8.188017827775615,
"learning_rate": 1.1394302848575713e-06,
"loss": 0.6695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6504963040351868,
"step": 20,
"valid_targets_mean": 3938.1,
"valid_targets_min": 1841
},
{
"epoch": 0.026260504201680673,
"grad_norm": 6.523486790143655,
"learning_rate": 1.43928035982009e-06,
"loss": 0.6875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7029379606246948,
"step": 25,
"valid_targets_mean": 3724.8,
"valid_targets_min": 1374
},
{
"epoch": 0.031512605042016806,
"grad_norm": 5.51646121673247,
"learning_rate": 1.7391304347826088e-06,
"loss": 0.6512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6437787413597107,
"step": 30,
"valid_targets_mean": 3264.8,
"valid_targets_min": 1089
},
{
"epoch": 0.03676470588235294,
"grad_norm": 4.319516286938232,
"learning_rate": 2.0389805097451275e-06,
"loss": 0.5769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6190094947814941,
"step": 35,
"valid_targets_mean": 3374.9,
"valid_targets_min": 627
},
{
"epoch": 0.04201680672268908,
"grad_norm": 3.7446317656639048,
"learning_rate": 2.3388305847076464e-06,
"loss": 0.5953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6246620416641235,
"step": 40,
"valid_targets_mean": 3514.9,
"valid_targets_min": 1574
},
{
"epoch": 0.04726890756302521,
"grad_norm": 2.652464883959148,
"learning_rate": 2.6386806596701653e-06,
"loss": 0.5982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6014484167098999,
"step": 45,
"valid_targets_mean": 3956.7,
"valid_targets_min": 1899
},
{
"epoch": 0.052521008403361345,
"grad_norm": 1.9872458383108076,
"learning_rate": 2.9385307346326843e-06,
"loss": 0.5479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5268915891647339,
"step": 50,
"valid_targets_mean": 4397.6,
"valid_targets_min": 2261
},
{
"epoch": 0.05777310924369748,
"grad_norm": 1.6856790315793377,
"learning_rate": 3.2383808095952024e-06,
"loss": 0.5517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.535837709903717,
"step": 55,
"valid_targets_mean": 3263.8,
"valid_targets_min": 1873
},
{
"epoch": 0.06302521008403361,
"grad_norm": 1.2418730665732476,
"learning_rate": 3.5382308845577213e-06,
"loss": 0.5094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5285685658454895,
"step": 60,
"valid_targets_mean": 3430.2,
"valid_targets_min": 1013
},
{
"epoch": 0.06827731092436974,
"grad_norm": 0.8868118364710539,
"learning_rate": 3.83808095952024e-06,
"loss": 0.4861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4722723364830017,
"step": 65,
"valid_targets_mean": 4041.6,
"valid_targets_min": 1366
},
{
"epoch": 0.07352941176470588,
"grad_norm": 0.9428896232462224,
"learning_rate": 4.137931034482759e-06,
"loss": 0.5037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.53287672996521,
"step": 70,
"valid_targets_mean": 3515.2,
"valid_targets_min": 2050
},
{
"epoch": 0.07878151260504201,
"grad_norm": 0.9383925766489141,
"learning_rate": 4.437781109445278e-06,
"loss": 0.5135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.524086058139801,
"step": 75,
"valid_targets_mean": 3048.9,
"valid_targets_min": 746
},
{
"epoch": 0.08403361344537816,
"grad_norm": 0.9340541727723428,
"learning_rate": 4.737631184407796e-06,
"loss": 0.489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5150220990180969,
"step": 80,
"valid_targets_mean": 2982.6,
"valid_targets_min": 855
},
{
"epoch": 0.08928571428571429,
"grad_norm": 0.7737514488505065,
"learning_rate": 5.037481259370315e-06,
"loss": 0.4923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.498151570558548,
"step": 85,
"valid_targets_mean": 3753.4,
"valid_targets_min": 2125
},
{
"epoch": 0.09453781512605042,
"grad_norm": 0.8574731436330563,
"learning_rate": 5.337331334332834e-06,
"loss": 0.5013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4901542663574219,
"step": 90,
"valid_targets_mean": 2946.8,
"valid_targets_min": 1173
},
{
"epoch": 0.09978991596638656,
"grad_norm": 0.8207916191722505,
"learning_rate": 5.6371814092953526e-06,
"loss": 0.4644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45455610752105713,
"step": 95,
"valid_targets_mean": 3284.2,
"valid_targets_min": 1438
},
{
"epoch": 0.10504201680672269,
"grad_norm": 0.6890899996201467,
"learning_rate": 5.937031484257871e-06,
"loss": 0.4503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3856987953186035,
"step": 100,
"valid_targets_mean": 3818.4,
"valid_targets_min": 1133
},
{
"epoch": 0.11029411764705882,
"grad_norm": 0.7375624963619357,
"learning_rate": 6.2368815592203904e-06,
"loss": 0.4597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42143797874450684,
"step": 105,
"valid_targets_mean": 3339.8,
"valid_targets_min": 1051
},
{
"epoch": 0.11554621848739496,
"grad_norm": 0.7422023625324775,
"learning_rate": 6.536731634182909e-06,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47655802965164185,
"step": 110,
"valid_targets_mean": 3285.1,
"valid_targets_min": 1642
},
{
"epoch": 0.1207983193277311,
"grad_norm": 0.6767508461063624,
"learning_rate": 6.8365817091454274e-06,
"loss": 0.4463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42775917053222656,
"step": 115,
"valid_targets_mean": 3340.8,
"valid_targets_min": 1747
},
{
"epoch": 0.12605042016806722,
"grad_norm": 0.7262880447276591,
"learning_rate": 7.136431784107947e-06,
"loss": 0.4491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4421280324459076,
"step": 120,
"valid_targets_mean": 3218.2,
"valid_targets_min": 1765
},
{
"epoch": 0.13130252100840337,
"grad_norm": 0.7791375198049785,
"learning_rate": 7.436281859070465e-06,
"loss": 0.4446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4363992214202881,
"step": 125,
"valid_targets_mean": 3182.9,
"valid_targets_min": 1233
},
{
"epoch": 0.13655462184873948,
"grad_norm": 0.7376851052403786,
"learning_rate": 7.736131934032984e-06,
"loss": 0.4195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4291246831417084,
"step": 130,
"valid_targets_mean": 3020.8,
"valid_targets_min": 869
},
{
"epoch": 0.14180672268907563,
"grad_norm": 0.7251699149877672,
"learning_rate": 8.035982008995503e-06,
"loss": 0.4383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4199424982070923,
"step": 135,
"valid_targets_mean": 3269.2,
"valid_targets_min": 926
},
{
"epoch": 0.14705882352941177,
"grad_norm": 0.7174356234657762,
"learning_rate": 8.335832083958023e-06,
"loss": 0.4209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3915764093399048,
"step": 140,
"valid_targets_mean": 3256.4,
"valid_targets_min": 1016
},
{
"epoch": 0.15231092436974789,
"grad_norm": 0.7429933172485804,
"learning_rate": 8.63568215892054e-06,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4099087417125702,
"step": 145,
"valid_targets_mean": 3058.4,
"valid_targets_min": 1367
},
{
"epoch": 0.15756302521008403,
"grad_norm": 0.6609884978656597,
"learning_rate": 8.93553223388306e-06,
"loss": 0.4275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38431763648986816,
"step": 150,
"valid_targets_mean": 3513.8,
"valid_targets_min": 761
},
{
"epoch": 0.16281512605042017,
"grad_norm": 0.7414117819519422,
"learning_rate": 9.235382308845579e-06,
"loss": 0.4149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41205519437789917,
"step": 155,
"valid_targets_mean": 2834.2,
"valid_targets_min": 1480
},
{
"epoch": 0.16806722689075632,
"grad_norm": 0.766190877937914,
"learning_rate": 9.535232383808097e-06,
"loss": 0.4221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40908199548721313,
"step": 160,
"valid_targets_mean": 2854.1,
"valid_targets_min": 1229
},
{
"epoch": 0.17331932773109243,
"grad_norm": 0.7322988121738653,
"learning_rate": 9.835082458770614e-06,
"loss": 0.4219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.409344881772995,
"step": 165,
"valid_targets_mean": 3215.8,
"valid_targets_min": 1727
},
{
"epoch": 0.17857142857142858,
"grad_norm": 0.7036664531547118,
"learning_rate": 1.0134932533733135e-05,
"loss": 0.4117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3934198021888733,
"step": 170,
"valid_targets_mean": 3578.9,
"valid_targets_min": 1860
},
{
"epoch": 0.18382352941176472,
"grad_norm": 0.7504645575443613,
"learning_rate": 1.0434782608695653e-05,
"loss": 0.4176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41233259439468384,
"step": 175,
"valid_targets_mean": 3121.1,
"valid_targets_min": 1145
},
{
"epoch": 0.18907563025210083,
"grad_norm": 0.8540338092213114,
"learning_rate": 1.0734632683658172e-05,
"loss": 0.4206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4257834851741791,
"step": 180,
"valid_targets_mean": 2910.1,
"valid_targets_min": 1195
},
{
"epoch": 0.19432773109243698,
"grad_norm": 0.672825231347177,
"learning_rate": 1.103448275862069e-05,
"loss": 0.4046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37902510166168213,
"step": 185,
"valid_targets_mean": 3215.2,
"valid_targets_min": 1087
},
{
"epoch": 0.19957983193277312,
"grad_norm": 0.7299680458741075,
"learning_rate": 1.1334332833583211e-05,
"loss": 0.4173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3878703713417053,
"step": 190,
"valid_targets_mean": 3842.3,
"valid_targets_min": 730
},
{
"epoch": 0.20483193277310924,
"grad_norm": 0.7452069066845327,
"learning_rate": 1.1634182908545729e-05,
"loss": 0.4012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40164220333099365,
"step": 195,
"valid_targets_mean": 3112.6,
"valid_targets_min": 1097
},
{
"epoch": 0.21008403361344538,
"grad_norm": 0.6701617672469308,
"learning_rate": 1.1934032983508246e-05,
"loss": 0.3889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4067269563674927,
"step": 200,
"valid_targets_mean": 3587.6,
"valid_targets_min": 1833
},
{
"epoch": 0.21533613445378152,
"grad_norm": 0.6999892185242177,
"learning_rate": 1.2233883058470766e-05,
"loss": 0.4046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42524561285972595,
"step": 205,
"valid_targets_mean": 3660.6,
"valid_targets_min": 1182
},
{
"epoch": 0.22058823529411764,
"grad_norm": 0.6936596594842792,
"learning_rate": 1.2533733133433283e-05,
"loss": 0.3979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4341742992401123,
"step": 210,
"valid_targets_mean": 3839.4,
"valid_targets_min": 1586
},
{
"epoch": 0.22584033613445378,
"grad_norm": 0.7203275927233951,
"learning_rate": 1.2833583208395803e-05,
"loss": 0.4122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4256739020347595,
"step": 215,
"valid_targets_mean": 3062.7,
"valid_targets_min": 1714
},
{
"epoch": 0.23109243697478993,
"grad_norm": 0.8564716523005904,
"learning_rate": 1.313343328335832e-05,
"loss": 0.4007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4049715995788574,
"step": 220,
"valid_targets_mean": 3611.1,
"valid_targets_min": 1504
},
{
"epoch": 0.23634453781512604,
"grad_norm": 0.6563920907148093,
"learning_rate": 1.3433283358320841e-05,
"loss": 0.3885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3269047141075134,
"step": 225,
"valid_targets_mean": 3457.1,
"valid_targets_min": 1170
},
{
"epoch": 0.2415966386554622,
"grad_norm": 0.7196899057898143,
"learning_rate": 1.3733133433283359e-05,
"loss": 0.3893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38853204250335693,
"step": 230,
"valid_targets_mean": 3089.3,
"valid_targets_min": 1436
},
{
"epoch": 0.24684873949579833,
"grad_norm": 0.7287732338618192,
"learning_rate": 1.4032983508245878e-05,
"loss": 0.3919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38699156045913696,
"step": 235,
"valid_targets_mean": 3257.2,
"valid_targets_min": 1302
},
{
"epoch": 0.25210084033613445,
"grad_norm": 0.7214311214899903,
"learning_rate": 1.4332833583208396e-05,
"loss": 0.3841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41121745109558105,
"step": 240,
"valid_targets_mean": 3425.1,
"valid_targets_min": 2023
},
{
"epoch": 0.25735294117647056,
"grad_norm": 0.648625366284687,
"learning_rate": 1.4632683658170917e-05,
"loss": 0.361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3404223918914795,
"step": 245,
"valid_targets_mean": 3196.4,
"valid_targets_min": 809
},
{
"epoch": 0.26260504201680673,
"grad_norm": 0.7442737796844059,
"learning_rate": 1.4932533733133435e-05,
"loss": 0.3958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37922531366348267,
"step": 250,
"valid_targets_mean": 3197.8,
"valid_targets_min": 1059
},
{
"epoch": 0.26785714285714285,
"grad_norm": 0.7290285381798371,
"learning_rate": 1.5232383808095954e-05,
"loss": 0.3759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33683687448501587,
"step": 255,
"valid_targets_mean": 3301.7,
"valid_targets_min": 964
},
{
"epoch": 0.27310924369747897,
"grad_norm": 0.7658760733120059,
"learning_rate": 1.5532233883058472e-05,
"loss": 0.3864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3716367483139038,
"step": 260,
"valid_targets_mean": 3694.2,
"valid_targets_min": 1105
},
{
"epoch": 0.27836134453781514,
"grad_norm": 0.8430133851017164,
"learning_rate": 1.5832083958020993e-05,
"loss": 0.3997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4212614893913269,
"step": 265,
"valid_targets_mean": 2612.6,
"valid_targets_min": 1491
},
{
"epoch": 0.28361344537815125,
"grad_norm": 0.7343320220234513,
"learning_rate": 1.613193403298351e-05,
"loss": 0.4027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3935287594795227,
"step": 270,
"valid_targets_mean": 3110.5,
"valid_targets_min": 1091
},
{
"epoch": 0.28886554621848737,
"grad_norm": 0.7657356714112876,
"learning_rate": 1.6431784107946028e-05,
"loss": 0.3703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36865124106407166,
"step": 275,
"valid_targets_mean": 3259.2,
"valid_targets_min": 1822
},
{
"epoch": 0.29411764705882354,
"grad_norm": 0.6955693394366955,
"learning_rate": 1.6731634182908546e-05,
"loss": 0.3727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36471718549728394,
"step": 280,
"valid_targets_mean": 3547.6,
"valid_targets_min": 1625
},
{
"epoch": 0.29936974789915966,
"grad_norm": 0.7042195932323547,
"learning_rate": 1.7031484257871064e-05,
"loss": 0.3672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3420675992965698,
"step": 285,
"valid_targets_mean": 3628.2,
"valid_targets_min": 1415
},
{
"epoch": 0.30462184873949577,
"grad_norm": 0.8809660140825649,
"learning_rate": 1.7331334332833585e-05,
"loss": 0.3791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35459285974502563,
"step": 290,
"valid_targets_mean": 3398.9,
"valid_targets_min": 1460
},
{
"epoch": 0.30987394957983194,
"grad_norm": 0.7752770337054249,
"learning_rate": 1.7631184407796102e-05,
"loss": 0.3838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3816995620727539,
"step": 295,
"valid_targets_mean": 2947.4,
"valid_targets_min": 1079
},
{
"epoch": 0.31512605042016806,
"grad_norm": 0.7665849286642425,
"learning_rate": 1.7931034482758623e-05,
"loss": 0.3576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36882513761520386,
"step": 300,
"valid_targets_mean": 3003.0,
"valid_targets_min": 1274
},
{
"epoch": 0.32037815126050423,
"grad_norm": 0.7763875661157622,
"learning_rate": 1.823088455772114e-05,
"loss": 0.3735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3900800943374634,
"step": 305,
"valid_targets_mean": 3306.3,
"valid_targets_min": 914
},
{
"epoch": 0.32563025210084034,
"grad_norm": 0.7724334584719763,
"learning_rate": 1.853073463268366e-05,
"loss": 0.3894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36286020278930664,
"step": 310,
"valid_targets_mean": 3332.2,
"valid_targets_min": 1312
},
{
"epoch": 0.33088235294117646,
"grad_norm": 0.8144297942259716,
"learning_rate": 1.8830584707646176e-05,
"loss": 0.377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.395212858915329,
"step": 315,
"valid_targets_mean": 2601.3,
"valid_targets_min": 987
},
{
"epoch": 0.33613445378151263,
"grad_norm": 0.6210630540146885,
"learning_rate": 1.9130434782608697e-05,
"loss": 0.3653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34900736808776855,
"step": 320,
"valid_targets_mean": 4341.5,
"valid_targets_min": 1856
},
{
"epoch": 0.34138655462184875,
"grad_norm": 0.7382149230509586,
"learning_rate": 1.9430284857571215e-05,
"loss": 0.3724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37840932607650757,
"step": 325,
"valid_targets_mean": 3290.9,
"valid_targets_min": 1601
},
{
"epoch": 0.34663865546218486,
"grad_norm": 0.7441687764233078,
"learning_rate": 1.9730134932533736e-05,
"loss": 0.3807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3847064971923828,
"step": 330,
"valid_targets_mean": 3119.4,
"valid_targets_min": 1986
},
{
"epoch": 0.35189075630252103,
"grad_norm": 0.6427174614521525,
"learning_rate": 2.0029985007496254e-05,
"loss": 0.3556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38938313722610474,
"step": 335,
"valid_targets_mean": 3777.1,
"valid_targets_min": 974
},
{
"epoch": 0.35714285714285715,
"grad_norm": 0.6767174257258602,
"learning_rate": 2.0329835082458775e-05,
"loss": 0.3632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33448052406311035,
"step": 340,
"valid_targets_mean": 2878.0,
"valid_targets_min": 512
},
{
"epoch": 0.36239495798319327,
"grad_norm": 0.7046783787151958,
"learning_rate": 2.0629685157421292e-05,
"loss": 0.3697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35749202966690063,
"step": 345,
"valid_targets_mean": 3215.4,
"valid_targets_min": 1202
},
{
"epoch": 0.36764705882352944,
"grad_norm": 0.7219690552414987,
"learning_rate": 2.092953523238381e-05,
"loss": 0.3881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37818586826324463,
"step": 350,
"valid_targets_mean": 3693.1,
"valid_targets_min": 1455
},
{
"epoch": 0.37289915966386555,
"grad_norm": 0.6860266938886983,
"learning_rate": 2.1229385307346328e-05,
"loss": 0.3675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34528088569641113,
"step": 355,
"valid_targets_mean": 3477.5,
"valid_targets_min": 1571
},
{
"epoch": 0.37815126050420167,
"grad_norm": 0.7609425900554888,
"learning_rate": 2.152923538230885e-05,
"loss": 0.3949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.429862916469574,
"step": 360,
"valid_targets_mean": 2912.1,
"valid_targets_min": 1450
},
{
"epoch": 0.38340336134453784,
"grad_norm": 0.6848089283903739,
"learning_rate": 2.1829085457271363e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3468002676963806,
"step": 365,
"valid_targets_mean": 3323.0,
"valid_targets_min": 1431
},
{
"epoch": 0.38865546218487396,
"grad_norm": 0.7419166645990429,
"learning_rate": 2.2128935532233884e-05,
"loss": 0.3744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3837374746799469,
"step": 370,
"valid_targets_mean": 3461.4,
"valid_targets_min": 1147
},
{
"epoch": 0.3939075630252101,
"grad_norm": 0.8576299436135565,
"learning_rate": 2.2428785607196405e-05,
"loss": 0.393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39932119846343994,
"step": 375,
"valid_targets_mean": 2641.6,
"valid_targets_min": 998
},
{
"epoch": 0.39915966386554624,
"grad_norm": 0.7247001275212052,
"learning_rate": 2.2728635682158923e-05,
"loss": 0.3684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3718080520629883,
"step": 380,
"valid_targets_mean": 3260.9,
"valid_targets_min": 614
},
{
"epoch": 0.40441176470588236,
"grad_norm": 0.7885722026955804,
"learning_rate": 2.302848575712144e-05,
"loss": 0.3797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39757227897644043,
"step": 385,
"valid_targets_mean": 2796.2,
"valid_targets_min": 1005
},
{
"epoch": 0.4096638655462185,
"grad_norm": 0.7828630662690874,
"learning_rate": 2.3328335832083958e-05,
"loss": 0.3793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3814929127693176,
"step": 390,
"valid_targets_mean": 3183.6,
"valid_targets_min": 2298
},
{
"epoch": 0.41491596638655465,
"grad_norm": 0.8409621672836618,
"learning_rate": 2.362818590704648e-05,
"loss": 0.3763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3965279459953308,
"step": 395,
"valid_targets_mean": 2821.2,
"valid_targets_min": 617
},
{
"epoch": 0.42016806722689076,
"grad_norm": 0.6764711962883958,
"learning_rate": 2.3928035982009e-05,
"loss": 0.355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3417738080024719,
"step": 400,
"valid_targets_mean": 3265.2,
"valid_targets_min": 1665
},
{
"epoch": 0.4254201680672269,
"grad_norm": 0.7365452834319242,
"learning_rate": 2.4227886056971515e-05,
"loss": 0.3735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3877049684524536,
"step": 405,
"valid_targets_mean": 3019.3,
"valid_targets_min": 1076
},
{
"epoch": 0.43067226890756305,
"grad_norm": 0.6737132753666218,
"learning_rate": 2.4527736131934036e-05,
"loss": 0.3566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36130669713020325,
"step": 410,
"valid_targets_mean": 3610.8,
"valid_targets_min": 790
},
{
"epoch": 0.43592436974789917,
"grad_norm": 0.9130730152687944,
"learning_rate": 2.4827586206896553e-05,
"loss": 0.3783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3609384000301361,
"step": 415,
"valid_targets_mean": 3255.8,
"valid_targets_min": 1728
},
{
"epoch": 0.4411764705882353,
"grad_norm": 0.8464202746590961,
"learning_rate": 2.5127436281859074e-05,
"loss": 0.3788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33865395188331604,
"step": 420,
"valid_targets_mean": 3377.2,
"valid_targets_min": 981
},
{
"epoch": 0.44642857142857145,
"grad_norm": 0.7384506566000549,
"learning_rate": 2.542728635682159e-05,
"loss": 0.3462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3339518904685974,
"step": 425,
"valid_targets_mean": 2839.1,
"valid_targets_min": 1351
},
{
"epoch": 0.45168067226890757,
"grad_norm": 0.6110714780946447,
"learning_rate": 2.572713643178411e-05,
"loss": 0.3677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3625059425830841,
"step": 430,
"valid_targets_mean": 4396.7,
"valid_targets_min": 2416
},
{
"epoch": 0.4569327731092437,
"grad_norm": 0.5790619763281034,
"learning_rate": 2.602698650674663e-05,
"loss": 0.3524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32317501306533813,
"step": 435,
"valid_targets_mean": 4668.6,
"valid_targets_min": 1233
},
{
"epoch": 0.46218487394957986,
"grad_norm": 0.642678687454446,
"learning_rate": 2.632683658170915e-05,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3185131549835205,
"step": 440,
"valid_targets_mean": 3936.4,
"valid_targets_min": 1524
},
{
"epoch": 0.46743697478991597,
"grad_norm": 0.5867900140587048,
"learning_rate": 2.6626686656671666e-05,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3317568600177765,
"step": 445,
"valid_targets_mean": 4389.3,
"valid_targets_min": 856
},
{
"epoch": 0.4726890756302521,
"grad_norm": 0.6996864572340856,
"learning_rate": 2.6926536731634184e-05,
"loss": 0.3573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35135549306869507,
"step": 450,
"valid_targets_mean": 3241.3,
"valid_targets_min": 906
},
{
"epoch": 0.47794117647058826,
"grad_norm": 0.6713569052572641,
"learning_rate": 2.7226386806596705e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3594322204589844,
"step": 455,
"valid_targets_mean": 3680.4,
"valid_targets_min": 832
},
{
"epoch": 0.4831932773109244,
"grad_norm": 0.6528374934626601,
"learning_rate": 2.752623688155922e-05,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33547288179397583,
"step": 460,
"valid_targets_mean": 3168.9,
"valid_targets_min": 1484
},
{
"epoch": 0.4884453781512605,
"grad_norm": 0.7585928062211041,
"learning_rate": 2.782608695652174e-05,
"loss": 0.3517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34602272510528564,
"step": 465,
"valid_targets_mean": 3667.5,
"valid_targets_min": 1440
},
{
"epoch": 0.49369747899159666,
"grad_norm": 0.7549275178598076,
"learning_rate": 2.812593703148426e-05,
"loss": 0.3689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40832167863845825,
"step": 470,
"valid_targets_mean": 3025.6,
"valid_targets_min": 1349
},
{
"epoch": 0.4989495798319328,
"grad_norm": 0.8305062206700754,
"learning_rate": 2.8425787106446782e-05,
"loss": 0.3684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36201930046081543,
"step": 475,
"valid_targets_mean": 2935.8,
"valid_targets_min": 1156
},
{
"epoch": 0.5042016806722689,
"grad_norm": 0.7148304561333289,
"learning_rate": 2.8725637181409296e-05,
"loss": 0.358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3326527178287506,
"step": 480,
"valid_targets_mean": 3190.4,
"valid_targets_min": 993
},
{
"epoch": 0.509453781512605,
"grad_norm": 0.8146565793649729,
"learning_rate": 2.9025487256371818e-05,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3617240786552429,
"step": 485,
"valid_targets_mean": 2785.6,
"valid_targets_min": 1275
},
{
"epoch": 0.5147058823529411,
"grad_norm": 0.7209287114298926,
"learning_rate": 2.9325337331334335e-05,
"loss": 0.352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36016473174095154,
"step": 490,
"valid_targets_mean": 3266.8,
"valid_targets_min": 1669
},
{
"epoch": 0.5199579831932774,
"grad_norm": 0.7172263463358715,
"learning_rate": 2.9625187406296856e-05,
"loss": 0.3609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36014240980148315,
"step": 495,
"valid_targets_mean": 3357.5,
"valid_targets_min": 1710
},
{
"epoch": 0.5252100840336135,
"grad_norm": 0.6972857671515527,
"learning_rate": 2.992503748125937e-05,
"loss": 0.3617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34464967250823975,
"step": 500,
"valid_targets_mean": 3468.1,
"valid_targets_min": 1685
},
{
"epoch": 0.5304621848739496,
"grad_norm": 0.7173833022077326,
"learning_rate": 3.022488755622189e-05,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35650789737701416,
"step": 505,
"valid_targets_mean": 3659.6,
"valid_targets_min": 1931
},
{
"epoch": 0.5357142857142857,
"grad_norm": 0.7592796407843059,
"learning_rate": 3.052473763118441e-05,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3427087068557739,
"step": 510,
"valid_targets_mean": 3862.3,
"valid_targets_min": 2009
},
{
"epoch": 0.5409663865546218,
"grad_norm": 1.1258165798910273,
"learning_rate": 3.0824587706146934e-05,
"loss": 0.361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.367844820022583,
"step": 515,
"valid_targets_mean": 1792.6,
"valid_targets_min": 777
},
{
"epoch": 0.5462184873949579,
"grad_norm": 1.1349526835427646,
"learning_rate": 3.112443778110945e-05,
"loss": 0.3252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3122398853302002,
"step": 520,
"valid_targets_mean": 1354.7,
"valid_targets_min": 705
},
{
"epoch": 0.5514705882352942,
"grad_norm": 1.8110765728106655,
"learning_rate": 3.142428785607197e-05,
"loss": 0.3052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3012329041957855,
"step": 525,
"valid_targets_mean": 1556.9,
"valid_targets_min": 914
},
{
"epoch": 0.5567226890756303,
"grad_norm": 1.1404918052705433,
"learning_rate": 3.172413793103448e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2664037346839905,
"step": 530,
"valid_targets_mean": 1397.1,
"valid_targets_min": 680
},
{
"epoch": 0.5619747899159664,
"grad_norm": 0.9458053300681202,
"learning_rate": 3.2023988005997004e-05,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.289004921913147,
"step": 535,
"valid_targets_mean": 1698.1,
"valid_targets_min": 819
},
{
"epoch": 0.5672268907563025,
"grad_norm": 1.0086441843661589,
"learning_rate": 3.2323838080959525e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26696014404296875,
"step": 540,
"valid_targets_mean": 1393.1,
"valid_targets_min": 734
},
{
"epoch": 0.5724789915966386,
"grad_norm": 1.0260360672408402,
"learning_rate": 3.262368815592204e-05,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2623750567436218,
"step": 545,
"valid_targets_mean": 1443.1,
"valid_targets_min": 655
},
{
"epoch": 0.5777310924369747,
"grad_norm": 0.9985074269719646,
"learning_rate": 3.292353823088456e-05,
"loss": 0.2606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26140543818473816,
"step": 550,
"valid_targets_mean": 1392.2,
"valid_targets_min": 737
},
{
"epoch": 0.582983193277311,
"grad_norm": 0.9985105336106163,
"learning_rate": 3.3223388305847075e-05,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25588417053222656,
"step": 555,
"valid_targets_mean": 1386.6,
"valid_targets_min": 759
},
{
"epoch": 0.5882352941176471,
"grad_norm": 1.1959754188425515,
"learning_rate": 3.3523238380809596e-05,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27921628952026367,
"step": 560,
"valid_targets_mean": 1442.9,
"valid_targets_min": 750
},
{
"epoch": 0.5934873949579832,
"grad_norm": 1.001393308800324,
"learning_rate": 3.382308845577212e-05,
"loss": 0.2606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2664732336997986,
"step": 565,
"valid_targets_mean": 1536.1,
"valid_targets_min": 780
},
{
"epoch": 0.5987394957983193,
"grad_norm": 0.9505908357818789,
"learning_rate": 3.412293853073464e-05,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2818218767642975,
"step": 570,
"valid_targets_mean": 1463.1,
"valid_targets_min": 679
},
{
"epoch": 0.6039915966386554,
"grad_norm": 1.0707192051376093,
"learning_rate": 3.442278860569715e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2692759931087494,
"step": 575,
"valid_targets_mean": 1292.8,
"valid_targets_min": 771
},
{
"epoch": 0.6092436974789915,
"grad_norm": 1.1070031492080266,
"learning_rate": 3.4722638680659673e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2560975253582001,
"step": 580,
"valid_targets_mean": 1542.4,
"valid_targets_min": 878
},
{
"epoch": 0.6144957983193278,
"grad_norm": 0.898740421578359,
"learning_rate": 3.5022488755622194e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23506242036819458,
"step": 585,
"valid_targets_mean": 1506.8,
"valid_targets_min": 942
},
{
"epoch": 0.6197478991596639,
"grad_norm": 0.9882747404397235,
"learning_rate": 3.5322338830584716e-05,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2667955756187439,
"step": 590,
"valid_targets_mean": 1401.9,
"valid_targets_min": 675
},
{
"epoch": 0.625,
"grad_norm": 0.9973429121391257,
"learning_rate": 3.562218890554723e-05,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2597658038139343,
"step": 595,
"valid_targets_mean": 1483.8,
"valid_targets_min": 892
},
{
"epoch": 0.6302521008403361,
"grad_norm": 1.1184131263781747,
"learning_rate": 3.592203898050975e-05,
"loss": 0.2616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2559979557991028,
"step": 600,
"valid_targets_mean": 1356.3,
"valid_targets_min": 656
},
{
"epoch": 0.6355042016806722,
"grad_norm": 1.1551828432063649,
"learning_rate": 3.6221889055472265e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2352353036403656,
"step": 605,
"valid_targets_mean": 1340.6,
"valid_targets_min": 706
},
{
"epoch": 0.6407563025210085,
"grad_norm": 0.9979079936759186,
"learning_rate": 3.6521739130434786e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257199227809906,
"step": 610,
"valid_targets_mean": 1528.6,
"valid_targets_min": 548
},
{
"epoch": 0.6460084033613446,
"grad_norm": 0.9872520856471761,
"learning_rate": 3.68215892053973e-05,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24192388355731964,
"step": 615,
"valid_targets_mean": 1268.9,
"valid_targets_min": 658
},
{
"epoch": 0.6512605042016807,
"grad_norm": 1.0290619368672818,
"learning_rate": 3.712143928035982e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.250153124332428,
"step": 620,
"valid_targets_mean": 1360.1,
"valid_targets_min": 650
},
{
"epoch": 0.6565126050420168,
"grad_norm": 0.9161121685195928,
"learning_rate": 3.742128935532234e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25210872292518616,
"step": 625,
"valid_targets_mean": 1452.3,
"valid_targets_min": 859
},
{
"epoch": 0.6617647058823529,
"grad_norm": 1.231558662443427,
"learning_rate": 3.772113943028486e-05,
"loss": 0.2355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2508789896965027,
"step": 630,
"valid_targets_mean": 1391.3,
"valid_targets_min": 728
},
{
"epoch": 0.667016806722689,
"grad_norm": 0.8973325739286778,
"learning_rate": 3.802098950524738e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22503423690795898,
"step": 635,
"valid_targets_mean": 1344.4,
"valid_targets_min": 686
},
{
"epoch": 0.6722689075630253,
"grad_norm": 0.9602158780480545,
"learning_rate": 3.83208395802099e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2667675018310547,
"step": 640,
"valid_targets_mean": 1545.2,
"valid_targets_min": 697
},
{
"epoch": 0.6775210084033614,
"grad_norm": 0.9207285003363753,
"learning_rate": 3.862068965517242e-05,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23141629993915558,
"step": 645,
"valid_targets_mean": 1354.6,
"valid_targets_min": 779
},
{
"epoch": 0.6827731092436975,
"grad_norm": 0.8852191091332312,
"learning_rate": 3.8920539730134934e-05,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2596163749694824,
"step": 650,
"valid_targets_mean": 1434.1,
"valid_targets_min": 729
},
{
"epoch": 0.6880252100840336,
"grad_norm": 0.912601154449096,
"learning_rate": 3.9220389805097455e-05,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22037877142429352,
"step": 655,
"valid_targets_mean": 1388.2,
"valid_targets_min": 868
},
{
"epoch": 0.6932773109243697,
"grad_norm": 1.015856823111782,
"learning_rate": 3.9520239880059976e-05,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23023347556591034,
"step": 660,
"valid_targets_mean": 1282.3,
"valid_targets_min": 765
},
{
"epoch": 0.6985294117647058,
"grad_norm": 0.9855004619555965,
"learning_rate": 3.982008995502249e-05,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2527748942375183,
"step": 665,
"valid_targets_mean": 1457.2,
"valid_targets_min": 793
},
{
"epoch": 0.7037815126050421,
"grad_norm": 0.9177092400221334,
"learning_rate": 3.9999989022799437e-05,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26127058267593384,
"step": 670,
"valid_targets_mean": 1448.5,
"valid_targets_min": 806
},
{
"epoch": 0.7090336134453782,
"grad_norm": 0.8689313261706375,
"learning_rate": 3.9999865529431466e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2190496325492859,
"step": 675,
"valid_targets_mean": 1380.7,
"valid_targets_min": 803
},
{
"epoch": 0.7142857142857143,
"grad_norm": 0.8662595043279143,
"learning_rate": 3.9999604822044886e-05,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22773924469947815,
"step": 680,
"valid_targets_mean": 1515.7,
"valid_targets_min": 660
},
{
"epoch": 0.7195378151260504,
"grad_norm": 0.9275572542299572,
"learning_rate": 3.999920690242835e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21551215648651123,
"step": 685,
"valid_targets_mean": 1402.0,
"valid_targets_min": 837
},
{
"epoch": 0.7247899159663865,
"grad_norm": 0.8209341148096483,
"learning_rate": 3.999867177331189e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22521734237670898,
"step": 690,
"valid_targets_mean": 1574.1,
"valid_targets_min": 719
},
{
"epoch": 0.7300420168067226,
"grad_norm": 0.9448587281311374,
"learning_rate": 3.9997999438366895e-05,
"loss": 0.2429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23695966601371765,
"step": 695,
"valid_targets_mean": 1430.1,
"valid_targets_min": 765
},
{
"epoch": 0.7352941176470589,
"grad_norm": 0.9348888815574206,
"learning_rate": 3.9997189902206065e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24235057830810547,
"step": 700,
"valid_targets_mean": 1372.3,
"valid_targets_min": 727
},
{
"epoch": 0.740546218487395,
"grad_norm": 0.898775745123375,
"learning_rate": 3.999624317038344e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20886942744255066,
"step": 705,
"valid_targets_mean": 1192.8,
"valid_targets_min": 655
},
{
"epoch": 0.7457983193277311,
"grad_norm": 0.8896703345645318,
"learning_rate": 3.9995159249394303e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2359616905450821,
"step": 710,
"valid_targets_mean": 1508.0,
"valid_targets_min": 669
},
{
"epoch": 0.7510504201680672,
"grad_norm": 0.9044856336058926,
"learning_rate": 3.999393814667517e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22560223937034607,
"step": 715,
"valid_targets_mean": 1430.2,
"valid_targets_min": 1046
},
{
"epoch": 0.7563025210084033,
"grad_norm": 0.7809432057780077,
"learning_rate": 3.9992579870603695e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2628813087940216,
"step": 720,
"valid_targets_mean": 1651.8,
"valid_targets_min": 692
},
{
"epoch": 0.7615546218487395,
"grad_norm": 0.8587913679452784,
"learning_rate": 3.999108443049869e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24335074424743652,
"step": 725,
"valid_targets_mean": 1540.4,
"valid_targets_min": 846
},
{
"epoch": 0.7668067226890757,
"grad_norm": 0.9548503644681028,
"learning_rate": 3.998945183661997e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2418360412120819,
"step": 730,
"valid_targets_mean": 1455.1,
"valid_targets_min": 764
},
{
"epoch": 0.7720588235294118,
"grad_norm": 0.8057865606417343,
"learning_rate": 3.9987682100168376e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21932202577590942,
"step": 735,
"valid_targets_mean": 1497.4,
"valid_targets_min": 822
},
{
"epoch": 0.7773109243697479,
"grad_norm": 0.8569864825362092,
"learning_rate": 3.99857752332856e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24598419666290283,
"step": 740,
"valid_targets_mean": 1543.8,
"valid_targets_min": 982
},
{
"epoch": 0.782563025210084,
"grad_norm": 0.8966461968047943,
"learning_rate": 3.998373124905418e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24538162350654602,
"step": 745,
"valid_targets_mean": 1346.3,
"valid_targets_min": 713
},
{
"epoch": 0.7878151260504201,
"grad_norm": 0.9787609428455722,
"learning_rate": 3.9981550161497375e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22620789706707,
"step": 750,
"valid_targets_mean": 1395.7,
"valid_targets_min": 721
},
{
"epoch": 0.7930672268907563,
"grad_norm": 0.8647918297737699,
"learning_rate": 3.9979231985579074e-05,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22276586294174194,
"step": 755,
"valid_targets_mean": 1290.6,
"valid_targets_min": 741
},
{
"epoch": 0.7983193277310925,
"grad_norm": 0.8550351182526175,
"learning_rate": 3.99767767372037e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24379882216453552,
"step": 760,
"valid_targets_mean": 1568.1,
"valid_targets_min": 734
},
{
"epoch": 0.8035714285714286,
"grad_norm": 0.8680279094247919,
"learning_rate": 3.997418443321609e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23442883789539337,
"step": 765,
"valid_targets_mean": 1703.1,
"valid_targets_min": 744
},
{
"epoch": 0.8088235294117647,
"grad_norm": 0.9333899796386794,
"learning_rate": 3.997145509140138e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25179609656333923,
"step": 770,
"valid_targets_mean": 1652.8,
"valid_targets_min": 620
},
{
"epoch": 0.8140756302521008,
"grad_norm": 0.7856961011675193,
"learning_rate": 3.9968588730484896e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.224946990609169,
"step": 775,
"valid_targets_mean": 1481.8,
"valid_targets_min": 723
},
{
"epoch": 0.819327731092437,
"grad_norm": 0.7761881827856689,
"learning_rate": 3.9965585370132013e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21191829442977905,
"step": 780,
"valid_targets_mean": 1686.5,
"valid_targets_min": 740
},
{
"epoch": 0.8245798319327731,
"grad_norm": 0.8321605983306755,
"learning_rate": 3.996244503094804e-05,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20524507761001587,
"step": 785,
"valid_targets_mean": 1345.1,
"valid_targets_min": 711
},
{
"epoch": 0.8298319327731093,
"grad_norm": 0.8224185017405469,
"learning_rate": 3.995916773447804e-05,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22673243284225464,
"step": 790,
"valid_targets_mean": 1619.1,
"valid_targets_min": 804
},
{
"epoch": 0.8350840336134454,
"grad_norm": 1.5699722200850348,
"learning_rate": 3.995575350320671e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2145438939332962,
"step": 795,
"valid_targets_mean": 1423.2,
"valid_targets_min": 674
},
{
"epoch": 0.8403361344537815,
"grad_norm": 0.8647740397931104,
"learning_rate": 3.995220236055824e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19764792919158936,
"step": 800,
"valid_targets_mean": 1207.4,
"valid_targets_min": 567
},
{
"epoch": 0.8455882352941176,
"grad_norm": 0.8208866711497894,
"learning_rate": 3.99485143308961e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22692370414733887,
"step": 805,
"valid_targets_mean": 1542.4,
"valid_targets_min": 912
},
{
"epoch": 0.8508403361344538,
"grad_norm": 0.7660210546255793,
"learning_rate": 3.994468943952296e-05,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23304234445095062,
"step": 810,
"valid_targets_mean": 1591.0,
"valid_targets_min": 897
},
{
"epoch": 0.8560924369747899,
"grad_norm": 0.8316792538373139,
"learning_rate": 3.994072771268041e-05,
"loss": 0.2177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2084471583366394,
"step": 815,
"valid_targets_mean": 1290.1,
"valid_targets_min": 773
},
{
"epoch": 0.8613445378151261,
"grad_norm": 0.8668112604053329,
"learning_rate": 3.993662917754885e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24037593603134155,
"step": 820,
"valid_targets_mean": 1407.2,
"valid_targets_min": 679
},
{
"epoch": 0.8665966386554622,
"grad_norm": 0.9891212862372226,
"learning_rate": 3.993239386224732e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22597835958003998,
"step": 825,
"valid_targets_mean": 1600.2,
"valid_targets_min": 818
},
{
"epoch": 0.8718487394957983,
"grad_norm": 0.8365460249899657,
"learning_rate": 3.992802179583322e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22174695134162903,
"step": 830,
"valid_targets_mean": 1442.4,
"valid_targets_min": 790
},
{
"epoch": 0.8771008403361344,
"grad_norm": 0.955688819196928,
"learning_rate": 3.9923513008302204e-05,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23063375055789948,
"step": 835,
"valid_targets_mean": 1426.6,
"valid_targets_min": 592
},
{
"epoch": 0.8823529411764706,
"grad_norm": 0.7775298281309749,
"learning_rate": 3.991886753058792e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21736116707324982,
"step": 840,
"valid_targets_mean": 1430.9,
"valid_targets_min": 662
},
{
"epoch": 0.8876050420168067,
"grad_norm": 0.9219183595495097,
"learning_rate": 3.991408539456182e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2496243417263031,
"step": 845,
"valid_targets_mean": 1412.6,
"valid_targets_min": 622
},
{
"epoch": 0.8928571428571429,
"grad_norm": 0.9447703661465241,
"learning_rate": 3.990916663303293e-05,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2532111406326294,
"step": 850,
"valid_targets_mean": 1372.1,
"valid_targets_min": 667
},
{
"epoch": 0.898109243697479,
"grad_norm": 0.7856700847441219,
"learning_rate": 3.990411127974762e-05,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2314455211162567,
"step": 855,
"valid_targets_mean": 1628.1,
"valid_targets_min": 1012
},
{
"epoch": 0.9033613445378151,
"grad_norm": 0.9349349696144393,
"learning_rate": 3.989891936938939e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2500951886177063,
"step": 860,
"valid_targets_mean": 1464.7,
"valid_targets_min": 635
},
{
"epoch": 0.9086134453781513,
"grad_norm": 0.9119192470614107,
"learning_rate": 3.9893590937578634e-05,
"loss": 0.2337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2547591030597687,
"step": 865,
"valid_targets_mean": 1745.9,
"valid_targets_min": 689
},
{
"epoch": 0.9138655462184874,
"grad_norm": 0.9202449016918255,
"learning_rate": 3.9888126020872375e-05,
"loss": 0.2197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20298632979393005,
"step": 870,
"valid_targets_mean": 1129.1,
"valid_targets_min": 697
},
{
"epoch": 0.9191176470588235,
"grad_norm": 0.8174032516425299,
"learning_rate": 3.988252465676401e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25348424911499023,
"step": 875,
"valid_targets_mean": 1624.6,
"valid_targets_min": 656
},
{
"epoch": 0.9243697478991597,
"grad_norm": 0.7819162668790818,
"learning_rate": 3.98767868836831e-05,
"loss": 0.23,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27575284242630005,
"step": 880,
"valid_targets_mean": 1755.8,
"valid_targets_min": 697
},
{
"epoch": 0.9296218487394958,
"grad_norm": 0.8141268835699211,
"learning_rate": 3.987091274099504e-05,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2335035800933838,
"step": 885,
"valid_targets_mean": 1516.4,
"valid_targets_min": 820
},
{
"epoch": 0.9348739495798319,
"grad_norm": 0.7937591348329995,
"learning_rate": 3.986490226900084e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22677749395370483,
"step": 890,
"valid_targets_mean": 1391.4,
"valid_targets_min": 680
},
{
"epoch": 0.9401260504201681,
"grad_norm": 0.8638827876332873,
"learning_rate": 3.985875550893684e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2247205227613449,
"step": 895,
"valid_targets_mean": 1412.4,
"valid_targets_min": 778
},
{
"epoch": 0.9453781512605042,
"grad_norm": 0.7937334625060325,
"learning_rate": 3.9852472502974386e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25422534346580505,
"step": 900,
"valid_targets_mean": 1599.6,
"valid_targets_min": 851
},
{
"epoch": 0.9506302521008403,
"grad_norm": 0.7815070706059014,
"learning_rate": 3.984605329421961e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21097871661186218,
"step": 905,
"valid_targets_mean": 1398.4,
"valid_targets_min": 692
},
{
"epoch": 0.9558823529411765,
"grad_norm": 0.7673078400464335,
"learning_rate": 3.983949792671307e-05,
"loss": 0.2148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20964649319648743,
"step": 910,
"valid_targets_mean": 1477.9,
"valid_targets_min": 741
},
{
"epoch": 0.9611344537815126,
"grad_norm": 0.851415365699838,
"learning_rate": 3.9832806445429486e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20876117050647736,
"step": 915,
"valid_targets_mean": 1299.4,
"valid_targets_min": 639
},
{
"epoch": 0.9663865546218487,
"grad_norm": 0.866799347417237,
"learning_rate": 3.982597889627742e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21439066529273987,
"step": 920,
"valid_targets_mean": 1277.9,
"valid_targets_min": 743
},
{
"epoch": 0.9716386554621849,
"grad_norm": 0.7220607995686592,
"learning_rate": 3.981901532609896e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2239415943622589,
"step": 925,
"valid_targets_mean": 1529.9,
"valid_targets_min": 610
},
{
"epoch": 0.976890756302521,
"grad_norm": 0.7774847164190153,
"learning_rate": 3.9811915782669406e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20755037665367126,
"step": 930,
"valid_targets_mean": 1331.6,
"valid_targets_min": 695
},
{
"epoch": 0.9821428571428571,
"grad_norm": 0.7514140462848654,
"learning_rate": 3.980468031469691e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2222648710012436,
"step": 935,
"valid_targets_mean": 1581.9,
"valid_targets_min": 807
},
{
"epoch": 0.9873949579831933,
"grad_norm": 0.7556883989929587,
"learning_rate": 3.9797308971822206e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2113157957792282,
"step": 940,
"valid_targets_mean": 1327.6,
"valid_targets_min": 765
},
{
"epoch": 0.9926470588235294,
"grad_norm": 0.7916476167495613,
"learning_rate": 3.978980180461821e-05,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23679675161838531,
"step": 945,
"valid_targets_mean": 1346.4,
"valid_targets_min": 591
},
{
"epoch": 0.9978991596638656,
"grad_norm": 0.7026077039339454,
"learning_rate": 3.9782158864589696e-05,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20915091037750244,
"step": 950,
"valid_targets_mean": 1483.2,
"valid_targets_min": 692
},
{
"epoch": 1.0031512605042017,
"grad_norm": 0.5638798620218901,
"learning_rate": 3.977438020417293e-05,
"loss": 0.3126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33122366666793823,
"step": 955,
"valid_targets_mean": 4404.5,
"valid_targets_min": 1323
},
{
"epoch": 1.0084033613445378,
"grad_norm": 0.5755600203933873,
"learning_rate": 3.9766465876735354e-05,
"loss": 0.3596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3643394112586975,
"step": 960,
"valid_targets_mean": 4483.4,
"valid_targets_min": 1005
},
{
"epoch": 1.013655462184874,
"grad_norm": 0.5433500453139155,
"learning_rate": 3.9758415936575155e-05,
"loss": 0.3387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3266267776489258,
"step": 965,
"valid_targets_mean": 4502.1,
"valid_targets_min": 1509
},
{
"epoch": 1.01890756302521,
"grad_norm": 0.6267141368025664,
"learning_rate": 3.975023043892094e-05,
"loss": 0.3404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3264230787754059,
"step": 970,
"valid_targets_mean": 3430.2,
"valid_targets_min": 1561
},
{
"epoch": 1.0241596638655461,
"grad_norm": 0.607104749067981,
"learning_rate": 3.974190943993133e-05,
"loss": 0.329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3339942693710327,
"step": 975,
"valid_targets_mean": 3385.4,
"valid_targets_min": 1184
},
{
"epoch": 1.0294117647058822,
"grad_norm": 0.536136082897943,
"learning_rate": 3.973345299669461e-05,
"loss": 0.3558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3149448335170746,
"step": 980,
"valid_targets_mean": 3982.6,
"valid_targets_min": 1413
},
{
"epoch": 1.0346638655462186,
"grad_norm": 0.5075659675082035,
"learning_rate": 3.972486116722828e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32082343101501465,
"step": 985,
"valid_targets_mean": 4911.7,
"valid_targets_min": 2160
},
{
"epoch": 1.0399159663865547,
"grad_norm": 0.5581426071520623,
"learning_rate": 3.971613401047872e-05,
"loss": 0.3346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35363245010375977,
"step": 990,
"valid_targets_mean": 3782.6,
"valid_targets_min": 1511
},
{
"epoch": 1.0451680672268908,
"grad_norm": 0.698413730384984,
"learning_rate": 3.970727158632075e-05,
"loss": 0.3462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.374415785074234,
"step": 995,
"valid_targets_mean": 3030.0,
"valid_targets_min": 1462
},
{
"epoch": 1.050420168067227,
"grad_norm": 0.6206079287451801,
"learning_rate": 3.969827395555721e-05,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3208198845386505,
"step": 1000,
"valid_targets_mean": 3772.4,
"valid_targets_min": 874
},
{
"epoch": 1.055672268907563,
"grad_norm": 0.6660693366788901,
"learning_rate": 3.968914117991857e-05,
"loss": 0.3445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3395417630672455,
"step": 1005,
"valid_targets_mean": 3337.1,
"valid_targets_min": 953
},
{
"epoch": 1.0609243697478992,
"grad_norm": 0.6001541700551754,
"learning_rate": 3.967987332206249e-05,
"loss": 0.3465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3561500310897827,
"step": 1010,
"valid_targets_mean": 4284.9,
"valid_targets_min": 1265
},
{
"epoch": 1.0661764705882353,
"grad_norm": 0.5433768685257184,
"learning_rate": 3.967047044557341e-05,
"loss": 0.3387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3220909833908081,
"step": 1015,
"valid_targets_mean": 5010.6,
"valid_targets_min": 1596
},
{
"epoch": 1.0714285714285714,
"grad_norm": 0.6300742894051691,
"learning_rate": 3.966093261496208e-05,
"loss": 0.3393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3596876561641693,
"step": 1020,
"valid_targets_mean": 3490.4,
"valid_targets_min": 1759
},
{
"epoch": 1.0766806722689075,
"grad_norm": 0.6791244172980975,
"learning_rate": 3.9651259895665146e-05,
"loss": 0.3504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36252090334892273,
"step": 1025,
"valid_targets_mean": 3264.3,
"valid_targets_min": 1353
},
{
"epoch": 1.0819327731092436,
"grad_norm": 0.5749237683976328,
"learning_rate": 3.9641452354044687e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31524378061294556,
"step": 1030,
"valid_targets_mean": 3814.6,
"valid_targets_min": 1643
},
{
"epoch": 1.0871848739495797,
"grad_norm": 0.6067338424067318,
"learning_rate": 3.9631510057387765e-05,
"loss": 0.345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32914769649505615,
"step": 1035,
"valid_targets_mean": 3166.1,
"valid_targets_min": 1269
},
{
"epoch": 1.092436974789916,
"grad_norm": 0.6139160246013105,
"learning_rate": 3.962143307390596e-05,
"loss": 0.3648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3532394766807556,
"step": 1040,
"valid_targets_mean": 3617.4,
"valid_targets_min": 1681
},
{
"epoch": 1.0976890756302522,
"grad_norm": 0.5852424169834737,
"learning_rate": 3.961122147273491e-05,
"loss": 0.3475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.306821346282959,
"step": 1045,
"valid_targets_mean": 3919.8,
"valid_targets_min": 1477
},
{
"epoch": 1.1029411764705883,
"grad_norm": 0.6196200689994448,
"learning_rate": 3.9600875323933826e-05,
"loss": 0.3494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34865230321884155,
"step": 1050,
"valid_targets_mean": 3418.5,
"valid_targets_min": 662
},
{
"epoch": 1.1081932773109244,
"grad_norm": 0.5913392876658434,
"learning_rate": 3.959039469848502e-05,
"loss": 0.3432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3537408113479614,
"step": 1055,
"valid_targets_mean": 3706.7,
"valid_targets_min": 2077
},
{
"epoch": 1.1134453781512605,
"grad_norm": 0.6771276206524633,
"learning_rate": 3.9579779668293416e-05,
"loss": 0.3249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3203701972961426,
"step": 1060,
"valid_targets_mean": 2878.1,
"valid_targets_min": 1505
},
{
"epoch": 1.1186974789915967,
"grad_norm": 0.6786962469374573,
"learning_rate": 3.956903030618605e-05,
"loss": 0.3523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35575729608535767,
"step": 1065,
"valid_targets_mean": 3418.0,
"valid_targets_min": 1957
},
{
"epoch": 1.1239495798319328,
"grad_norm": 0.5934416223711014,
"learning_rate": 3.955814668591156e-05,
"loss": 0.3487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38778382539749146,
"step": 1070,
"valid_targets_mean": 4106.4,
"valid_targets_min": 1704
},
{
"epoch": 1.129201680672269,
"grad_norm": 1.3852530686455735,
"learning_rate": 3.9547128882139735e-05,
"loss": 0.3349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3465884327888489,
"step": 1075,
"valid_targets_mean": 3046.9,
"valid_targets_min": 1422
},
{
"epoch": 1.134453781512605,
"grad_norm": 0.5980418747067316,
"learning_rate": 3.9535976970460925e-05,
"loss": 0.3252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3092625141143799,
"step": 1080,
"valid_targets_mean": 3447.4,
"valid_targets_min": 1603
},
{
"epoch": 1.1397058823529411,
"grad_norm": 0.7839568612134259,
"learning_rate": 3.9524691027385585e-05,
"loss": 0.3504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3626514971256256,
"step": 1085,
"valid_targets_mean": 2597.8,
"valid_targets_min": 1685
},
{
"epoch": 1.1449579831932772,
"grad_norm": 0.6257049596683059,
"learning_rate": 3.95132711303437e-05,
"loss": 0.3294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3430899977684021,
"step": 1090,
"valid_targets_mean": 3290.6,
"valid_targets_min": 1208
},
{
"epoch": 1.1502100840336134,
"grad_norm": 0.9029010729944724,
"learning_rate": 3.9501717357684315e-05,
"loss": 0.3368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.326965868473053,
"step": 1095,
"valid_targets_mean": 2661.8,
"valid_targets_min": 1501
},
{
"epoch": 1.1554621848739495,
"grad_norm": 0.6012247577775289,
"learning_rate": 3.9490029788674934e-05,
"loss": 0.3438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3628232479095459,
"step": 1100,
"valid_targets_mean": 3849.0,
"valid_targets_min": 1866
},
{
"epoch": 1.1607142857142858,
"grad_norm": 0.614388950135581,
"learning_rate": 3.9478208503501e-05,
"loss": 0.3242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31284618377685547,
"step": 1105,
"valid_targets_mean": 3397.9,
"valid_targets_min": 1239
},
{
"epoch": 1.165966386554622,
"grad_norm": 0.653467443640438,
"learning_rate": 3.946625358326538e-05,
"loss": 0.3439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.346976101398468,
"step": 1110,
"valid_targets_mean": 3155.5,
"valid_targets_min": 1177
},
{
"epoch": 1.171218487394958,
"grad_norm": 0.579694254639963,
"learning_rate": 3.945416510998775e-05,
"loss": 0.3355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32414424419403076,
"step": 1115,
"valid_targets_mean": 3594.5,
"valid_targets_min": 1270
},
{
"epoch": 1.1764705882352942,
"grad_norm": 0.6219350779760418,
"learning_rate": 3.944194316660406e-05,
"loss": 0.3396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3272247314453125,
"step": 1120,
"valid_targets_mean": 3571.2,
"valid_targets_min": 1216
},
{
"epoch": 1.1817226890756303,
"grad_norm": 0.6292410803179813,
"learning_rate": 3.942958783696598e-05,
"loss": 0.3334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32565245032310486,
"step": 1125,
"valid_targets_mean": 3290.8,
"valid_targets_min": 1184
},
{
"epoch": 1.1869747899159664,
"grad_norm": 0.678979812159635,
"learning_rate": 3.94170992058403e-05,
"loss": 0.3349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3311670422554016,
"step": 1130,
"valid_targets_mean": 2986.1,
"valid_targets_min": 1292
},
{
"epoch": 1.1922268907563025,
"grad_norm": 0.6456475043572049,
"learning_rate": 3.9404477358908354e-05,
"loss": 0.3445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3214397132396698,
"step": 1135,
"valid_targets_mean": 3485.4,
"valid_targets_min": 1639
},
{
"epoch": 1.1974789915966386,
"grad_norm": 0.6695778532642306,
"learning_rate": 3.9391722382765445e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35410648584365845,
"step": 1140,
"valid_targets_mean": 2959.4,
"valid_targets_min": 1394
},
{
"epoch": 1.2027310924369747,
"grad_norm": 0.622191556528526,
"learning_rate": 3.937883436492025e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3593181073665619,
"step": 1145,
"valid_targets_mean": 3428.9,
"valid_targets_min": 2280
},
{
"epoch": 1.2079831932773109,
"grad_norm": 0.6333880919334702,
"learning_rate": 3.9365813393794186e-05,
"loss": 0.3265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35325169563293457,
"step": 1150,
"valid_targets_mean": 3233.9,
"valid_targets_min": 810
},
{
"epoch": 1.213235294117647,
"grad_norm": 0.6223354482954172,
"learning_rate": 3.9352659558720836e-05,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3268436789512634,
"step": 1155,
"valid_targets_mean": 3211.6,
"valid_targets_min": 1654
},
{
"epoch": 1.2184873949579833,
"grad_norm": 0.659296380097006,
"learning_rate": 3.933937294994535e-05,
"loss": 0.3341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320861279964447,
"step": 1160,
"valid_targets_mean": 3057.8,
"valid_targets_min": 584
},
{
"epoch": 1.2237394957983194,
"grad_norm": 0.636761914351194,
"learning_rate": 3.932595365862379e-05,
"loss": 0.3322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34962353110313416,
"step": 1165,
"valid_targets_mean": 3572.6,
"valid_targets_min": 2498
},
{
"epoch": 1.2289915966386555,
"grad_norm": 0.6592752073339605,
"learning_rate": 3.9312401776822504e-05,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32008883357048035,
"step": 1170,
"valid_targets_mean": 3161.1,
"valid_targets_min": 1350
},
{
"epoch": 1.2342436974789917,
"grad_norm": 0.6063230189221366,
"learning_rate": 3.9298717397517546e-05,
"loss": 0.3365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3388460874557495,
"step": 1175,
"valid_targets_mean": 3486.1,
"valid_targets_min": 1624
},
{
"epoch": 1.2394957983193278,
"grad_norm": 0.687253883898937,
"learning_rate": 3.928490061459396e-05,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3046797513961792,
"step": 1180,
"valid_targets_mean": 2769.6,
"valid_targets_min": 916
},
{
"epoch": 1.2447478991596639,
"grad_norm": 0.5602035515910363,
"learning_rate": 3.927095152284521e-05,
"loss": 0.331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3130587935447693,
"step": 1185,
"valid_targets_mean": 3734.1,
"valid_targets_min": 2209
},
{
"epoch": 1.25,
"grad_norm": 0.6913362496913676,
"learning_rate": 3.925687021797249e-05,
"loss": 0.3228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32542842626571655,
"step": 1190,
"valid_targets_mean": 3107.0,
"valid_targets_min": 1259
},
{
"epoch": 1.2552521008403361,
"grad_norm": 0.5736429239269779,
"learning_rate": 3.924265679658407e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30502641201019287,
"step": 1195,
"valid_targets_mean": 3685.6,
"valid_targets_min": 1183
},
{
"epoch": 1.2605042016806722,
"grad_norm": 0.577437241781624,
"learning_rate": 3.922831135619462e-05,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3453516364097595,
"step": 1200,
"valid_targets_mean": 3891.3,
"valid_targets_min": 1101
},
{
"epoch": 1.2657563025210083,
"grad_norm": 0.5958378130959316,
"learning_rate": 3.9213833995224605e-05,
"loss": 0.3321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3231067359447479,
"step": 1205,
"valid_targets_mean": 3877.6,
"valid_targets_min": 1658
},
{
"epoch": 1.2710084033613445,
"grad_norm": 0.6735908115281981,
"learning_rate": 3.919922481299952e-05,
"loss": 0.3188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3365190923213959,
"step": 1210,
"valid_targets_mean": 3050.1,
"valid_targets_min": 1423
},
{
"epoch": 1.2762605042016806,
"grad_norm": 0.6601685873762229,
"learning_rate": 3.918448390974928e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3299792408943176,
"step": 1215,
"valid_targets_mean": 3202.4,
"valid_targets_min": 1185
},
{
"epoch": 1.2815126050420167,
"grad_norm": 0.6705034899134344,
"learning_rate": 3.9169611386607476e-05,
"loss": 0.3418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34724968671798706,
"step": 1220,
"valid_targets_mean": 3779.1,
"valid_targets_min": 1091
},
{
"epoch": 1.2867647058823528,
"grad_norm": 0.5833278508200939,
"learning_rate": 3.9154607345610746e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3058725893497467,
"step": 1225,
"valid_targets_mean": 3628.9,
"valid_targets_min": 1352
},
{
"epoch": 1.2920168067226891,
"grad_norm": 0.5696798688900944,
"learning_rate": 3.913947188969801e-05,
"loss": 0.3224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32415255904197693,
"step": 1230,
"valid_targets_mean": 4061.2,
"valid_targets_min": 1535
},
{
"epoch": 1.2972689075630253,
"grad_norm": 0.6650203053880857,
"learning_rate": 3.912420512270981e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3156277537345886,
"step": 1235,
"valid_targets_mean": 2753.1,
"valid_targets_min": 854
},
{
"epoch": 1.3025210084033614,
"grad_norm": 0.6404333915329682,
"learning_rate": 3.910880714938757e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30156928300857544,
"step": 1240,
"valid_targets_mean": 2942.5,
"valid_targets_min": 1179
},
{
"epoch": 1.3077731092436975,
"grad_norm": 0.604288417212929,
"learning_rate": 3.909327807537288e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30336058139801025,
"step": 1245,
"valid_targets_mean": 3598.9,
"valid_targets_min": 1290
},
{
"epoch": 1.3130252100840336,
"grad_norm": 0.875497325929702,
"learning_rate": 3.90776180072068e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32053911685943604,
"step": 1250,
"valid_targets_mean": 2332.6,
"valid_targets_min": 642
},
{
"epoch": 1.3182773109243697,
"grad_norm": 0.6151615426766832,
"learning_rate": 3.906182705232909e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3063713312149048,
"step": 1255,
"valid_targets_mean": 3670.2,
"valid_targets_min": 1764
},
{
"epoch": 1.3235294117647058,
"grad_norm": 0.6686081770965902,
"learning_rate": 3.904590531907751e-05,
"loss": 0.3375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3719046711921692,
"step": 1260,
"valid_targets_mean": 3528.6,
"valid_targets_min": 1410
},
{
"epoch": 1.328781512605042,
"grad_norm": 0.7395507920156082,
"learning_rate": 3.9029852916687034e-05,
"loss": 0.3145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3327389657497406,
"step": 1265,
"valid_targets_mean": 3147.7,
"valid_targets_min": 1683
},
{
"epoch": 1.334033613445378,
"grad_norm": 0.709030289881482,
"learning_rate": 3.9013669955289136e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3167096972465515,
"step": 1270,
"valid_targets_mean": 3632.5,
"valid_targets_min": 996
},
{
"epoch": 1.3392857142857144,
"grad_norm": 0.6586192793197465,
"learning_rate": 3.899735654591101e-05,
"loss": 0.3171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3190867602825165,
"step": 1275,
"valid_targets_mean": 3135.3,
"valid_targets_min": 1349
},
{
"epoch": 1.3445378151260505,
"grad_norm": 0.682140733121633,
"learning_rate": 3.898091280047486e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33190667629241943,
"step": 1280,
"valid_targets_mean": 3391.6,
"valid_targets_min": 1248
},
{
"epoch": 1.3497899159663866,
"grad_norm": 0.5957692884205409,
"learning_rate": 3.896433883179703e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3161918520927429,
"step": 1285,
"valid_targets_mean": 3323.4,
"valid_targets_min": 1445
},
{
"epoch": 1.3550420168067228,
"grad_norm": 0.6350286869649353,
"learning_rate": 3.894763475358736e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3040814995765686,
"step": 1290,
"valid_targets_mean": 3134.3,
"valid_targets_min": 2000
},
{
"epoch": 1.3602941176470589,
"grad_norm": 0.6934797525878172,
"learning_rate": 3.8930800680448275e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32412275671958923,
"step": 1295,
"valid_targets_mean": 2828.3,
"valid_targets_min": 1197
},
{
"epoch": 1.365546218487395,
"grad_norm": 0.6077199732980291,
"learning_rate": 3.891383672787411e-05,
"loss": 0.331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32446929812431335,
"step": 1300,
"valid_targets_mean": 3219.0,
"valid_targets_min": 1223
},
{
"epoch": 1.370798319327731,
"grad_norm": 0.6275476086489861,
"learning_rate": 3.889674301225025e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29918792843818665,
"step": 1305,
"valid_targets_mean": 3199.2,
"valid_targets_min": 869
},
{
"epoch": 1.3760504201680672,
"grad_norm": 0.6746694949290901,
"learning_rate": 3.8879519650852356e-05,
"loss": 0.3256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33456575870513916,
"step": 1310,
"valid_targets_mean": 2817.8,
"valid_targets_min": 1603
},
{
"epoch": 1.3813025210084033,
"grad_norm": 0.6421028373174448,
"learning_rate": 3.886216676184555e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3090163767337799,
"step": 1315,
"valid_targets_mean": 2942.2,
"valid_targets_min": 1135
},
{
"epoch": 1.3865546218487395,
"grad_norm": 0.5573926446318049,
"learning_rate": 3.8844684464283614e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33767062425613403,
"step": 1320,
"valid_targets_mean": 4077.0,
"valid_targets_min": 1994
},
{
"epoch": 1.3918067226890756,
"grad_norm": 0.637126836573775,
"learning_rate": 3.882707287810817e-05,
"loss": 0.3286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30095210671424866,
"step": 1325,
"valid_targets_mean": 3060.1,
"valid_targets_min": 1066
},
{
"epoch": 1.3970588235294117,
"grad_norm": 0.6321058379302512,
"learning_rate": 3.880933212414786e-05,
"loss": 0.3285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33812808990478516,
"step": 1330,
"valid_targets_mean": 3687.4,
"valid_targets_min": 1211
},
{
"epoch": 1.4023109243697478,
"grad_norm": 0.6375112145565428,
"learning_rate": 3.87914623241175e-05,
"loss": 0.3213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3038761019706726,
"step": 1335,
"valid_targets_mean": 2972.2,
"valid_targets_min": 1195
},
{
"epoch": 1.407563025210084,
"grad_norm": 0.7592514428689119,
"learning_rate": 3.877346360061728e-05,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3361939489841461,
"step": 1340,
"valid_targets_mean": 2429.5,
"valid_targets_min": 484
},
{
"epoch": 1.41281512605042,
"grad_norm": 0.6066430879087057,
"learning_rate": 3.8755336077131894e-05,
"loss": 0.3227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3248080015182495,
"step": 1345,
"valid_targets_mean": 3851.9,
"valid_targets_min": 1257
},
{
"epoch": 1.4180672268907564,
"grad_norm": 0.5858554643624372,
"learning_rate": 3.873707987802967e-05,
"loss": 0.3208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.304246723651886,
"step": 1350,
"valid_targets_mean": 3483.2,
"valid_targets_min": 1372
},
{
"epoch": 1.4233193277310925,
"grad_norm": 0.6612075948640241,
"learning_rate": 3.871869512856179e-05,
"loss": 0.3129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3278389275074005,
"step": 1355,
"valid_targets_mean": 3186.8,
"valid_targets_min": 1769
},
{
"epoch": 1.4285714285714286,
"grad_norm": 0.6552998713136254,
"learning_rate": 3.870018195486138e-05,
"loss": 0.3158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31067150831222534,
"step": 1360,
"valid_targets_mean": 3407.6,
"valid_targets_min": 1074
},
{
"epoch": 1.4338235294117647,
"grad_norm": 0.5966743275691717,
"learning_rate": 3.868154048394262e-05,
"loss": 0.3239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3010474741458893,
"step": 1365,
"valid_targets_mean": 3796.4,
"valid_targets_min": 980
},
{
"epoch": 1.4390756302521008,
"grad_norm": 0.7359011060228771,
"learning_rate": 3.8662770843699944e-05,
"loss": 0.3306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3496723771095276,
"step": 1370,
"valid_targets_mean": 2808.1,
"valid_targets_min": 793
},
{
"epoch": 1.444327731092437,
"grad_norm": 0.65437369178061,
"learning_rate": 3.8643873162907086e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3403715491294861,
"step": 1375,
"valid_targets_mean": 3677.5,
"valid_targets_min": 1471
},
{
"epoch": 1.449579831932773,
"grad_norm": 0.6531132095155441,
"learning_rate": 3.862484757121627e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28045761585235596,
"step": 1380,
"valid_targets_mean": 3032.6,
"valid_targets_min": 1353
},
{
"epoch": 1.4548319327731092,
"grad_norm": 0.7024121158190606,
"learning_rate": 3.860569419915727e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31772103905677795,
"step": 1385,
"valid_targets_mean": 2601.9,
"valid_targets_min": 1084
},
{
"epoch": 1.4600840336134453,
"grad_norm": 0.6174258612511311,
"learning_rate": 3.858641317813653e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3092023730278015,
"step": 1390,
"valid_targets_mean": 3280.8,
"valid_targets_min": 1428
},
{
"epoch": 1.4653361344537816,
"grad_norm": 0.6773260761366405,
"learning_rate": 3.8567004640436234e-05,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30377262830734253,
"step": 1395,
"valid_targets_mean": 3229.4,
"valid_targets_min": 1193
},
{
"epoch": 1.4705882352941178,
"grad_norm": 0.6442894382965205,
"learning_rate": 3.8547468719213476e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2951875925064087,
"step": 1400,
"valid_targets_mean": 3519.2,
"valid_targets_min": 1614
},
{
"epoch": 1.4758403361344539,
"grad_norm": 0.6233027503211065,
"learning_rate": 3.852780554849925e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2837674617767334,
"step": 1405,
"valid_targets_mean": 3699.1,
"valid_targets_min": 974
},
{
"epoch": 1.48109243697479,
"grad_norm": 0.6558871789844729,
"learning_rate": 3.850801526319761e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.277635395526886,
"step": 1410,
"valid_targets_mean": 2730.4,
"valid_targets_min": 1575
},
{
"epoch": 1.486344537815126,
"grad_norm": 0.5993355650257447,
"learning_rate": 3.84880979990847e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.289740651845932,
"step": 1415,
"valid_targets_mean": 3345.0,
"valid_targets_min": 1697
},
{
"epoch": 1.4915966386554622,
"grad_norm": 0.5660470420295868,
"learning_rate": 3.846805389280782e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2910107374191284,
"step": 1420,
"valid_targets_mean": 3602.2,
"valid_targets_min": 1970
},
{
"epoch": 1.4968487394957983,
"grad_norm": 0.6727298285320141,
"learning_rate": 3.844788308188452e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3241168260574341,
"step": 1425,
"valid_targets_mean": 3128.4,
"valid_targets_min": 887
},
{
"epoch": 1.5021008403361344,
"grad_norm": 0.7266333636248493,
"learning_rate": 3.8427585704701634e-05,
"loss": 0.3085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3230634331703186,
"step": 1430,
"valid_targets_mean": 2712.2,
"valid_targets_min": 1279
},
{
"epoch": 1.5073529411764706,
"grad_norm": 0.625826335328431,
"learning_rate": 3.840716190051433e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28237617015838623,
"step": 1435,
"valid_targets_mean": 3052.6,
"valid_targets_min": 1021
},
{
"epoch": 1.5126050420168067,
"grad_norm": 0.643231670297035,
"learning_rate": 3.8386611809445155e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30906054377555847,
"step": 1440,
"valid_targets_mean": 3352.1,
"valid_targets_min": 654
},
{
"epoch": 1.5178571428571428,
"grad_norm": 0.7439322282160008,
"learning_rate": 3.8365935572483095e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3927016258239746,
"step": 1445,
"valid_targets_mean": 2860.6,
"valid_targets_min": 1039
},
{
"epoch": 1.523109243697479,
"grad_norm": 0.5906966913938343,
"learning_rate": 3.834513333148258e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29975053668022156,
"step": 1450,
"valid_targets_mean": 3742.9,
"valid_targets_min": 2459
},
{
"epoch": 1.528361344537815,
"grad_norm": 0.5784262635567486,
"learning_rate": 3.832420522916252e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27920496463775635,
"step": 1455,
"valid_targets_mean": 3435.8,
"valid_targets_min": 1276
},
{
"epoch": 1.5336134453781511,
"grad_norm": 0.5304379397196218,
"learning_rate": 3.830315140910534e-05,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2916795015335083,
"step": 1460,
"valid_targets_mean": 4335.8,
"valid_targets_min": 1572
},
{
"epoch": 1.5388655462184873,
"grad_norm": 0.690684220200614,
"learning_rate": 3.8281972015755965e-05,
"loss": 0.309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32439422607421875,
"step": 1465,
"valid_targets_mean": 2975.5,
"valid_targets_min": 791
},
{
"epoch": 1.5441176470588234,
"grad_norm": 0.9031172365787135,
"learning_rate": 3.826066719442086e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22157755494117737,
"step": 1470,
"valid_targets_mean": 1444.9,
"valid_targets_min": 740
},
{
"epoch": 1.5493697478991597,
"grad_norm": 0.8412510599148572,
"learning_rate": 3.823923709126701e-05,
"loss": 0.2161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22126498818397522,
"step": 1475,
"valid_targets_mean": 1456.5,
"valid_targets_min": 612
},
{
"epoch": 1.5546218487394958,
"grad_norm": 1.1541206078120574,
"learning_rate": 3.821768185332095e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2107081413269043,
"step": 1480,
"valid_targets_mean": 1432.6,
"valid_targets_min": 826
},
{
"epoch": 1.559873949579832,
"grad_norm": 0.8048779001890545,
"learning_rate": 3.81960016284677e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.192092627286911,
"step": 1485,
"valid_targets_mean": 1432.6,
"valid_targets_min": 742
},
{
"epoch": 1.565126050420168,
"grad_norm": 0.8091682143521767,
"learning_rate": 3.817419656544979e-05,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21445538103580475,
"step": 1490,
"valid_targets_mean": 1387.0,
"valid_targets_min": 718
},
{
"epoch": 1.5703781512605042,
"grad_norm": 0.8028634331257293,
"learning_rate": 3.815226681386626e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21761010587215424,
"step": 1495,
"valid_targets_mean": 1527.4,
"valid_targets_min": 764
},
{
"epoch": 1.5756302521008403,
"grad_norm": 0.7439177233189905,
"learning_rate": 3.8130212524171576e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19787126779556274,
"step": 1500,
"valid_targets_mean": 1353.6,
"valid_targets_min": 725
},
{
"epoch": 1.5808823529411766,
"grad_norm": 0.8142970979200826,
"learning_rate": 3.810803384767465e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1932760328054428,
"step": 1505,
"valid_targets_mean": 1309.9,
"valid_targets_min": 610
},
{
"epoch": 1.5861344537815127,
"grad_norm": 0.7340679359153581,
"learning_rate": 3.808573093653777e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19831883907318115,
"step": 1510,
"valid_targets_mean": 1465.4,
"valid_targets_min": 720
},
{
"epoch": 1.5913865546218489,
"grad_norm": 0.7860661366128959,
"learning_rate": 3.806330394377556e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19419294595718384,
"step": 1515,
"valid_targets_mean": 1379.4,
"valid_targets_min": 615
},
{
"epoch": 1.596638655462185,
"grad_norm": 0.8568638447176881,
"learning_rate": 3.8040753023253956e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2107909917831421,
"step": 1520,
"valid_targets_mean": 1158.2,
"valid_targets_min": 593
},
{
"epoch": 1.601890756302521,
"grad_norm": 0.6995773260097756,
"learning_rate": 3.801807832968912e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1988203525543213,
"step": 1525,
"valid_targets_mean": 1543.1,
"valid_targets_min": 704
},
{
"epoch": 1.6071428571428572,
"grad_norm": 0.7456785948304131,
"learning_rate": 3.799528001864637e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17537815868854523,
"step": 1530,
"valid_targets_mean": 1300.1,
"valid_targets_min": 722
},
{
"epoch": 1.6123949579831933,
"grad_norm": 0.8087741971757628,
"learning_rate": 3.797235824653918e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20719020068645477,
"step": 1535,
"valid_targets_mean": 1401.3,
"valid_targets_min": 642
},
{
"epoch": 1.6176470588235294,
"grad_norm": 0.7888860351461294,
"learning_rate": 3.7949313170628006e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2095479965209961,
"step": 1540,
"valid_targets_mean": 1436.8,
"valid_targets_min": 518
},
{
"epoch": 1.6228991596638656,
"grad_norm": 0.767345470182285,
"learning_rate": 3.79261449490193e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22027720510959625,
"step": 1545,
"valid_targets_mean": 1531.6,
"valid_targets_min": 728
},
{
"epoch": 1.6281512605042017,
"grad_norm": 0.8137805205710857,
"learning_rate": 3.7902853740664356e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21532106399536133,
"step": 1550,
"valid_targets_mean": 1469.6,
"valid_targets_min": 764
},
{
"epoch": 1.6334033613445378,
"grad_norm": 0.9016471374390324,
"learning_rate": 3.7879439705358286e-05,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23087842762470245,
"step": 1555,
"valid_targets_mean": 1437.8,
"valid_targets_min": 818
},
{
"epoch": 1.638655462184874,
"grad_norm": 0.8353128948745288,
"learning_rate": 3.785590300373884e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2092447727918625,
"step": 1560,
"valid_targets_mean": 1327.3,
"valid_targets_min": 625
},
{
"epoch": 1.64390756302521,
"grad_norm": 0.868105384855138,
"learning_rate": 3.7832243797285385e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21071121096611023,
"step": 1565,
"valid_targets_mean": 1685.2,
"valid_targets_min": 790
},
{
"epoch": 1.6491596638655461,
"grad_norm": 0.7919143845079746,
"learning_rate": 3.780846224831775e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2265183925628662,
"step": 1570,
"valid_targets_mean": 1595.3,
"valid_targets_min": 891
},
{
"epoch": 1.6544117647058822,
"grad_norm": 0.7549544772773371,
"learning_rate": 3.7784558519995135e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18298515677452087,
"step": 1575,
"valid_targets_mean": 1381.1,
"valid_targets_min": 719
},
{
"epoch": 1.6596638655462184,
"grad_norm": 0.804144396397427,
"learning_rate": 3.776053277631496e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1860344111919403,
"step": 1580,
"valid_targets_mean": 1345.7,
"valid_targets_min": 657
},
{
"epoch": 1.6649159663865545,
"grad_norm": 0.9064506425487462,
"learning_rate": 3.7736385182111785e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20600754022598267,
"step": 1585,
"valid_targets_mean": 1342.1,
"valid_targets_min": 783
},
{
"epoch": 1.6701680672268906,
"grad_norm": 0.8588049760182106,
"learning_rate": 3.771211590305614e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1966136246919632,
"step": 1590,
"valid_targets_mean": 1450.6,
"valid_targets_min": 629
},
{
"epoch": 1.675420168067227,
"grad_norm": 0.7948243288514434,
"learning_rate": 3.768772510565342e-05,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2040775567293167,
"step": 1595,
"valid_targets_mean": 1461.3,
"valid_targets_min": 678
},
{
"epoch": 1.680672268907563,
"grad_norm": 0.8255403927136926,
"learning_rate": 3.76632129572427e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20673060417175293,
"step": 1600,
"valid_targets_mean": 1723.1,
"valid_targets_min": 1075
},
{
"epoch": 1.6859243697478992,
"grad_norm": 0.7484827437017396,
"learning_rate": 3.763857962599565e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20060554146766663,
"step": 1605,
"valid_targets_mean": 1669.1,
"valid_targets_min": 816
},
{
"epoch": 1.6911764705882353,
"grad_norm": 0.7780511290517912,
"learning_rate": 3.761382528091531e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21109002828598022,
"step": 1610,
"valid_targets_mean": 1521.4,
"valid_targets_min": 957
},
{
"epoch": 1.6964285714285714,
"grad_norm": 0.8261801428366944,
"learning_rate": 3.7588950091834986e-05,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18024760484695435,
"step": 1615,
"valid_targets_mean": 1282.1,
"valid_targets_min": 643
},
{
"epoch": 1.7016806722689075,
"grad_norm": 0.7650069206711103,
"learning_rate": 3.756395422941706e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20178046822547913,
"step": 1620,
"valid_targets_mean": 1499.7,
"valid_targets_min": 726
},
{
"epoch": 1.7069327731092439,
"grad_norm": 0.7087222035820604,
"learning_rate": 3.753883786515181e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19103536009788513,
"step": 1625,
"valid_targets_mean": 1621.1,
"valid_targets_min": 705
},
{
"epoch": 1.71218487394958,
"grad_norm": 0.8887563433958335,
"learning_rate": 3.751360117135628e-05,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20276349782943726,
"step": 1630,
"valid_targets_mean": 1390.9,
"valid_targets_min": 700
},
{
"epoch": 1.717436974789916,
"grad_norm": 0.8362395348050953,
"learning_rate": 3.7488244321173025e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18552342057228088,
"step": 1635,
"valid_targets_mean": 1254.4,
"valid_targets_min": 627
},
{
"epoch": 1.7226890756302522,
"grad_norm": 0.8655931910128335,
"learning_rate": 3.746276748856898e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18865495920181274,
"step": 1640,
"valid_targets_mean": 1479.2,
"valid_targets_min": 817
},
{
"epoch": 1.7279411764705883,
"grad_norm": 0.792892975194453,
"learning_rate": 3.743717084833425e-05,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19585290551185608,
"step": 1645,
"valid_targets_mean": 1464.4,
"valid_targets_min": 974
},
{
"epoch": 1.7331932773109244,
"grad_norm": 0.779810593913834,
"learning_rate": 3.741145457608093e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20523177087306976,
"step": 1650,
"valid_targets_mean": 1381.2,
"valid_targets_min": 657
},
{
"epoch": 1.7384453781512605,
"grad_norm": 0.7826687066418191,
"learning_rate": 3.738561884824183e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20436634123325348,
"step": 1655,
"valid_targets_mean": 1486.0,
"valid_targets_min": 746
},
{
"epoch": 1.7436974789915967,
"grad_norm": 0.7652636064297311,
"learning_rate": 3.735966384206936e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20646733045578003,
"step": 1660,
"valid_targets_mean": 1459.7,
"valid_targets_min": 739
},
{
"epoch": 1.7489495798319328,
"grad_norm": 0.7655125678378137,
"learning_rate": 3.733358973563425e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18100708723068237,
"step": 1665,
"valid_targets_mean": 1397.0,
"valid_targets_min": 682
},
{
"epoch": 1.754201680672269,
"grad_norm": 0.7963580538812527,
"learning_rate": 3.730739670782435e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19578437507152557,
"step": 1670,
"valid_targets_mean": 1288.8,
"valid_targets_min": 703
},
{
"epoch": 1.759453781512605,
"grad_norm": 0.8662683116944544,
"learning_rate": 3.72810849383434e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18982970714569092,
"step": 1675,
"valid_targets_mean": 1446.1,
"valid_targets_min": 864
},
{
"epoch": 1.7647058823529411,
"grad_norm": 0.783041949999934,
"learning_rate": 3.725465460770978e-05,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25431910157203674,
"step": 1680,
"valid_targets_mean": 1673.2,
"valid_targets_min": 734
},
{
"epoch": 1.7699579831932772,
"grad_norm": 0.7217643791824649,
"learning_rate": 3.7228105897255324e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2004881650209427,
"step": 1685,
"valid_targets_mean": 1598.7,
"valid_targets_min": 607
},
{
"epoch": 1.7752100840336134,
"grad_norm": 0.7436378042988409,
"learning_rate": 3.7201438989124e-05,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1999681144952774,
"step": 1690,
"valid_targets_mean": 1445.2,
"valid_targets_min": 551
},
{
"epoch": 1.7804621848739495,
"grad_norm": 0.7501915605313334,
"learning_rate": 3.717465406627074e-05,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20576688647270203,
"step": 1695,
"valid_targets_mean": 1552.2,
"valid_targets_min": 791
},
{
"epoch": 1.7857142857142856,
"grad_norm": 0.7628246639482904,
"learning_rate": 3.714775131246011e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20440012216567993,
"step": 1700,
"valid_targets_mean": 1511.6,
"valid_targets_min": 825
},
{
"epoch": 1.7909663865546217,
"grad_norm": 0.7246985646816825,
"learning_rate": 3.71207309122651e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20958301424980164,
"step": 1705,
"valid_targets_mean": 1489.3,
"valid_targets_min": 859
},
{
"epoch": 1.7962184873949578,
"grad_norm": 0.8076167406390439,
"learning_rate": 3.709359305106585e-05,
"loss": 0.1866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18848812580108643,
"step": 1710,
"valid_targets_mean": 1356.9,
"valid_targets_min": 737
},
{
"epoch": 1.8014705882352942,
"grad_norm": 0.7618349813747334,
"learning_rate": 3.7066337915048354e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19808264076709747,
"step": 1715,
"valid_targets_mean": 1359.9,
"valid_targets_min": 791
},
{
"epoch": 1.8067226890756303,
"grad_norm": 0.8211165193393286,
"learning_rate": 3.7038965691203205e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20665648579597473,
"step": 1720,
"valid_targets_mean": 1443.4,
"valid_targets_min": 724
},
{
"epoch": 1.8119747899159664,
"grad_norm": 1.5195639624253412,
"learning_rate": 3.701147656732431e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18661421537399292,
"step": 1725,
"valid_targets_mean": 1376.3,
"valid_targets_min": 944
},
{
"epoch": 1.8172268907563025,
"grad_norm": 1.3672377372582318,
"learning_rate": 3.6983870732007596e-05,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.171901673078537,
"step": 1730,
"valid_targets_mean": 1597.7,
"valid_targets_min": 802
},
{
"epoch": 1.8224789915966386,
"grad_norm": 0.7029694603857538,
"learning_rate": 3.695614837464972e-05,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18585661053657532,
"step": 1735,
"valid_targets_mean": 1419.2,
"valid_targets_min": 740
},
{
"epoch": 1.8277310924369747,
"grad_norm": 0.7128079074101666,
"learning_rate": 3.692830968544675e-05,
"loss": 0.192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1792781949043274,
"step": 1740,
"valid_targets_mean": 1570.5,
"valid_targets_min": 881
},
{
"epoch": 1.832983193277311,
"grad_norm": 0.7873525110103127,
"learning_rate": 3.690035485539291e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18637944757938385,
"step": 1745,
"valid_targets_mean": 1177.1,
"valid_targets_min": 636
},
{
"epoch": 1.8382352941176472,
"grad_norm": 0.812792057458698,
"learning_rate": 3.6872284076279205e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18359485268592834,
"step": 1750,
"valid_targets_mean": 1280.1,
"valid_targets_min": 814
},
{
"epoch": 1.8434873949579833,
"grad_norm": 0.7516261504287793,
"learning_rate": 3.684409754069215e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18630534410476685,
"step": 1755,
"valid_targets_mean": 1253.6,
"valid_targets_min": 604
},
{
"epoch": 1.8487394957983194,
"grad_norm": 0.7873312358062879,
"learning_rate": 3.681579544201244e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1809154450893402,
"step": 1760,
"valid_targets_mean": 1232.8,
"valid_targets_min": 661
},
{
"epoch": 1.8539915966386555,
"grad_norm": 0.7042638950908449,
"learning_rate": 3.6787377974413614e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1879248321056366,
"step": 1765,
"valid_targets_mean": 1484.8,
"valid_targets_min": 728
},
{
"epoch": 1.8592436974789917,
"grad_norm": 0.8708411897151677,
"learning_rate": 3.6758845332860734e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2018292248249054,
"step": 1770,
"valid_targets_mean": 1383.6,
"valid_targets_min": 692
},
{
"epoch": 1.8644957983193278,
"grad_norm": 0.727245204127273,
"learning_rate": 3.673019771310903e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19675494730472565,
"step": 1775,
"valid_targets_mean": 1386.2,
"valid_targets_min": 840
},
{
"epoch": 1.8697478991596639,
"grad_norm": 0.769303157042911,
"learning_rate": 3.670143531170258e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.200996533036232,
"step": 1780,
"valid_targets_mean": 1375.6,
"valid_targets_min": 772
},
{
"epoch": 1.875,
"grad_norm": 0.6945199303988268,
"learning_rate": 3.667255832597294e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19052547216415405,
"step": 1785,
"valid_targets_mean": 1612.4,
"valid_targets_min": 670
},
{
"epoch": 1.8802521008403361,
"grad_norm": 0.7679602226980033,
"learning_rate": 3.664356695403781e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18414106965065002,
"step": 1790,
"valid_targets_mean": 1427.0,
"valid_targets_min": 750
},
{
"epoch": 1.8855042016806722,
"grad_norm": 0.7707612142751945,
"learning_rate": 3.661446139479965e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20061108469963074,
"step": 1795,
"valid_targets_mean": 1479.3,
"valid_targets_min": 766
},
{
"epoch": 1.8907563025210083,
"grad_norm": 0.8561024756443094,
"learning_rate": 3.658524184794436e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16889707744121552,
"step": 1800,
"valid_targets_mean": 1241.5,
"valid_targets_min": 729
},
{
"epoch": 1.8960084033613445,
"grad_norm": 0.7618847795685194,
"learning_rate": 3.655590851393984e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20724733173847198,
"step": 1805,
"valid_targets_mean": 1410.9,
"valid_targets_min": 682
},
{
"epoch": 1.9012605042016806,
"grad_norm": 0.7752684468128507,
"learning_rate": 3.652646159403468e-05,
"loss": 0.206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20427414774894714,
"step": 1810,
"valid_targets_mean": 1569.1,
"valid_targets_min": 738
},
{
"epoch": 1.9065126050420167,
"grad_norm": 0.7353501689368992,
"learning_rate": 3.649690129025675e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2081902176141739,
"step": 1815,
"valid_targets_mean": 1378.0,
"valid_targets_min": 731
},
{
"epoch": 1.9117647058823528,
"grad_norm": 0.7289002335110303,
"learning_rate": 3.6467227805411824e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21570971608161926,
"step": 1820,
"valid_targets_mean": 1620.0,
"valid_targets_min": 748
},
{
"epoch": 1.917016806722689,
"grad_norm": 0.7240815176489389,
"learning_rate": 3.6437441343082174e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18155962228775024,
"step": 1825,
"valid_targets_mean": 1355.1,
"valid_targets_min": 564
},
{
"epoch": 1.9222689075630253,
"grad_norm": 0.7462727456723074,
"learning_rate": 3.6407542107625167e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18159963190555573,
"step": 1830,
"valid_targets_mean": 1419.1,
"valid_targets_min": 651
},
{
"epoch": 1.9275210084033614,
"grad_norm": 0.9386783714270683,
"learning_rate": 3.637753030417192e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18306277692317963,
"step": 1835,
"valid_targets_mean": 1291.7,
"valid_targets_min": 687
},
{
"epoch": 1.9327731092436975,
"grad_norm": 0.725039331848806,
"learning_rate": 3.6347406138625805e-05,
"loss": 0.1896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17465978860855103,
"step": 1840,
"valid_targets_mean": 1236.8,
"valid_targets_min": 703
},
{
"epoch": 1.9380252100840336,
"grad_norm": 0.7526079231589902,
"learning_rate": 3.631716981766111e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16068580746650696,
"step": 1845,
"valid_targets_mean": 1258.9,
"valid_targets_min": 522
},
{
"epoch": 1.9432773109243697,
"grad_norm": 0.7599278884583646,
"learning_rate": 3.6286821548721594e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1918371468782425,
"step": 1850,
"valid_targets_mean": 1495.5,
"valid_targets_min": 764
},
{
"epoch": 1.9485294117647058,
"grad_norm": 0.7979519291571235,
"learning_rate": 3.625636154001904e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21574504673480988,
"step": 1855,
"valid_targets_mean": 1421.0,
"valid_targets_min": 548
},
{
"epoch": 1.9537815126050422,
"grad_norm": 0.7338015635554208,
"learning_rate": 3.622579000053186e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20440888404846191,
"step": 1860,
"valid_targets_mean": 1487.2,
"valid_targets_min": 694
},
{
"epoch": 1.9590336134453783,
"grad_norm": 0.7129631803753865,
"learning_rate": 3.619510714000368e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2010660171508789,
"step": 1865,
"valid_targets_mean": 1512.4,
"valid_targets_min": 823
},
{
"epoch": 1.9642857142857144,
"grad_norm": 0.6958574230399347,
"learning_rate": 3.616431316894181e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15293735265731812,
"step": 1870,
"valid_targets_mean": 1375.4,
"valid_targets_min": 595
},
{
"epoch": 1.9695378151260505,
"grad_norm": 0.8984376849635196,
"learning_rate": 3.613340829861592e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2001931369304657,
"step": 1875,
"valid_targets_mean": 1401.2,
"valid_targets_min": 693
},
{
"epoch": 1.9747899159663866,
"grad_norm": 0.796278651195792,
"learning_rate": 3.61023927410565e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18896615505218506,
"step": 1880,
"valid_targets_mean": 1185.6,
"valid_targets_min": 720
},
{
"epoch": 1.9800420168067228,
"grad_norm": 0.6919750871597347,
"learning_rate": 3.607126670905346e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16711284220218658,
"step": 1885,
"valid_targets_mean": 1364.2,
"valid_targets_min": 685
},
{
"epoch": 1.9852941176470589,
"grad_norm": 0.6805728110467865,
"learning_rate": 3.60400304161546e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17011727392673492,
"step": 1890,
"valid_targets_mean": 1345.2,
"valid_targets_min": 658
},
{
"epoch": 1.990546218487395,
"grad_norm": 0.7601178723938317,
"learning_rate": 3.600868407666426e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18218779563903809,
"step": 1895,
"valid_targets_mean": 1431.4,
"valid_targets_min": 686
},
{
"epoch": 1.995798319327731,
"grad_norm": 0.6963519557748621,
"learning_rate": 3.597722790564172e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19570836424827576,
"step": 1900,
"valid_targets_mean": 1505.8,
"valid_targets_min": 713
},
{
"epoch": 2.0010504201680672,
"grad_norm": 0.8543332754648679,
"learning_rate": 3.5945662118899824e-05,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3345944881439209,
"step": 1905,
"valid_targets_mean": 2493.1,
"valid_targets_min": 954
},
{
"epoch": 2.0063025210084033,
"grad_norm": 0.6540945057835557,
"learning_rate": 3.5913986933003455e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2893906235694885,
"step": 1910,
"valid_targets_mean": 3336.9,
"valid_targets_min": 533
},
{
"epoch": 2.0115546218487395,
"grad_norm": 0.5859587843451456,
"learning_rate": 3.5882202565268046e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30491194128990173,
"step": 1915,
"valid_targets_mean": 3515.8,
"valid_targets_min": 1635
},
{
"epoch": 2.0168067226890756,
"grad_norm": 0.5848592413314749,
"learning_rate": 3.58503092337581e-05,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3176591992378235,
"step": 1920,
"valid_targets_mean": 3744.6,
"valid_targets_min": 777
},
{
"epoch": 2.0220588235294117,
"grad_norm": 0.5277378066045798,
"learning_rate": 3.5818307157285705e-05,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2889269292354584,
"step": 1925,
"valid_targets_mean": 4188.5,
"valid_targets_min": 2187
},
{
"epoch": 2.027310924369748,
"grad_norm": 0.6598583479222365,
"learning_rate": 3.5786196555409006e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30424559116363525,
"step": 1930,
"valid_targets_mean": 3188.1,
"valid_targets_min": 1432
},
{
"epoch": 2.032563025210084,
"grad_norm": 0.6035540307689007,
"learning_rate": 3.575397764843073e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2632938027381897,
"step": 1935,
"valid_targets_mean": 3703.5,
"valid_targets_min": 767
},
{
"epoch": 2.03781512605042,
"grad_norm": 0.6545986679555346,
"learning_rate": 3.572165065739664e-05,
"loss": 0.2807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2869631052017212,
"step": 1940,
"valid_targets_mean": 3793.3,
"valid_targets_min": 1488
},
{
"epoch": 2.043067226890756,
"grad_norm": 0.5266355858459322,
"learning_rate": 3.5689215804094053e-05,
"loss": 0.2847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2697930932044983,
"step": 1945,
"valid_targets_mean": 3814.2,
"valid_targets_min": 578
},
{
"epoch": 2.0483193277310923,
"grad_norm": 0.5529414922643042,
"learning_rate": 3.5656673311050285e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.298675537109375,
"step": 1950,
"valid_targets_mean": 3997.1,
"valid_targets_min": 1241
},
{
"epoch": 2.0535714285714284,
"grad_norm": 0.5889438843034916,
"learning_rate": 3.562402340153115e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3097384572029114,
"step": 1955,
"valid_targets_mean": 3797.0,
"valid_targets_min": 807
},
{
"epoch": 2.0588235294117645,
"grad_norm": 0.4888383801769635,
"learning_rate": 3.559126629953942e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2800885736942291,
"step": 1960,
"valid_targets_mean": 5091.3,
"valid_targets_min": 2061
},
{
"epoch": 2.064075630252101,
"grad_norm": 0.5549566154812772,
"learning_rate": 3.5558402229813287e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28934812545776367,
"step": 1965,
"valid_targets_mean": 4230.9,
"valid_targets_min": 1329
},
{
"epoch": 2.069327731092437,
"grad_norm": 0.5836584192752005,
"learning_rate": 3.552543141782483e-05,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2896938621997833,
"step": 1970,
"valid_targets_mean": 3577.5,
"valid_targets_min": 1412
},
{
"epoch": 2.0745798319327733,
"grad_norm": 0.6187434500702056,
"learning_rate": 3.549235408977843e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2899538576602936,
"step": 1975,
"valid_targets_mean": 3247.0,
"valid_targets_min": 1334
},
{
"epoch": 2.0798319327731094,
"grad_norm": 0.5443173852803067,
"learning_rate": 3.545917047260928e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27411580085754395,
"step": 1980,
"valid_targets_mean": 4207.9,
"valid_targets_min": 1847
},
{
"epoch": 2.0850840336134455,
"grad_norm": 0.6049544183292745,
"learning_rate": 3.542588079398179e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2940400540828705,
"step": 1985,
"valid_targets_mean": 3505.8,
"valid_targets_min": 1040
},
{
"epoch": 2.0903361344537816,
"grad_norm": 0.6603766972468182,
"learning_rate": 3.539248528228801e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3235289454460144,
"step": 1990,
"valid_targets_mean": 3247.1,
"valid_targets_min": 1269
},
{
"epoch": 2.0955882352941178,
"grad_norm": 0.6507849332876462,
"learning_rate": 3.535898416664611e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29736390709877014,
"step": 1995,
"valid_targets_mean": 2779.6,
"valid_targets_min": 1041
},
{
"epoch": 2.100840336134454,
"grad_norm": 0.6263414769134444,
"learning_rate": 3.5325377676898766e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30523204803466797,
"step": 2000,
"valid_targets_mean": 2963.0,
"valid_targets_min": 1291
},
{
"epoch": 2.10609243697479,
"grad_norm": 0.7168587293071478,
"learning_rate": 3.529166604361161e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3294321298599243,
"step": 2005,
"valid_targets_mean": 2588.5,
"valid_targets_min": 1285
},
{
"epoch": 2.111344537815126,
"grad_norm": 0.7408150111837036,
"learning_rate": 3.525784949807162e-05,
"loss": 0.2856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28167465329170227,
"step": 2010,
"valid_targets_mean": 3554.5,
"valid_targets_min": 865
},
{
"epoch": 2.116596638655462,
"grad_norm": 0.6431903275157029,
"learning_rate": 3.522392827228557e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769734561443329,
"step": 2015,
"valid_targets_mean": 2872.8,
"valid_targets_min": 958
},
{
"epoch": 2.1218487394957983,
"grad_norm": 0.6159459227356286,
"learning_rate": 3.518990259897841e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30407899618148804,
"step": 2020,
"valid_targets_mean": 3317.6,
"valid_targets_min": 771
},
{
"epoch": 2.1271008403361344,
"grad_norm": 0.5523195230692622,
"learning_rate": 3.515577271159167e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2792849838733673,
"step": 2025,
"valid_targets_mean": 3849.6,
"valid_targets_min": 1631
},
{
"epoch": 2.1323529411764706,
"grad_norm": 0.5889011467855694,
"learning_rate": 3.512153884428188e-05,
"loss": 0.2929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2551637589931488,
"step": 2030,
"valid_targets_mean": 3065.6,
"valid_targets_min": 908
},
{
"epoch": 2.1376050420168067,
"grad_norm": 0.6584415672877822,
"learning_rate": 3.5087201231918944e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2937019467353821,
"step": 2035,
"valid_targets_mean": 2962.0,
"valid_targets_min": 1264
},
{
"epoch": 2.142857142857143,
"grad_norm": 0.5843888599963277,
"learning_rate": 3.505276011008454e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29179146885871887,
"step": 2040,
"valid_targets_mean": 3853.1,
"valid_targets_min": 1889
},
{
"epoch": 2.148109243697479,
"grad_norm": 0.6018556070826566,
"learning_rate": 3.501821571507048e-05,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27817726135253906,
"step": 2045,
"valid_targets_mean": 3645.2,
"valid_targets_min": 1075
},
{
"epoch": 2.153361344537815,
"grad_norm": 0.7369039817083102,
"learning_rate": 3.498356828387714e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28218644857406616,
"step": 2050,
"valid_targets_mean": 2874.9,
"valid_targets_min": 1036
},
{
"epoch": 2.158613445378151,
"grad_norm": 0.5740508320378505,
"learning_rate": 3.494881805421176e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2825021743774414,
"step": 2055,
"valid_targets_mean": 3808.9,
"valid_targets_min": 1162
},
{
"epoch": 2.1638655462184873,
"grad_norm": 0.6677586403458295,
"learning_rate": 3.4913965264486894e-05,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2949675917625427,
"step": 2060,
"valid_targets_mean": 3164.9,
"valid_targets_min": 1281
},
{
"epoch": 2.1691176470588234,
"grad_norm": 0.583170841394605,
"learning_rate": 3.48790101538187e-05,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2632118761539459,
"step": 2065,
"valid_targets_mean": 3503.5,
"valid_targets_min": 1841
},
{
"epoch": 2.1743697478991595,
"grad_norm": 0.6659128870236808,
"learning_rate": 3.484395296202537e-05,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30187827348709106,
"step": 2070,
"valid_targets_mean": 3121.7,
"valid_targets_min": 1629
},
{
"epoch": 2.1796218487394956,
"grad_norm": 0.7188591131831868,
"learning_rate": 3.480879392962541e-05,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2901453971862793,
"step": 2075,
"valid_targets_mean": 2668.6,
"valid_targets_min": 1254
},
{
"epoch": 2.184873949579832,
"grad_norm": 0.7182569920584896,
"learning_rate": 3.477353329783606e-05,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30515027046203613,
"step": 2080,
"valid_targets_mean": 3032.6,
"valid_targets_min": 1774
},
{
"epoch": 2.190126050420168,
"grad_norm": 0.678604840038963,
"learning_rate": 3.4738171308571595e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2986491322517395,
"step": 2085,
"valid_targets_mean": 3079.8,
"valid_targets_min": 1643
},
{
"epoch": 2.1953781512605044,
"grad_norm": 0.6392734138959271,
"learning_rate": 3.470270820444168e-05,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3071242570877075,
"step": 2090,
"valid_targets_mean": 3021.6,
"valid_targets_min": 1244
},
{
"epoch": 2.2006302521008405,
"grad_norm": 0.585164572193224,
"learning_rate": 3.4667144228749697e-05,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2744428515434265,
"step": 2095,
"valid_targets_mean": 3588.4,
"valid_targets_min": 959
},
{
"epoch": 2.2058823529411766,
"grad_norm": 0.5843477775486158,
"learning_rate": 3.463147962549109e-05,
"loss": 0.2826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2655976414680481,
"step": 2100,
"valid_targets_mean": 3404.8,
"valid_targets_min": 2037
},
{
"epoch": 2.2111344537815127,
"grad_norm": 0.5703037332493616,
"learning_rate": 3.459571463935168e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898704409599304,
"step": 2105,
"valid_targets_mean": 3745.2,
"valid_targets_min": 1168
},
{
"epoch": 2.216386554621849,
"grad_norm": 0.6261977462323101,
"learning_rate": 3.455984951570598e-05,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2655256390571594,
"step": 2110,
"valid_targets_mean": 3479.8,
"valid_targets_min": 1700
},
{
"epoch": 2.221638655462185,
"grad_norm": 0.6273371865248328,
"learning_rate": 3.452388450061556e-05,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25678104162216187,
"step": 2115,
"valid_targets_mean": 2905.8,
"valid_targets_min": 1261
},
{
"epoch": 2.226890756302521,
"grad_norm": 0.6154152263889715,
"learning_rate": 3.448781984082727e-05,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2871716022491455,
"step": 2120,
"valid_targets_mean": 3363.2,
"valid_targets_min": 1124
},
{
"epoch": 2.232142857142857,
"grad_norm": 0.6237253157214722,
"learning_rate": 3.4451655783771625e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2972951829433441,
"step": 2125,
"valid_targets_mean": 3210.6,
"valid_targets_min": 1361
},
{
"epoch": 2.2373949579831933,
"grad_norm": 0.5944182232171416,
"learning_rate": 3.4415392577561064e-05,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26949986815452576,
"step": 2130,
"valid_targets_mean": 2948.4,
"valid_targets_min": 1555
},
{
"epoch": 2.2426470588235294,
"grad_norm": 0.6239663761256676,
"learning_rate": 3.4379030470988285e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31491410732269287,
"step": 2135,
"valid_targets_mean": 3311.2,
"valid_targets_min": 1739
},
{
"epoch": 2.2478991596638656,
"grad_norm": 0.6358976127732551,
"learning_rate": 3.4342569713524496e-05,
"loss": 0.278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2920129895210266,
"step": 2140,
"valid_targets_mean": 3192.8,
"valid_targets_min": 1278
},
{
"epoch": 2.2531512605042017,
"grad_norm": 0.534574837437247,
"learning_rate": 3.4306010555317735e-05,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2571936249732971,
"step": 2145,
"valid_targets_mean": 3951.6,
"valid_targets_min": 1522
},
{
"epoch": 2.258403361344538,
"grad_norm": 0.6364635502715449,
"learning_rate": 3.4269353247191135e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28747859597206116,
"step": 2150,
"valid_targets_mean": 3641.8,
"valid_targets_min": 464
},
{
"epoch": 2.263655462184874,
"grad_norm": 0.5854458561363409,
"learning_rate": 3.423259804064122e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2922632098197937,
"step": 2155,
"valid_targets_mean": 3598.4,
"valid_targets_min": 1003
},
{
"epoch": 2.26890756302521,
"grad_norm": 0.6600515244262581,
"learning_rate": 3.419574518783616e-05,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2910274267196655,
"step": 2160,
"valid_targets_mean": 3158.1,
"valid_targets_min": 1632
},
{
"epoch": 2.274159663865546,
"grad_norm": 0.6099216472379927,
"learning_rate": 3.4158794941614055e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2801975905895233,
"step": 2165,
"valid_targets_mean": 3131.9,
"valid_targets_min": 1256
},
{
"epoch": 2.2794117647058822,
"grad_norm": 0.6173217093072781,
"learning_rate": 3.4121747555481216e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2909969091415405,
"step": 2170,
"valid_targets_mean": 3894.9,
"valid_targets_min": 1336
},
{
"epoch": 2.2846638655462184,
"grad_norm": 0.5395127043883584,
"learning_rate": 3.4084603283610365e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2728331685066223,
"step": 2175,
"valid_targets_mean": 4360.4,
"valid_targets_min": 1651
},
{
"epoch": 2.2899159663865545,
"grad_norm": 0.6332732127944597,
"learning_rate": 3.404736238083897e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2798515558242798,
"step": 2180,
"valid_targets_mean": 2921.1,
"valid_targets_min": 644
},
{
"epoch": 2.2951680672268906,
"grad_norm": 0.7961507640330674,
"learning_rate": 3.401002510266744e-05,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26711398363113403,
"step": 2185,
"valid_targets_mean": 2848.1,
"valid_targets_min": 1397
},
{
"epoch": 2.3004201680672267,
"grad_norm": 0.6593038634993043,
"learning_rate": 3.397259170525739e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28789085149765015,
"step": 2190,
"valid_targets_mean": 2673.2,
"valid_targets_min": 1557
},
{
"epoch": 2.3056722689075633,
"grad_norm": 0.6958476283104791,
"learning_rate": 3.393506244542991e-05,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.292041540145874,
"step": 2195,
"valid_targets_mean": 2930.8,
"valid_targets_min": 1405
},
{
"epoch": 2.310924369747899,
"grad_norm": 0.6218694808083172,
"learning_rate": 3.389743758066374e-05,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2553059458732605,
"step": 2200,
"valid_targets_mean": 3421.8,
"valid_targets_min": 1042
},
{
"epoch": 2.3161764705882355,
"grad_norm": 0.6961575232099882,
"learning_rate": 3.385971736909357e-05,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27729037404060364,
"step": 2205,
"valid_targets_mean": 3172.2,
"valid_targets_min": 858
},
{
"epoch": 2.3214285714285716,
"grad_norm": 0.6655059432652326,
"learning_rate": 3.382190206950822e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27774959802627563,
"step": 2210,
"valid_targets_mean": 3166.3,
"valid_targets_min": 1288
},
{
"epoch": 2.3266806722689077,
"grad_norm": 0.5920405087936736,
"learning_rate": 3.3783991941348916e-05,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2696320414543152,
"step": 2215,
"valid_targets_mean": 3645.1,
"valid_targets_min": 1915
},
{
"epoch": 2.331932773109244,
"grad_norm": 0.6019837190284246,
"learning_rate": 3.374598724470745e-05,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2848033010959625,
"step": 2220,
"valid_targets_mean": 3868.2,
"valid_targets_min": 1501
},
{
"epoch": 2.33718487394958,
"grad_norm": 0.6419175889567692,
"learning_rate": 3.370788824032441e-05,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27997952699661255,
"step": 2225,
"valid_targets_mean": 2992.5,
"valid_targets_min": 1255
},
{
"epoch": 2.342436974789916,
"grad_norm": 0.6429288935922298,
"learning_rate": 3.366969518958746e-05,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29206526279449463,
"step": 2230,
"valid_targets_mean": 3205.4,
"valid_targets_min": 1586
},
{
"epoch": 2.347689075630252,
"grad_norm": 0.5926026217237049,
"learning_rate": 3.363140835452945e-05,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542131543159485,
"step": 2235,
"valid_targets_mean": 3410.4,
"valid_targets_min": 1181
},
{
"epoch": 2.3529411764705883,
"grad_norm": 0.6805026667731596,
"learning_rate": 3.3593027997826654e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26993298530578613,
"step": 2240,
"valid_targets_mean": 2876.6,
"valid_targets_min": 1428
},
{
"epoch": 2.3581932773109244,
"grad_norm": 0.6149224206718514,
"learning_rate": 3.355455438279702e-05,
"loss": 0.2674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27489912509918213,
"step": 2245,
"valid_targets_mean": 3850.8,
"valid_targets_min": 1708
},
{
"epoch": 2.3634453781512605,
"grad_norm": 0.7148223911895215,
"learning_rate": 3.351598777339827e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31252795457839966,
"step": 2250,
"valid_targets_mean": 3311.1,
"valid_targets_min": 1171
},
{
"epoch": 2.3686974789915967,
"grad_norm": 0.6343777416548871,
"learning_rate": 3.3477328434226164e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894600033760071,
"step": 2255,
"valid_targets_mean": 3490.8,
"valid_targets_min": 1834
},
{
"epoch": 2.3739495798319328,
"grad_norm": 0.5713389821309428,
"learning_rate": 3.343857663051264e-05,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28061312437057495,
"step": 2260,
"valid_targets_mean": 4200.2,
"valid_targets_min": 1529
},
{
"epoch": 2.379201680672269,
"grad_norm": 0.6593813910051031,
"learning_rate": 3.339973262812403e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28659868240356445,
"step": 2265,
"valid_targets_mean": 3408.4,
"valid_targets_min": 845
},
{
"epoch": 2.384453781512605,
"grad_norm": 0.5688545517719381,
"learning_rate": 3.336079669355921e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2584436535835266,
"step": 2270,
"valid_targets_mean": 3692.9,
"valid_targets_min": 2113
},
{
"epoch": 2.389705882352941,
"grad_norm": 0.6802358237019724,
"learning_rate": 3.332176909394777e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3029017448425293,
"step": 2275,
"valid_targets_mean": 2837.8,
"valid_targets_min": 802
},
{
"epoch": 2.3949579831932772,
"grad_norm": 0.6451243325404382,
"learning_rate": 3.3282650097048206e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26884186267852783,
"step": 2280,
"valid_targets_mean": 3303.2,
"valid_targets_min": 1433
},
{
"epoch": 2.4002100840336134,
"grad_norm": 0.7202674984435038,
"learning_rate": 3.324343997124606e-05,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3011503219604492,
"step": 2285,
"valid_targets_mean": 3398.4,
"valid_targets_min": 1035
},
{
"epoch": 2.4054621848739495,
"grad_norm": 0.6862578318316971,
"learning_rate": 3.3204138985552094e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28322312235832214,
"step": 2290,
"valid_targets_mean": 2917.6,
"valid_targets_min": 637
},
{
"epoch": 2.4107142857142856,
"grad_norm": 0.6876766550885656,
"learning_rate": 3.316474740960041e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2967104911804199,
"step": 2295,
"valid_targets_mean": 3035.1,
"valid_targets_min": 814
},
{
"epoch": 2.4159663865546217,
"grad_norm": 0.603593965602333,
"learning_rate": 3.312526551364667e-05,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26389676332473755,
"step": 2300,
"valid_targets_mean": 3494.5,
"valid_targets_min": 1913
},
{
"epoch": 2.421218487394958,
"grad_norm": 0.6258585295206295,
"learning_rate": 3.308569356856616e-05,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644697427749634,
"step": 2305,
"valid_targets_mean": 3577.7,
"valid_targets_min": 1410
},
{
"epoch": 2.426470588235294,
"grad_norm": 0.6298839340403605,
"learning_rate": 3.3046031845851993e-05,
"loss": 0.2848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26435354351997375,
"step": 2310,
"valid_targets_mean": 3195.6,
"valid_targets_min": 1390
},
{
"epoch": 2.43172268907563,
"grad_norm": 0.6686960769778729,
"learning_rate": 3.3006280617613214e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.333891898393631,
"step": 2315,
"valid_targets_mean": 3242.2,
"valid_targets_min": 611
},
{
"epoch": 2.4369747899159666,
"grad_norm": 0.6994882884638276,
"learning_rate": 3.296644015657295e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29009950160980225,
"step": 2320,
"valid_targets_mean": 3322.3,
"valid_targets_min": 1451
},
{
"epoch": 2.4422268907563023,
"grad_norm": 0.6022542746468339,
"learning_rate": 3.292651073606652e-05,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24634996056556702,
"step": 2325,
"valid_targets_mean": 3026.8,
"valid_targets_min": 1459
},
{
"epoch": 2.447478991596639,
"grad_norm": 0.7597076620942451,
"learning_rate": 3.288649263003958e-05,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30025792121887207,
"step": 2330,
"valid_targets_mean": 2535.8,
"valid_targets_min": 999
},
{
"epoch": 2.452731092436975,
"grad_norm": 0.5901929232154103,
"learning_rate": 3.284638611304623e-05,
"loss": 0.2667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24954357743263245,
"step": 2335,
"valid_targets_mean": 3463.1,
"valid_targets_min": 1564
},
{
"epoch": 2.457983193277311,
"grad_norm": 0.6305958469820415,
"learning_rate": 3.280619146024714e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2825808525085449,
"step": 2340,
"valid_targets_mean": 3291.3,
"valid_targets_min": 1470
},
{
"epoch": 2.463235294117647,
"grad_norm": 0.6407328134623678,
"learning_rate": 3.2765908947407665e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26442772150039673,
"step": 2345,
"valid_targets_mean": 3654.3,
"valid_targets_min": 1935
},
{
"epoch": 2.4684873949579833,
"grad_norm": 0.6192241477472046,
"learning_rate": 3.2725538850895933e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25553327798843384,
"step": 2350,
"valid_targets_mean": 3334.8,
"valid_targets_min": 1375
},
{
"epoch": 2.4737394957983194,
"grad_norm": 0.5958070120631284,
"learning_rate": 3.268508144768096e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25967782735824585,
"step": 2355,
"valid_targets_mean": 3422.6,
"valid_targets_min": 1294
},
{
"epoch": 2.4789915966386555,
"grad_norm": 0.5693719485778825,
"learning_rate": 3.264453701533075e-05,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25220775604248047,
"step": 2360,
"valid_targets_mean": 3406.5,
"valid_targets_min": 1496
},
{
"epoch": 2.4842436974789917,
"grad_norm": 0.6509477999261548,
"learning_rate": 3.260390583201041e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27943873405456543,
"step": 2365,
"valid_targets_mean": 3359.4,
"valid_targets_min": 1333
},
{
"epoch": 2.4894957983193278,
"grad_norm": 0.6327828789713742,
"learning_rate": 3.2563188176480217e-05,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27448466420173645,
"step": 2370,
"valid_targets_mean": 3461.3,
"valid_targets_min": 2264
},
{
"epoch": 2.494747899159664,
"grad_norm": 0.6536523986307107,
"learning_rate": 3.252238432809368e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2812950015068054,
"step": 2375,
"valid_targets_mean": 3145.4,
"valid_targets_min": 1454
},
{
"epoch": 2.5,
"grad_norm": 0.6139150491194192,
"learning_rate": 3.2481494566795716e-05,
"loss": 0.2761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27129268646240234,
"step": 2380,
"valid_targets_mean": 3347.1,
"valid_targets_min": 1712
},
{
"epoch": 2.505252100840336,
"grad_norm": 0.6255364740679421,
"learning_rate": 3.244051917312061e-05,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2420213669538498,
"step": 2385,
"valid_targets_mean": 3450.1,
"valid_targets_min": 1433
},
{
"epoch": 2.5105042016806722,
"grad_norm": 0.5931305720132205,
"learning_rate": 3.239945842819018e-05,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606050372123718,
"step": 2390,
"valid_targets_mean": 3711.4,
"valid_targets_min": 1943
},
{
"epoch": 2.5157563025210083,
"grad_norm": 0.5818743103427734,
"learning_rate": 3.2358312613711804e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24495342373847961,
"step": 2395,
"valid_targets_mean": 3649.8,
"valid_targets_min": 1945
},
{
"epoch": 2.5210084033613445,
"grad_norm": 0.6430898542162261,
"learning_rate": 3.231708201197653e-05,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672806978225708,
"step": 2400,
"valid_targets_mean": 2710.3,
"valid_targets_min": 815
},
{
"epoch": 2.5262605042016806,
"grad_norm": 0.6238779450079466,
"learning_rate": 3.227576690585706e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29193007946014404,
"step": 2405,
"valid_targets_mean": 3416.9,
"valid_targets_min": 809
},
{
"epoch": 2.5315126050420167,
"grad_norm": 0.5995241914800916,
"learning_rate": 3.223436757880591e-05,
"loss": 0.2674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2675004005432129,
"step": 2410,
"valid_targets_mean": 3632.6,
"valid_targets_min": 1727
},
{
"epoch": 2.536764705882353,
"grad_norm": 0.6158294085854414,
"learning_rate": 3.219288431485337e-05,
"loss": 0.2642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2477218508720398,
"step": 2415,
"valid_targets_mean": 2918.1,
"valid_targets_min": 1622
},
{
"epoch": 2.542016806722689,
"grad_norm": 0.8470134075805191,
"learning_rate": 3.2151317398605646e-05,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1993420273065567,
"step": 2420,
"valid_targets_mean": 1337.4,
"valid_targets_min": 788
},
{
"epoch": 2.5472689075630255,
"grad_norm": 0.7459112191461049,
"learning_rate": 3.2109667115242815e-05,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18858204782009125,
"step": 2425,
"valid_targets_mean": 1537.9,
"valid_targets_min": 957
},
{
"epoch": 2.552521008403361,
"grad_norm": 0.764955976635607,
"learning_rate": 3.206793375051694e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17688506841659546,
"step": 2430,
"valid_targets_mean": 1386.6,
"valid_targets_min": 796
},
{
"epoch": 2.5577731092436977,
"grad_norm": 0.9461176823521338,
"learning_rate": 3.2026117590750086e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18542060256004333,
"step": 2435,
"valid_targets_mean": 1313.4,
"valid_targets_min": 697
},
{
"epoch": 2.5630252100840334,
"grad_norm": 0.7925028804553308,
"learning_rate": 3.198421892283235e-05,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18615254759788513,
"step": 2440,
"valid_targets_mean": 1576.1,
"valid_targets_min": 638
},
{
"epoch": 2.56827731092437,
"grad_norm": 0.7519556440109215,
"learning_rate": 3.1942238034219885e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18748995661735535,
"step": 2445,
"valid_targets_mean": 1508.0,
"valid_targets_min": 727
},
{
"epoch": 2.5735294117647056,
"grad_norm": 0.7720688633693402,
"learning_rate": 3.190017521293296e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16558489203453064,
"step": 2450,
"valid_targets_mean": 1276.2,
"valid_targets_min": 761
},
{
"epoch": 2.578781512605042,
"grad_norm": 0.8326618926243746,
"learning_rate": 3.185803074755395e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1751636564731598,
"step": 2455,
"valid_targets_mean": 1297.8,
"valid_targets_min": 714
},
{
"epoch": 2.5840336134453783,
"grad_norm": 0.7347796399611563,
"learning_rate": 3.1815804927225363e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1736968755722046,
"step": 2460,
"valid_targets_mean": 1447.1,
"valid_targets_min": 741
},
{
"epoch": 2.5892857142857144,
"grad_norm": 0.7982508928947285,
"learning_rate": 3.1773498041647876e-05,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20142167806625366,
"step": 2465,
"valid_targets_mean": 1720.9,
"valid_targets_min": 663
},
{
"epoch": 2.5945378151260505,
"grad_norm": 0.7855892482872033,
"learning_rate": 3.173111038107834e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18200182914733887,
"step": 2470,
"valid_targets_mean": 1435.6,
"valid_targets_min": 632
},
{
"epoch": 2.5997899159663866,
"grad_norm": 0.7759266996305735,
"learning_rate": 3.168864223632776e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17558130621910095,
"step": 2475,
"valid_targets_mean": 1619.9,
"valid_targets_min": 933
},
{
"epoch": 2.6050420168067228,
"grad_norm": 0.6783776091632051,
"learning_rate": 3.1646093898759334e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16645342111587524,
"step": 2480,
"valid_targets_mean": 1491.7,
"valid_targets_min": 717
},
{
"epoch": 2.610294117647059,
"grad_norm": 0.7711910637914073,
"learning_rate": 3.160346566028645e-05,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16639794409275055,
"step": 2485,
"valid_targets_mean": 1278.4,
"valid_targets_min": 659
},
{
"epoch": 2.615546218487395,
"grad_norm": 0.7139740512846204,
"learning_rate": 3.156075781337068e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15931686758995056,
"step": 2490,
"valid_targets_mean": 1346.2,
"valid_targets_min": 642
},
{
"epoch": 2.620798319327731,
"grad_norm": 0.7301516156278756,
"learning_rate": 3.1517970651019735e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1589939445257187,
"step": 2495,
"valid_targets_mean": 1324.8,
"valid_targets_min": 765
},
{
"epoch": 2.6260504201680672,
"grad_norm": 0.8269901402636304,
"learning_rate": 3.1475104466785536e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1824565976858139,
"step": 2500,
"valid_targets_mean": 1293.7,
"valid_targets_min": 631
},
{
"epoch": 2.6313025210084033,
"grad_norm": 0.8200023743718566,
"learning_rate": 3.143215955476211e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19661253690719604,
"step": 2505,
"valid_targets_mean": 1490.3,
"valid_targets_min": 623
},
{
"epoch": 2.6365546218487395,
"grad_norm": 0.7270060792013762,
"learning_rate": 3.138913620958365e-05,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1958092451095581,
"step": 2510,
"valid_targets_mean": 1748.8,
"valid_targets_min": 818
},
{
"epoch": 2.6418067226890756,
"grad_norm": 0.728759015109214,
"learning_rate": 3.134603472642244e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16739603877067566,
"step": 2515,
"valid_targets_mean": 1434.9,
"valid_targets_min": 776
},
{
"epoch": 2.6470588235294117,
"grad_norm": 0.8025983924576464,
"learning_rate": 3.1302855400986866e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17958450317382812,
"step": 2520,
"valid_targets_mean": 1402.4,
"valid_targets_min": 623
},
{
"epoch": 2.652310924369748,
"grad_norm": 0.7842835266150214,
"learning_rate": 3.1259598529519336e-05,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18177050352096558,
"step": 2525,
"valid_targets_mean": 1400.9,
"valid_targets_min": 693
},
{
"epoch": 2.657563025210084,
"grad_norm": 0.7753249562445936,
"learning_rate": 3.121626440879432e-05,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1475217640399933,
"step": 2530,
"valid_targets_mean": 1109.4,
"valid_targets_min": 611
},
{
"epoch": 2.66281512605042,
"grad_norm": 0.7722564104049819,
"learning_rate": 3.117285333611625e-05,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18021240830421448,
"step": 2535,
"valid_targets_mean": 1552.2,
"valid_targets_min": 793
},
{
"epoch": 2.668067226890756,
"grad_norm": 0.8324884710244702,
"learning_rate": 3.112936560931752e-05,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1621646136045456,
"step": 2540,
"valid_targets_mean": 1393.4,
"valid_targets_min": 563
},
{
"epoch": 2.6733193277310923,
"grad_norm": 0.745079772832585,
"learning_rate": 3.108580152675642e-05,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16466446220874786,
"step": 2545,
"valid_targets_mean": 1476.5,
"valid_targets_min": 837
},
{
"epoch": 2.678571428571429,
"grad_norm": 0.7667224190162166,
"learning_rate": 3.104216138731511e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17364142835140228,
"step": 2550,
"valid_targets_mean": 1660.7,
"valid_targets_min": 1107
},
{
"epoch": 2.6838235294117645,
"grad_norm": 0.8705202254035619,
"learning_rate": 3.0998445490397546e-05,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17687436938285828,
"step": 2555,
"valid_targets_mean": 1498.9,
"valid_targets_min": 680
},
{
"epoch": 2.689075630252101,
"grad_norm": 0.7422198641689959,
"learning_rate": 3.095465413592743e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1798504889011383,
"step": 2560,
"valid_targets_mean": 1571.8,
"valid_targets_min": 803
},
{
"epoch": 2.6943277310924367,
"grad_norm": 0.8053104805546935,
"learning_rate": 3.091078762434616e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.175202876329422,
"step": 2565,
"valid_targets_mean": 1496.6,
"valid_targets_min": 631
},
{
"epoch": 2.6995798319327733,
"grad_norm": 0.7483069663873031,
"learning_rate": 3.086684625661081e-05,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16679367423057556,
"step": 2570,
"valid_targets_mean": 1476.0,
"valid_targets_min": 804
},
{
"epoch": 2.7048319327731094,
"grad_norm": 0.7649264183537576,
"learning_rate": 3.082283033419197e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16266639530658722,
"step": 2575,
"valid_targets_mean": 1448.8,
"valid_targets_min": 675
},
{
"epoch": 2.7100840336134455,
"grad_norm": 0.7515149499265241,
"learning_rate": 3.077874015907174e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18091100454330444,
"step": 2580,
"valid_targets_mean": 1305.0,
"valid_targets_min": 856
},
{
"epoch": 2.7153361344537816,
"grad_norm": 0.7377534312107921,
"learning_rate": 3.073457603374167e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628911793231964,
"step": 2585,
"valid_targets_mean": 1487.6,
"valid_targets_min": 715
},
{
"epoch": 2.7205882352941178,
"grad_norm": 0.7717568619128692,
"learning_rate": 3.069033826120066e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1856994479894638,
"step": 2590,
"valid_targets_mean": 1619.1,
"valid_targets_min": 678
},
{
"epoch": 2.725840336134454,
"grad_norm": 0.9267036067403248,
"learning_rate": 3.064602714495286e-05,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19266122579574585,
"step": 2595,
"valid_targets_mean": 1382.1,
"valid_targets_min": 676
},
{
"epoch": 2.73109243697479,
"grad_norm": 0.7500546233055486,
"learning_rate": 3.060164298900565e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1605774164199829,
"step": 2600,
"valid_targets_mean": 1260.2,
"valid_targets_min": 794
},
{
"epoch": 2.736344537815126,
"grad_norm": 0.9445550576448264,
"learning_rate": 3.055718609786749e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16394124925136566,
"step": 2605,
"valid_targets_mean": 1414.1,
"valid_targets_min": 607
},
{
"epoch": 2.741596638655462,
"grad_norm": 0.7880924622108275,
"learning_rate": 3.051265677654585e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1700436919927597,
"step": 2610,
"valid_targets_mean": 1450.9,
"valid_targets_min": 741
},
{
"epoch": 2.7468487394957983,
"grad_norm": 0.7995324958770467,
"learning_rate": 3.0468055330545162e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18648771941661835,
"step": 2615,
"valid_targets_mean": 1626.9,
"valid_targets_min": 858
},
{
"epoch": 2.7521008403361344,
"grad_norm": 0.776585890510735,
"learning_rate": 3.0423382065864653e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16372038424015045,
"step": 2620,
"valid_targets_mean": 1370.7,
"valid_targets_min": 689
},
{
"epoch": 2.7573529411764706,
"grad_norm": 0.8233797828888295,
"learning_rate": 3.0378637288996304e-05,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1707250475883484,
"step": 2625,
"valid_targets_mean": 1327.7,
"valid_targets_min": 690
},
{
"epoch": 2.7626050420168067,
"grad_norm": 0.7313593178890555,
"learning_rate": 3.033382130692269e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16939744353294373,
"step": 2630,
"valid_targets_mean": 1433.4,
"valid_targets_min": 718
},
{
"epoch": 2.767857142857143,
"grad_norm": 0.7983600909257519,
"learning_rate": 3.0288934427114955e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16010600328445435,
"step": 2635,
"valid_targets_mean": 1398.2,
"valid_targets_min": 618
},
{
"epoch": 2.773109243697479,
"grad_norm": 0.7280785441425935,
"learning_rate": 3.0243976957530602e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16162815690040588,
"step": 2640,
"valid_targets_mean": 1479.6,
"valid_targets_min": 629
},
{
"epoch": 2.778361344537815,
"grad_norm": 0.7839303867427334,
"learning_rate": 3.0198949206611475e-05,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18356014788150787,
"step": 2645,
"valid_targets_mean": 1549.6,
"valid_targets_min": 650
},
{
"epoch": 2.783613445378151,
"grad_norm": 0.7391305503246356,
"learning_rate": 3.0153851483281582e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16755986213684082,
"step": 2650,
"valid_targets_mean": 1363.6,
"valid_targets_min": 677
},
{
"epoch": 2.7888655462184873,
"grad_norm": 0.7900413678108272,
"learning_rate": 3.010868409694499e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1623220145702362,
"step": 2655,
"valid_targets_mean": 1367.9,
"valid_targets_min": 679
},
{
"epoch": 2.7941176470588234,
"grad_norm": 0.7222759869118193,
"learning_rate": 3.0063447357483712e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16432425379753113,
"step": 2660,
"valid_targets_mean": 1393.1,
"valid_targets_min": 504
},
{
"epoch": 2.79936974789916,
"grad_norm": 0.7458633773608461,
"learning_rate": 3.0018141575255587e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16822689771652222,
"step": 2665,
"valid_targets_mean": 1577.6,
"valid_targets_min": 1006
},
{
"epoch": 2.8046218487394956,
"grad_norm": 0.7555827595039865,
"learning_rate": 2.9972767061092107e-05,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15489238500595093,
"step": 2670,
"valid_targets_mean": 1338.3,
"valid_targets_min": 661
},
{
"epoch": 2.809873949579832,
"grad_norm": 0.6713741267521114,
"learning_rate": 2.9927324126296352e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1501934975385666,
"step": 2675,
"valid_targets_mean": 1335.4,
"valid_targets_min": 886
},
{
"epoch": 2.815126050420168,
"grad_norm": 0.677528061579685,
"learning_rate": 2.98818130826408e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1680719256401062,
"step": 2680,
"valid_targets_mean": 1633.0,
"valid_targets_min": 909
},
{
"epoch": 2.8203781512605044,
"grad_norm": 0.8220892091600075,
"learning_rate": 2.9836234242365204e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17720499634742737,
"step": 2685,
"valid_targets_mean": 1308.2,
"valid_targets_min": 793
},
{
"epoch": 2.82563025210084,
"grad_norm": 0.8315780706625598,
"learning_rate": 2.979058791817447e-05,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1801975965499878,
"step": 2690,
"valid_targets_mean": 1479.8,
"valid_targets_min": 861
},
{
"epoch": 2.8308823529411766,
"grad_norm": 0.7948697249631214,
"learning_rate": 2.974487442323647e-05,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16297297179698944,
"step": 2695,
"valid_targets_mean": 1284.6,
"valid_targets_min": 752
},
{
"epoch": 2.8361344537815127,
"grad_norm": 0.7446282359364188,
"learning_rate": 2.9699094071179938e-05,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18304650485515594,
"step": 2700,
"valid_targets_mean": 1584.1,
"valid_targets_min": 830
},
{
"epoch": 2.841386554621849,
"grad_norm": 0.718619587429062,
"learning_rate": 2.9653247176092286e-05,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1484600156545639,
"step": 2705,
"valid_targets_mean": 1445.1,
"valid_targets_min": 638
},
{
"epoch": 2.846638655462185,
"grad_norm": 0.8381765419273387,
"learning_rate": 2.9607334052517466e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1818123310804367,
"step": 2710,
"valid_targets_mean": 1449.8,
"valid_targets_min": 605
},
{
"epoch": 2.851890756302521,
"grad_norm": 0.7250086940420657,
"learning_rate": 2.9561355015453803e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16832154989242554,
"step": 2715,
"valid_targets_mean": 1551.5,
"valid_targets_min": 746
},
{
"epoch": 2.857142857142857,
"grad_norm": 0.7099316939262316,
"learning_rate": 2.9515310380351847e-05,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16392531991004944,
"step": 2720,
"valid_targets_mean": 1306.3,
"valid_targets_min": 723
},
{
"epoch": 2.8623949579831933,
"grad_norm": 0.7472866347997246,
"learning_rate": 2.9469200463112186e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17414012551307678,
"step": 2725,
"valid_targets_mean": 1487.9,
"valid_targets_min": 855
},
{
"epoch": 2.8676470588235294,
"grad_norm": 0.7126081269612909,
"learning_rate": 2.9423025580083298e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15881696343421936,
"step": 2730,
"valid_targets_mean": 1503.1,
"valid_targets_min": 902
},
{
"epoch": 2.8728991596638656,
"grad_norm": 0.7172891409501757,
"learning_rate": 2.937678604805938e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16258196532726288,
"step": 2735,
"valid_targets_mean": 1501.8,
"valid_targets_min": 798
},
{
"epoch": 2.8781512605042017,
"grad_norm": 0.7828132309340979,
"learning_rate": 2.9330482184278168e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1718115508556366,
"step": 2740,
"valid_targets_mean": 1378.9,
"valid_targets_min": 740
},
{
"epoch": 2.883403361344538,
"grad_norm": 0.7837917980983125,
"learning_rate": 2.9284114306418758e-05,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1576087772846222,
"step": 2745,
"valid_targets_mean": 1222.1,
"valid_targets_min": 244
},
{
"epoch": 2.888655462184874,
"grad_norm": 0.7472309237344245,
"learning_rate": 2.923768273259942e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15255385637283325,
"step": 2750,
"valid_targets_mean": 1328.9,
"valid_targets_min": 714
},
{
"epoch": 2.89390756302521,
"grad_norm": 0.796880354826496,
"learning_rate": 2.919118778137546e-05,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15773728489875793,
"step": 2755,
"valid_targets_mean": 1268.8,
"valid_targets_min": 585
},
{
"epoch": 2.899159663865546,
"grad_norm": 0.7916812281947033,
"learning_rate": 2.9144629771736954e-05,
"loss": 0.1816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18590059876441956,
"step": 2760,
"valid_targets_mean": 1596.2,
"valid_targets_min": 1041
},
{
"epoch": 2.9044117647058822,
"grad_norm": 0.7189169579851691,
"learning_rate": 2.9098009023106645e-05,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15632124245166779,
"step": 2765,
"valid_targets_mean": 1373.1,
"valid_targets_min": 657
},
{
"epoch": 2.9096638655462184,
"grad_norm": 0.7049554537703587,
"learning_rate": 2.9051325855337684e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15910044312477112,
"step": 2770,
"valid_targets_mean": 1468.1,
"valid_targets_min": 959
},
{
"epoch": 2.9149159663865545,
"grad_norm": 0.7054773517266925,
"learning_rate": 2.90045805887115e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1691712886095047,
"step": 2775,
"valid_targets_mean": 1426.8,
"valid_targets_min": 620
},
{
"epoch": 2.9201680672268906,
"grad_norm": 0.8510450051223593,
"learning_rate": 2.8957773543935518e-05,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1627202183008194,
"step": 2780,
"valid_targets_mean": 1360.6,
"valid_targets_min": 732
},
{
"epoch": 2.9254201680672267,
"grad_norm": 0.7255441493487386,
"learning_rate": 2.8910905042141046e-05,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17565231025218964,
"step": 2785,
"valid_targets_mean": 1550.9,
"valid_targets_min": 732
},
{
"epoch": 2.9306722689075633,
"grad_norm": 0.7448004871056576,
"learning_rate": 2.8863975404881022e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.170585036277771,
"step": 2790,
"valid_targets_mean": 1635.2,
"valid_targets_min": 682
},
{
"epoch": 2.935924369747899,
"grad_norm": 0.8125236767167314,
"learning_rate": 2.881698495412781e-05,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16882717609405518,
"step": 2795,
"valid_targets_mean": 1338.4,
"valid_targets_min": 596
},
{
"epoch": 2.9411764705882355,
"grad_norm": 0.7100556725806012,
"learning_rate": 2.8769934012271004e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1684436947107315,
"step": 2800,
"valid_targets_mean": 1609.4,
"valid_targets_min": 747
},
{
"epoch": 2.946428571428571,
"grad_norm": 0.742789781874144,
"learning_rate": 2.8722822902115228e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1685582548379898,
"step": 2805,
"valid_targets_mean": 1568.2,
"valid_targets_min": 820
},
{
"epoch": 2.9516806722689077,
"grad_norm": 0.7211288410702199,
"learning_rate": 2.8675651946877884e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17647072672843933,
"step": 2810,
"valid_targets_mean": 1670.1,
"valid_targets_min": 799
},
{
"epoch": 2.956932773109244,
"grad_norm": 0.7463660696176379,
"learning_rate": 2.862842147018696e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17189790308475494,
"step": 2815,
"valid_targets_mean": 1533.6,
"valid_targets_min": 1047
},
{
"epoch": 2.96218487394958,
"grad_norm": 0.7064510545820726,
"learning_rate": 2.858113179607881e-05,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1601008176803589,
"step": 2820,
"valid_targets_mean": 1528.5,
"valid_targets_min": 741
},
{
"epoch": 2.967436974789916,
"grad_norm": 0.7179205966287691,
"learning_rate": 2.8533783248995938e-05,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15484890341758728,
"step": 2825,
"valid_targets_mean": 1404.0,
"valid_targets_min": 720
},
{
"epoch": 2.972689075630252,
"grad_norm": 0.7844547172494378,
"learning_rate": 2.848637615378475e-05,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16542135179042816,
"step": 2830,
"valid_targets_mean": 1366.3,
"valid_targets_min": 892
},
{
"epoch": 2.9779411764705883,
"grad_norm": 0.7331691954809272,
"learning_rate": 2.8438910835693314e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17777270078659058,
"step": 2835,
"valid_targets_mean": 1436.8,
"valid_targets_min": 684
},
{
"epoch": 2.9831932773109244,
"grad_norm": 0.6822641232454941,
"learning_rate": 2.8391387620369192e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1580207496881485,
"step": 2840,
"valid_targets_mean": 1425.5,
"valid_targets_min": 874
},
{
"epoch": 2.9884453781512605,
"grad_norm": 0.7108579727414756,
"learning_rate": 2.834380683385714e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16222992539405823,
"step": 2845,
"valid_targets_mean": 1604.8,
"valid_targets_min": 1280
},
{
"epoch": 2.9936974789915967,
"grad_norm": 0.7199485862107549,
"learning_rate": 2.8296168802596892e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16997018456459045,
"step": 2850,
"valid_targets_mean": 1522.8,
"valid_targets_min": 589
},
{
"epoch": 2.9989495798319328,
"grad_norm": 0.7245690379476749,
"learning_rate": 2.8248473853420933e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18465590476989746,
"step": 2855,
"valid_targets_mean": 1654.8,
"valid_targets_min": 918
},
{
"epoch": 3.004201680672269,
"grad_norm": 0.6536431805707318,
"learning_rate": 2.8200722313552247e-05,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2750670313835144,
"step": 2860,
"valid_targets_mean": 3678.0,
"valid_targets_min": 702
},
{
"epoch": 3.009453781512605,
"grad_norm": 0.5616581452948703,
"learning_rate": 2.8152914510602073e-05,
"loss": 0.2663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2694254219532013,
"step": 2865,
"valid_targets_mean": 4133.2,
"valid_targets_min": 1550
},
{
"epoch": 3.014705882352941,
"grad_norm": 0.5914552324016616,
"learning_rate": 2.810505077256765e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26886335015296936,
"step": 2870,
"valid_targets_mean": 3929.9,
"valid_targets_min": 1296
},
{
"epoch": 3.0199579831932772,
"grad_norm": 0.5617545432111057,
"learning_rate": 2.8057131427829983e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23543497920036316,
"step": 2875,
"valid_targets_mean": 4362.6,
"valid_targets_min": 1681
},
{
"epoch": 3.0252100840336134,
"grad_norm": 0.5909970139213782,
"learning_rate": 2.800915680515157e-05,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.269046425819397,
"step": 2880,
"valid_targets_mean": 3591.2,
"valid_targets_min": 1044
},
{
"epoch": 3.0304621848739495,
"grad_norm": 0.548113977574793,
"learning_rate": 2.7961127233674167e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2423868477344513,
"step": 2885,
"valid_targets_mean": 3697.8,
"valid_targets_min": 920
},
{
"epoch": 3.0357142857142856,
"grad_norm": 0.5485874887437441,
"learning_rate": 2.7913043042916513e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25993612408638,
"step": 2890,
"valid_targets_mean": 5826.4,
"valid_targets_min": 2060
},
{
"epoch": 3.0409663865546217,
"grad_norm": 0.5329423434447529,
"learning_rate": 2.786490456277208e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24909579753875732,
"step": 2895,
"valid_targets_mean": 4033.6,
"valid_targets_min": 467
},
{
"epoch": 3.046218487394958,
"grad_norm": 0.5983501432535179,
"learning_rate": 2.7816712123506796e-05,
"loss": 0.2631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2781432271003723,
"step": 2900,
"valid_targets_mean": 3789.9,
"valid_targets_min": 1689
},
{
"epoch": 3.051470588235294,
"grad_norm": 0.5971903589113992,
"learning_rate": 2.776846605575681e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2563186287879944,
"step": 2905,
"valid_targets_mean": 3695.6,
"valid_targets_min": 1477
},
{
"epoch": 3.05672268907563,
"grad_norm": 0.5806312781845833,
"learning_rate": 2.772016669052618e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2883797883987427,
"step": 2910,
"valid_targets_mean": 4019.2,
"valid_targets_min": 1223
},
{
"epoch": 3.0619747899159666,
"grad_norm": 0.5300497777002529,
"learning_rate": 2.767181435918464e-05,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27011632919311523,
"step": 2915,
"valid_targets_mean": 4429.1,
"valid_targets_min": 1552
},
{
"epoch": 3.0672268907563027,
"grad_norm": 0.6074007571412762,
"learning_rate": 2.7623409393465298e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2498617321252823,
"step": 2920,
"valid_targets_mean": 3706.6,
"valid_targets_min": 1439
},
{
"epoch": 3.072478991596639,
"grad_norm": 0.626168733306276,
"learning_rate": 2.7574952125462386e-05,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23380611836910248,
"step": 2925,
"valid_targets_mean": 3199.5,
"valid_targets_min": 1402
},
{
"epoch": 3.077731092436975,
"grad_norm": 0.6268290865377733,
"learning_rate": 2.7526442887628962e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27413225173950195,
"step": 2930,
"valid_targets_mean": 3583.0,
"valid_targets_min": 1586
},
{
"epoch": 3.082983193277311,
"grad_norm": 0.6176358259961854,
"learning_rate": 2.7477882012774633e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2532740831375122,
"step": 2935,
"valid_targets_mean": 3411.6,
"valid_targets_min": 1538
},
{
"epoch": 3.088235294117647,
"grad_norm": 0.6568380568558851,
"learning_rate": 2.742926983406328e-05,
"loss": 0.2605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2723920941352844,
"step": 2940,
"valid_targets_mean": 2824.4,
"valid_targets_min": 1058
},
{
"epoch": 3.0934873949579833,
"grad_norm": 0.6596581392165033,
"learning_rate": 2.7380606685010767e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2707256078720093,
"step": 2945,
"valid_targets_mean": 2777.6,
"valid_targets_min": 1205
},
{
"epoch": 3.0987394957983194,
"grad_norm": 0.6126808354592166,
"learning_rate": 2.7331892899482654e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.266759991645813,
"step": 2950,
"valid_targets_mean": 3421.2,
"valid_targets_min": 1165
},
{
"epoch": 3.1039915966386555,
"grad_norm": 0.6307476273476691,
"learning_rate": 2.7283128811691893e-05,
"loss": 0.2605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2549319565296173,
"step": 2955,
"valid_targets_mean": 3220.3,
"valid_targets_min": 1267
},
{
"epoch": 3.1092436974789917,
"grad_norm": 0.6279599813034801,
"learning_rate": 2.7234314756196564e-05,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24072325229644775,
"step": 2960,
"valid_targets_mean": 3117.6,
"valid_targets_min": 1026
},
{
"epoch": 3.1144957983193278,
"grad_norm": 0.612911115813002,
"learning_rate": 2.718545106789755e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25921279191970825,
"step": 2965,
"valid_targets_mean": 3350.1,
"valid_targets_min": 1345
},
{
"epoch": 3.119747899159664,
"grad_norm": 0.6086001253575483,
"learning_rate": 2.713653808203626e-05,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24595654010772705,
"step": 2970,
"valid_targets_mean": 3563.4,
"valid_targets_min": 2050
},
{
"epoch": 3.125,
"grad_norm": 0.6022736229918767,
"learning_rate": 2.7087576134192305e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23543179035186768,
"step": 2975,
"valid_targets_mean": 3142.4,
"valid_targets_min": 1166
},
{
"epoch": 3.130252100840336,
"grad_norm": 0.6154494544856133,
"learning_rate": 2.7038565560281252e-05,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2742067575454712,
"step": 2980,
"valid_targets_mean": 3220.9,
"valid_targets_min": 997
},
{
"epoch": 3.1355042016806722,
"grad_norm": 0.6742689274132734,
"learning_rate": 2.6989506696552224e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2767985463142395,
"step": 2985,
"valid_targets_mean": 2980.7,
"valid_targets_min": 1293
},
{
"epoch": 3.1407563025210083,
"grad_norm": 0.6039332698980796,
"learning_rate": 2.6940399879585685e-05,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23629191517829895,
"step": 2990,
"valid_targets_mean": 3027.2,
"valid_targets_min": 1732
},
{
"epoch": 3.1460084033613445,
"grad_norm": 0.6818227952934203,
"learning_rate": 2.6891245446291093e-05,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27924174070358276,
"step": 2995,
"valid_targets_mean": 3159.9,
"valid_targets_min": 1108
},
{
"epoch": 3.1512605042016806,
"grad_norm": 0.6924339005528242,
"learning_rate": 2.6842043733904578e-05,
"loss": 0.2517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25699329376220703,
"step": 3000,
"valid_targets_mean": 3364.2,
"valid_targets_min": 571
},
{
"epoch": 3.1565126050420167,
"grad_norm": 0.675775810675891,
"learning_rate": 2.6792795079986634e-05,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25223487615585327,
"step": 3005,
"valid_targets_mean": 2891.1,
"valid_targets_min": 738
},
{
"epoch": 3.161764705882353,
"grad_norm": 0.7118892851934508,
"learning_rate": 2.6743499822419833e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26765280961990356,
"step": 3010,
"valid_targets_mean": 2982.2,
"valid_targets_min": 1798
},
{
"epoch": 3.167016806722689,
"grad_norm": 0.6135998796483827,
"learning_rate": 2.669415829940646e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24437305331230164,
"step": 3015,
"valid_targets_mean": 3367.0,
"valid_targets_min": 1338
},
{
"epoch": 3.172268907563025,
"grad_norm": 0.6308992296328928,
"learning_rate": 2.6644770849466226e-05,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26935499906539917,
"step": 3020,
"valid_targets_mean": 3564.4,
"valid_targets_min": 1276
},
{
"epoch": 3.177521008403361,
"grad_norm": 0.6604476871808482,
"learning_rate": 2.6595337811433925e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25287342071533203,
"step": 3025,
"valid_targets_mean": 3842.9,
"valid_targets_min": 1668
},
{
"epoch": 3.1827731092436973,
"grad_norm": 0.5864716374259419,
"learning_rate": 2.654585952445714e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2597090005874634,
"step": 3030,
"valid_targets_mean": 3920.2,
"valid_targets_min": 1373
},
{
"epoch": 3.1880252100840334,
"grad_norm": 0.6138428018636582,
"learning_rate": 2.6496336327993882e-05,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2661425769329071,
"step": 3035,
"valid_targets_mean": 3629.1,
"valid_targets_min": 1858
},
{
"epoch": 3.19327731092437,
"grad_norm": 0.5951194931237926,
"learning_rate": 2.6446768561810264e-05,
"loss": 0.2559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2323005348443985,
"step": 3040,
"valid_targets_mean": 3384.1,
"valid_targets_min": 922
},
{
"epoch": 3.198529411764706,
"grad_norm": 0.6617141663860238,
"learning_rate": 2.6397156565978198e-05,
"loss": 0.2537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28470370173454285,
"step": 3045,
"valid_targets_mean": 3499.2,
"valid_targets_min": 2483
},
{
"epoch": 3.203781512605042,
"grad_norm": 0.6472312935786627,
"learning_rate": 2.6347500680873043e-05,
"loss": 0.2491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24719394743442535,
"step": 3050,
"valid_targets_mean": 2993.0,
"valid_targets_min": 977
},
{
"epoch": 3.2090336134453783,
"grad_norm": 0.5796753467452805,
"learning_rate": 2.6297801247171258e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2180900275707245,
"step": 3055,
"valid_targets_mean": 3620.9,
"valid_targets_min": 1856
},
{
"epoch": 3.2142857142857144,
"grad_norm": 0.663197194188445,
"learning_rate": 2.6248058605848097e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24358363449573517,
"step": 3060,
"valid_targets_mean": 3015.3,
"valid_targets_min": 1200
},
{
"epoch": 3.2195378151260505,
"grad_norm": 0.5921044967379778,
"learning_rate": 2.6198273098175234e-05,
"loss": 0.2468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21505384147167206,
"step": 3065,
"valid_targets_mean": 3572.4,
"valid_targets_min": 1607
},
{
"epoch": 3.2247899159663866,
"grad_norm": 0.656610014798293,
"learning_rate": 2.614844506571844e-05,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24926620721817017,
"step": 3070,
"valid_targets_mean": 2880.9,
"valid_targets_min": 1358
},
{
"epoch": 3.2300420168067228,
"grad_norm": 0.6222197525250114,
"learning_rate": 2.609857485033525e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2442103624343872,
"step": 3075,
"valid_targets_mean": 3209.0,
"valid_targets_min": 1219
},
{
"epoch": 3.235294117647059,
"grad_norm": 0.587521968482715,
"learning_rate": 2.6048662794172595e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23662276566028595,
"step": 3080,
"valid_targets_mean": 3512.0,
"valid_targets_min": 1168
},
{
"epoch": 3.240546218487395,
"grad_norm": 0.6685246266555611,
"learning_rate": 2.599870923966447e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525354027748108,
"step": 3085,
"valid_targets_mean": 2764.2,
"valid_targets_min": 474
},
{
"epoch": 3.245798319327731,
"grad_norm": 0.6202106667084994,
"learning_rate": 2.5948714529529565e-05,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24517540633678436,
"step": 3090,
"valid_targets_mean": 3665.3,
"valid_targets_min": 1140
},
{
"epoch": 3.2510504201680672,
"grad_norm": 0.5785793477278848,
"learning_rate": 2.5898679006768958e-05,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22179822623729706,
"step": 3095,
"valid_targets_mean": 3486.1,
"valid_targets_min": 1482
},
{
"epoch": 3.2563025210084033,
"grad_norm": 0.6033278556859933,
"learning_rate": 2.5848603014663702e-05,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21563810110092163,
"step": 3100,
"valid_targets_mean": 3097.8,
"valid_targets_min": 904
},
{
"epoch": 3.2615546218487395,
"grad_norm": 0.6455004631708245,
"learning_rate": 2.579848689677252e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29056334495544434,
"step": 3105,
"valid_targets_mean": 3727.6,
"valid_targets_min": 1194
},
{
"epoch": 3.2668067226890756,
"grad_norm": 0.5925539085498962,
"learning_rate": 2.5748330996929414e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2517462372779846,
"step": 3110,
"valid_targets_mean": 3901.4,
"valid_targets_min": 1527
},
{
"epoch": 3.2720588235294117,
"grad_norm": 0.6625252347137165,
"learning_rate": 2.5698135659241334e-05,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2597498893737793,
"step": 3115,
"valid_targets_mean": 3953.8,
"valid_targets_min": 1428
},
{
"epoch": 3.277310924369748,
"grad_norm": 0.6869236027507247,
"learning_rate": 2.564790122808579e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27155032753944397,
"step": 3120,
"valid_targets_mean": 3239.1,
"valid_targets_min": 1460
},
{
"epoch": 3.282563025210084,
"grad_norm": 0.641846245505168,
"learning_rate": 2.5597628048108504e-05,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26535165309906006,
"step": 3125,
"valid_targets_mean": 3494.8,
"valid_targets_min": 1172
},
{
"epoch": 3.28781512605042,
"grad_norm": 0.6112401795648174,
"learning_rate": 2.5547316464221058e-05,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2558062672615051,
"step": 3130,
"valid_targets_mean": 3518.0,
"valid_targets_min": 1229
},
{
"epoch": 3.293067226890756,
"grad_norm": 0.5712486962165064,
"learning_rate": 2.5496966821598493e-05,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23176561295986176,
"step": 3135,
"valid_targets_mean": 3590.5,
"valid_targets_min": 1523
},
{
"epoch": 3.2983193277310923,
"grad_norm": 0.6085435476900142,
"learning_rate": 2.5446579465676977e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23727688193321228,
"step": 3140,
"valid_targets_mean": 3541.0,
"valid_targets_min": 997
},
{
"epoch": 3.3035714285714284,
"grad_norm": 0.6531904825025399,
"learning_rate": 2.5396154742151407e-05,
"loss": 0.2383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2473251223564148,
"step": 3145,
"valid_targets_mean": 3417.0,
"valid_targets_min": 621
},
{
"epoch": 3.3088235294117645,
"grad_norm": 0.6509222958342396,
"learning_rate": 2.5345692996973075e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24736976623535156,
"step": 3150,
"valid_targets_mean": 3183.2,
"valid_targets_min": 1282
},
{
"epoch": 3.314075630252101,
"grad_norm": 0.5707923779013074,
"learning_rate": 2.5295194576347233e-05,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21255888044834137,
"step": 3155,
"valid_targets_mean": 3807.4,
"valid_targets_min": 1143
},
{
"epoch": 3.3193277310924367,
"grad_norm": 0.638283494349549,
"learning_rate": 2.5244659826730774e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23158839344978333,
"step": 3160,
"valid_targets_mean": 3191.6,
"valid_targets_min": 1438
},
{
"epoch": 3.3245798319327733,
"grad_norm": 0.5983879302794481,
"learning_rate": 2.519408909482984e-05,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23230604827404022,
"step": 3165,
"valid_targets_mean": 3549.1,
"valid_targets_min": 2091
},
{
"epoch": 3.3298319327731094,
"grad_norm": 0.6356003504281118,
"learning_rate": 2.5143482727597427e-05,
"loss": 0.2408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23692654073238373,
"step": 3170,
"valid_targets_mean": 3175.4,
"valid_targets_min": 1305
},
{
"epoch": 3.3350840336134455,
"grad_norm": 0.5822669278425938,
"learning_rate": 2.509284107223102e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2323712259531021,
"step": 3175,
"valid_targets_mean": 3699.6,
"valid_targets_min": 1428
},
{
"epoch": 3.3403361344537816,
"grad_norm": 0.6034461853939603,
"learning_rate": 2.50421644761702e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2210870236158371,
"step": 3180,
"valid_targets_mean": 3405.7,
"valid_targets_min": 1388
},
{
"epoch": 3.3455882352941178,
"grad_norm": 0.6142007275077153,
"learning_rate": 2.499145328709429e-05,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25747138261795044,
"step": 3185,
"valid_targets_mean": 3644.9,
"valid_targets_min": 1823
},
{
"epoch": 3.350840336134454,
"grad_norm": 0.6119837836741985,
"learning_rate": 2.4940707852919924e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2111436128616333,
"step": 3190,
"valid_targets_mean": 3011.4,
"valid_targets_min": 1109
},
{
"epoch": 3.35609243697479,
"grad_norm": 0.6533534419454151,
"learning_rate": 2.488992852179868e-05,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23850302398204803,
"step": 3195,
"valid_targets_mean": 3141.6,
"valid_targets_min": 1649
},
{
"epoch": 3.361344537815126,
"grad_norm": 0.7140300662865305,
"learning_rate": 2.483911564211472e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26096731424331665,
"step": 3200,
"valid_targets_mean": 2904.2,
"valid_targets_min": 1249
},
{
"epoch": 3.366596638655462,
"grad_norm": 0.7251927942844403,
"learning_rate": 2.4788269562482355e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26130279898643494,
"step": 3205,
"valid_targets_mean": 3641.2,
"valid_targets_min": 1793
},
{
"epoch": 3.3718487394957983,
"grad_norm": 0.6421393556947993,
"learning_rate": 2.4737390631743675e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2507364749908447,
"step": 3210,
"valid_targets_mean": 3154.0,
"valid_targets_min": 1054
},
{
"epoch": 3.3771008403361344,
"grad_norm": 0.6437737473605846,
"learning_rate": 2.4686479198966146e-05,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24308231472969055,
"step": 3215,
"valid_targets_mean": 3276.6,
"valid_targets_min": 1055
},
{
"epoch": 3.3823529411764706,
"grad_norm": 0.6571399883695811,
"learning_rate": 2.463553561344024e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24305208027362823,
"step": 3220,
"valid_targets_mean": 3750.0,
"valid_targets_min": 1241
},
{
"epoch": 3.3876050420168067,
"grad_norm": 0.650161760454692,
"learning_rate": 2.4584560224677013e-05,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24910904467105865,
"step": 3225,
"valid_targets_mean": 3649.5,
"valid_targets_min": 1174
},
{
"epoch": 3.392857142857143,
"grad_norm": 0.645357588744853,
"learning_rate": 2.4533553382405702e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2722882926464081,
"step": 3230,
"valid_targets_mean": 3284.9,
"valid_targets_min": 992
},
{
"epoch": 3.398109243697479,
"grad_norm": 0.6297523245044137,
"learning_rate": 2.4482515436571365e-05,
"loss": 0.2473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25592392683029175,
"step": 3235,
"valid_targets_mean": 3817.9,
"valid_targets_min": 1133
},
{
"epoch": 3.403361344537815,
"grad_norm": 0.6382149094735594,
"learning_rate": 2.4431446737332437e-05,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542281150817871,
"step": 3240,
"valid_targets_mean": 3242.6,
"valid_targets_min": 1409
},
{
"epoch": 3.408613445378151,
"grad_norm": 0.726502424494956,
"learning_rate": 2.438034763505833e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25886449217796326,
"step": 3245,
"valid_targets_mean": 3062.4,
"valid_targets_min": 719
},
{
"epoch": 3.4138655462184873,
"grad_norm": 0.659719001774402,
"learning_rate": 2.432921848032707e-05,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25948482751846313,
"step": 3250,
"valid_targets_mean": 3307.1,
"valid_targets_min": 1239
},
{
"epoch": 3.4191176470588234,
"grad_norm": 0.6125599642876945,
"learning_rate": 2.427805962392286e-05,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24624377489089966,
"step": 3255,
"valid_targets_mean": 3635.1,
"valid_targets_min": 1349
},
{
"epoch": 3.4243697478991595,
"grad_norm": 0.6755501860373633,
"learning_rate": 2.4226871416833683e-05,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2604214549064636,
"step": 3260,
"valid_targets_mean": 3250.2,
"valid_targets_min": 1434
},
{
"epoch": 3.4296218487394956,
"grad_norm": 0.6523430203235168,
"learning_rate": 2.4175654210248848e-05,
"loss": 0.2408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23800113797187805,
"step": 3265,
"valid_targets_mean": 3233.2,
"valid_targets_min": 521
},
{
"epoch": 3.434873949579832,
"grad_norm": 0.6487475032548123,
"learning_rate": 2.4124408355556677e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2616475224494934,
"step": 3270,
"valid_targets_mean": 3477.9,
"valid_targets_min": 937
},
{
"epoch": 3.440126050420168,
"grad_norm": 0.7183856650514495,
"learning_rate": 2.4073134204342014e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25091075897216797,
"step": 3275,
"valid_targets_mean": 3096.8,
"valid_targets_min": 1239
},
{
"epoch": 3.4453781512605044,
"grad_norm": 0.6435718093662096,
"learning_rate": 2.4021832108383837e-05,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23243436217308044,
"step": 3280,
"valid_targets_mean": 3552.1,
"valid_targets_min": 1457
},
{
"epoch": 3.4506302521008405,
"grad_norm": 0.6794408128931803,
"learning_rate": 2.3970502419652854e-05,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24406090378761292,
"step": 3285,
"valid_targets_mean": 3231.3,
"valid_targets_min": 1307
},
{
"epoch": 3.4558823529411766,
"grad_norm": 0.6369525387600705,
"learning_rate": 2.3919145490309076e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24544468522071838,
"step": 3290,
"valid_targets_mean": 3674.0,
"valid_targets_min": 1773
},
{
"epoch": 3.4611344537815127,
"grad_norm": 0.6864257084128846,
"learning_rate": 2.38677616726994e-05,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23525570333003998,
"step": 3295,
"valid_targets_mean": 3274.8,
"valid_targets_min": 1035
},
{
"epoch": 3.466386554621849,
"grad_norm": 0.6249370596202156,
"learning_rate": 2.381635131935521e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23440296947956085,
"step": 3300,
"valid_targets_mean": 3696.1,
"valid_targets_min": 1333
},
{
"epoch": 3.471638655462185,
"grad_norm": 0.609366608375307,
"learning_rate": 2.3764914782989926e-05,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2386169135570526,
"step": 3305,
"valid_targets_mean": 3717.7,
"valid_targets_min": 1062
},
{
"epoch": 3.476890756302521,
"grad_norm": 0.6957649137605235,
"learning_rate": 2.3713452416496625e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2374548614025116,
"step": 3310,
"valid_targets_mean": 2991.9,
"valid_targets_min": 993
},
{
"epoch": 3.482142857142857,
"grad_norm": 0.6360187725166639,
"learning_rate": 2.366196457294558e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23413576185703278,
"step": 3315,
"valid_targets_mean": 3540.1,
"valid_targets_min": 873
},
{
"epoch": 3.4873949579831933,
"grad_norm": 0.6151473063134504,
"learning_rate": 2.3610451605581858e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21768996119499207,
"step": 3320,
"valid_targets_mean": 3565.8,
"valid_targets_min": 1152
},
{
"epoch": 3.4926470588235294,
"grad_norm": 0.6627058497672066,
"learning_rate": 2.3558913867822905e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24642956256866455,
"step": 3325,
"valid_targets_mean": 3437.2,
"valid_targets_min": 1128
},
{
"epoch": 3.4978991596638656,
"grad_norm": 0.6487038665095798,
"learning_rate": 2.3507351713256105e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22559967637062073,
"step": 3330,
"valid_targets_mean": 3062.5,
"valid_targets_min": 1123
},
{
"epoch": 3.5031512605042017,
"grad_norm": 0.7141894926568165,
"learning_rate": 2.3455765495636353e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2572299838066101,
"step": 3335,
"valid_targets_mean": 2870.6,
"valid_targets_min": 1278
},
{
"epoch": 3.508403361344538,
"grad_norm": 0.7021679105572891,
"learning_rate": 2.3404155568883643e-05,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23877769708633423,
"step": 3340,
"valid_targets_mean": 3168.8,
"valid_targets_min": 1834
},
{
"epoch": 3.513655462184874,
"grad_norm": 0.597320613139139,
"learning_rate": 2.3352522287080625e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21225066483020782,
"step": 3345,
"valid_targets_mean": 3446.2,
"valid_targets_min": 420
},
{
"epoch": 3.51890756302521,
"grad_norm": 0.6380276235544516,
"learning_rate": 2.3300866004470182e-05,
"loss": 0.2432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24665868282318115,
"step": 3350,
"valid_targets_mean": 3379.9,
"valid_targets_min": 757
},
{
"epoch": 3.524159663865546,
"grad_norm": 0.7068358500231999,
"learning_rate": 2.324918707545302e-05,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24660983681678772,
"step": 3355,
"valid_targets_mean": 2930.9,
"valid_targets_min": 732
},
{
"epoch": 3.5294117647058822,
"grad_norm": 0.6415894870301354,
"learning_rate": 2.3197485854585183e-05,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2307543158531189,
"step": 3360,
"valid_targets_mean": 3399.6,
"valid_targets_min": 929
},
{
"epoch": 3.5346638655462184,
"grad_norm": 0.6658926618185477,
"learning_rate": 2.3145762696575675e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25282666087150574,
"step": 3365,
"valid_targets_mean": 3603.7,
"valid_targets_min": 1217
},
{
"epoch": 3.5399159663865545,
"grad_norm": 0.9220749340704859,
"learning_rate": 2.3094017956283995e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17968519032001495,
"step": 3370,
"valid_targets_mean": 1437.6,
"valid_targets_min": 544
},
{
"epoch": 3.5451680672268906,
"grad_norm": 0.8146754285295436,
"learning_rate": 2.3042251988717728e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1631278544664383,
"step": 3375,
"valid_targets_mean": 1329.9,
"valid_targets_min": 632
},
{
"epoch": 3.5504201680672267,
"grad_norm": 0.8079169271047991,
"learning_rate": 2.2990465149030077e-05,
"loss": 0.1602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14737124741077423,
"step": 3380,
"valid_targets_mean": 1353.5,
"valid_targets_min": 514
},
{
"epoch": 3.5556722689075633,
"grad_norm": 0.8535871657760787,
"learning_rate": 2.2938657792517446e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16740497946739197,
"step": 3385,
"valid_targets_mean": 1316.6,
"valid_targets_min": 701
},
{
"epoch": 3.560924369747899,
"grad_norm": 0.7719202998888485,
"learning_rate": 2.2886830274617017e-05,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1611393243074417,
"step": 3390,
"valid_targets_mean": 1592.3,
"valid_targets_min": 754
},
{
"epoch": 3.5661764705882355,
"grad_norm": 0.7958529561306797,
"learning_rate": 2.2834982950904267e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14342686533927917,
"step": 3395,
"valid_targets_mean": 1302.9,
"valid_targets_min": 746
},
{
"epoch": 3.571428571428571,
"grad_norm": 0.8182753300383552,
"learning_rate": 2.2783116177090573e-05,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16086168587207794,
"step": 3400,
"valid_targets_mean": 1477.3,
"valid_targets_min": 774
},
{
"epoch": 3.5766806722689077,
"grad_norm": 0.8440198093915002,
"learning_rate": 2.2731230309020762e-05,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14826279878616333,
"step": 3405,
"valid_targets_mean": 1277.8,
"valid_targets_min": 648
},
{
"epoch": 3.581932773109244,
"grad_norm": 0.7376313701958287,
"learning_rate": 2.2679325702670642e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1509246826171875,
"step": 3410,
"valid_targets_mean": 1484.6,
"valid_targets_min": 708
},
{
"epoch": 3.58718487394958,
"grad_norm": 0.7318924656750266,
"learning_rate": 2.2627402714144586e-05,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13782326877117157,
"step": 3415,
"valid_targets_mean": 1430.1,
"valid_targets_min": 770
},
{
"epoch": 3.592436974789916,
"grad_norm": 0.7765160826126889,
"learning_rate": 2.2575461699673085e-05,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13097913563251495,
"step": 3420,
"valid_targets_mean": 1201.6,
"valid_targets_min": 572
},
{
"epoch": 3.597689075630252,
"grad_norm": 0.7638002189556976,
"learning_rate": 2.2523503015610303e-05,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1455516219139099,
"step": 3425,
"valid_targets_mean": 1363.5,
"valid_targets_min": 627
},
{
"epoch": 3.6029411764705883,
"grad_norm": 1.2976616643941823,
"learning_rate": 2.2471527018431637e-05,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16458860039710999,
"step": 3430,
"valid_targets_mean": 1451.6,
"valid_targets_min": 765
},
{
"epoch": 3.6081932773109244,
"grad_norm": 0.7946926976962566,
"learning_rate": 2.2419534064731238e-05,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15298821032047272,
"step": 3435,
"valid_targets_mean": 1393.4,
"valid_targets_min": 740
},
{
"epoch": 3.6134453781512605,
"grad_norm": 0.7749793995924292,
"learning_rate": 2.236752451121963e-05,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1496553122997284,
"step": 3440,
"valid_targets_mean": 1498.2,
"valid_targets_min": 821
},
{
"epoch": 3.6186974789915967,
"grad_norm": 0.8079854962978418,
"learning_rate": 2.2315498714721198e-05,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1507023572921753,
"step": 3445,
"valid_targets_mean": 1411.3,
"valid_targets_min": 691
},
{
"epoch": 3.6239495798319328,
"grad_norm": 0.7810771746182552,
"learning_rate": 2.2263457032171762e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1364845335483551,
"step": 3450,
"valid_targets_mean": 1252.6,
"valid_targets_min": 721
},
{
"epoch": 3.629201680672269,
"grad_norm": 0.7854800292698711,
"learning_rate": 2.2211399820616154e-05,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15126636624336243,
"step": 3455,
"valid_targets_mean": 1422.4,
"valid_targets_min": 727
},
{
"epoch": 3.634453781512605,
"grad_norm": 0.7420584859304036,
"learning_rate": 2.2159327437205733e-05,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14271925389766693,
"step": 3460,
"valid_targets_mean": 1345.2,
"valid_targets_min": 681
},
{
"epoch": 3.639705882352941,
"grad_norm": 0.7964739958712432,
"learning_rate": 2.210724023919595e-05,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16524961590766907,
"step": 3465,
"valid_targets_mean": 1557.1,
"valid_targets_min": 814
},
{
"epoch": 3.6449579831932772,
"grad_norm": 0.737091402225577,
"learning_rate": 2.205513858394389e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16383059322834015,
"step": 3470,
"valid_targets_mean": 1626.4,
"valid_targets_min": 832
},
{
"epoch": 3.6502100840336134,
"grad_norm": 0.7022804917492798,
"learning_rate": 2.2003022828905832e-05,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14327232539653778,
"step": 3475,
"valid_targets_mean": 1605.8,
"valid_targets_min": 891
},
{
"epoch": 3.6554621848739495,
"grad_norm": 0.9525205693478359,
"learning_rate": 2.19508933316348e-05,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15683533251285553,
"step": 3480,
"valid_targets_mean": 1267.2,
"valid_targets_min": 621
},
{
"epoch": 3.6607142857142856,
"grad_norm": 0.76863394644955,
"learning_rate": 2.189875044977808e-05,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12910358607769012,
"step": 3485,
"valid_targets_mean": 1270.9,
"valid_targets_min": 704
},
{
"epoch": 3.6659663865546217,
"grad_norm": 0.8107277676634275,
"learning_rate": 2.1846594541074796e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15735816955566406,
"step": 3490,
"valid_targets_mean": 1564.4,
"valid_targets_min": 872
},
{
"epoch": 3.671218487394958,
"grad_norm": 0.8063598539952364,
"learning_rate": 2.179442596335345e-05,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13597534596920013,
"step": 3495,
"valid_targets_mean": 1323.2,
"valid_targets_min": 584
},
{
"epoch": 3.6764705882352944,
"grad_norm": 0.7114116421864716,
"learning_rate": 2.174224507452945e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1412769854068756,
"step": 3500,
"valid_targets_mean": 1568.7,
"valid_targets_min": 999
},
{
"epoch": 3.68172268907563,
"grad_norm": 0.9027372835508958,
"learning_rate": 2.1690052232602677e-05,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17291805148124695,
"step": 3505,
"valid_targets_mean": 1610.1,
"valid_targets_min": 750
},
{
"epoch": 3.6869747899159666,
"grad_norm": 0.7921785974495511,
"learning_rate": 2.1637847795655022e-05,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13400542736053467,
"step": 3510,
"valid_targets_mean": 1269.1,
"valid_targets_min": 613
},
{
"epoch": 3.6922268907563023,
"grad_norm": 0.7595580625561714,
"learning_rate": 2.1585632121847925e-05,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14459824562072754,
"step": 3515,
"valid_targets_mean": 1640.6,
"valid_targets_min": 768
},
{
"epoch": 3.697478991596639,
"grad_norm": 0.8461026963697874,
"learning_rate": 2.153340556941991e-05,
"loss": 0.1452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13768309354782104,
"step": 3520,
"valid_targets_mean": 1270.5,
"valid_targets_min": 700
},
{
"epoch": 3.7027310924369745,
"grad_norm": 0.8139291786249493,
"learning_rate": 2.1481168496684145e-05,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13502518832683563,
"step": 3525,
"valid_targets_mean": 1266.8,
"valid_targets_min": 800
},
{
"epoch": 3.707983193277311,
"grad_norm": 0.7773733165903327,
"learning_rate": 2.142892126202597e-05,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14710843563079834,
"step": 3530,
"valid_targets_mean": 1562.7,
"valid_targets_min": 843
},
{
"epoch": 3.713235294117647,
"grad_norm": 0.8540100911584824,
"learning_rate": 2.137666422390045e-05,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14058175683021545,
"step": 3535,
"valid_targets_mean": 1169.9,
"valid_targets_min": 746
},
{
"epoch": 3.7184873949579833,
"grad_norm": 0.8192520728614282,
"learning_rate": 2.132439774082991e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.136886328458786,
"step": 3540,
"valid_targets_mean": 1270.4,
"valid_targets_min": 772
},
{
"epoch": 3.7237394957983194,
"grad_norm": 0.7591394569870296,
"learning_rate": 2.1272122171401467e-05,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12614212930202484,
"step": 3545,
"valid_targets_mean": 1218.7,
"valid_targets_min": 619
},
{
"epoch": 3.7289915966386555,
"grad_norm": 0.8033788971182879,
"learning_rate": 2.1219837874264573e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14868700504302979,
"step": 3550,
"valid_targets_mean": 1416.0,
"valid_targets_min": 734
},
{
"epoch": 3.7342436974789917,
"grad_norm": 0.7186280622481173,
"learning_rate": 2.116754520812857e-05,
"loss": 0.1436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14419475197792053,
"step": 3555,
"valid_targets_mean": 1500.3,
"valid_targets_min": 831
},
{
"epoch": 3.7394957983193278,
"grad_norm": 0.8001515867898759,
"learning_rate": 2.111524453176022e-05,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14432606101036072,
"step": 3560,
"valid_targets_mean": 1469.2,
"valid_targets_min": 722
},
{
"epoch": 3.744747899159664,
"grad_norm": 0.7937436890534154,
"learning_rate": 2.1062936203981227e-05,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1394154131412506,
"step": 3565,
"valid_targets_mean": 1317.1,
"valid_targets_min": 711
},
{
"epoch": 3.75,
"grad_norm": 0.768116550112638,
"learning_rate": 2.10106205836658e-05,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13312450051307678,
"step": 3570,
"valid_targets_mean": 1313.2,
"valid_targets_min": 733
},
{
"epoch": 3.755252100840336,
"grad_norm": 0.8277161948796012,
"learning_rate": 2.095829802973817e-05,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15327024459838867,
"step": 3575,
"valid_targets_mean": 1500.1,
"valid_targets_min": 931
},
{
"epoch": 3.7605042016806722,
"grad_norm": 0.7538438394237286,
"learning_rate": 2.090596890117016e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14686134457588196,
"step": 3580,
"valid_targets_mean": 1631.1,
"valid_targets_min": 1011
},
{
"epoch": 3.7657563025210083,
"grad_norm": 0.8173261031285455,
"learning_rate": 2.0853633556978674e-05,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14837123453617096,
"step": 3585,
"valid_targets_mean": 1393.4,
"valid_targets_min": 748
},
{
"epoch": 3.7710084033613445,
"grad_norm": 0.8094111718458211,
"learning_rate": 2.0801292356223265e-05,
"loss": 0.1419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14551788568496704,
"step": 3590,
"valid_targets_mean": 1533.6,
"valid_targets_min": 699
},
{
"epoch": 3.7762605042016806,
"grad_norm": 0.9683838865909208,
"learning_rate": 2.0748945658003695e-05,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13133487105369568,
"step": 3595,
"valid_targets_mean": 1311.3,
"valid_targets_min": 534
},
{
"epoch": 3.7815126050420167,
"grad_norm": 0.7858949321807766,
"learning_rate": 2.0696593821457392e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13803954422473907,
"step": 3600,
"valid_targets_mean": 1410.7,
"valid_targets_min": 687
},
{
"epoch": 3.786764705882353,
"grad_norm": 0.7682170107004075,
"learning_rate": 2.064423720575709e-05,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1322372555732727,
"step": 3605,
"valid_targets_mean": 1287.4,
"valid_targets_min": 549
},
{
"epoch": 3.792016806722689,
"grad_norm": 0.785944883857896,
"learning_rate": 2.0591876170108257e-05,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13903062045574188,
"step": 3610,
"valid_targets_mean": 1356.6,
"valid_targets_min": 725
},
{
"epoch": 3.7972689075630255,
"grad_norm": 1.0766948059764874,
"learning_rate": 2.0539511073746743e-05,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1596774160861969,
"step": 3615,
"valid_targets_mean": 1579.2,
"valid_targets_min": 852
},
{
"epoch": 3.802521008403361,
"grad_norm": 0.8802148487961788,
"learning_rate": 2.0487142275936213e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1571769416332245,
"step": 3620,
"valid_targets_mean": 1478.4,
"valid_targets_min": 978
},
{
"epoch": 3.8077731092436977,
"grad_norm": 0.9017272636806979,
"learning_rate": 2.0434770135965743e-05,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1524774432182312,
"step": 3625,
"valid_targets_mean": 1463.6,
"valid_targets_min": 545
},
{
"epoch": 3.8130252100840334,
"grad_norm": 0.794244937697772,
"learning_rate": 2.0382395013147347e-05,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15117822587490082,
"step": 3630,
"valid_targets_mean": 1314.1,
"valid_targets_min": 622
},
{
"epoch": 3.81827731092437,
"grad_norm": 0.683828437827683,
"learning_rate": 2.033001726681349e-05,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17605149745941162,
"step": 3635,
"valid_targets_mean": 1785.9,
"valid_targets_min": 849
},
{
"epoch": 3.8235294117647056,
"grad_norm": 0.8701621923894823,
"learning_rate": 2.027763725631463e-05,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1420620083808899,
"step": 3640,
"valid_targets_mean": 1337.8,
"valid_targets_min": 612
},
{
"epoch": 3.828781512605042,
"grad_norm": 0.8336992892361698,
"learning_rate": 2.0225255341016794e-05,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13892850279808044,
"step": 3645,
"valid_targets_mean": 1443.2,
"valid_targets_min": 673
},
{
"epoch": 3.8340336134453783,
"grad_norm": 0.8497904024804793,
"learning_rate": 2.017287188029904e-05,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14770525693893433,
"step": 3650,
"valid_targets_mean": 1358.2,
"valid_targets_min": 746
},
{
"epoch": 3.8392857142857144,
"grad_norm": 0.7320787153441641,
"learning_rate": 2.0120487233551035e-05,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13209758698940277,
"step": 3655,
"valid_targets_mean": 1293.9,
"valid_targets_min": 672
},
{
"epoch": 3.8445378151260505,
"grad_norm": 0.8025485910991912,
"learning_rate": 2.006810176017059e-05,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1370171755552292,
"step": 3660,
"valid_targets_mean": 1362.8,
"valid_targets_min": 670
},
{
"epoch": 3.8497899159663866,
"grad_norm": 0.7870212464053592,
"learning_rate": 2.0015715819561205e-05,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440301537513733,
"step": 3665,
"valid_targets_mean": 1569.8,
"valid_targets_min": 647
},
{
"epoch": 3.8550420168067228,
"grad_norm": 0.7590451152844765,
"learning_rate": 1.9963329771129558e-05,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12877610325813293,
"step": 3670,
"valid_targets_mean": 1300.3,
"valid_targets_min": 613
},
{
"epoch": 3.860294117647059,
"grad_norm": 0.8086227373232483,
"learning_rate": 1.9910943974283066e-05,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13503482937812805,
"step": 3675,
"valid_targets_mean": 1306.6,
"valid_targets_min": 746
},
{
"epoch": 3.865546218487395,
"grad_norm": 0.7360884641253568,
"learning_rate": 1.9858558788427447e-05,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1362096667289734,
"step": 3680,
"valid_targets_mean": 1580.3,
"valid_targets_min": 892
},
{
"epoch": 3.870798319327731,
"grad_norm": 0.8447821850921354,
"learning_rate": 1.9806174572964205e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15582120418548584,
"step": 3685,
"valid_targets_mean": 1388.9,
"valid_targets_min": 635
},
{
"epoch": 3.8760504201680672,
"grad_norm": 0.7698208399307699,
"learning_rate": 1.975379168728819e-05,
"loss": 0.1404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1433495581150055,
"step": 3690,
"valid_targets_mean": 1522.7,
"valid_targets_min": 636
},
{
"epoch": 3.8813025210084033,
"grad_norm": 0.8559947536872534,
"learning_rate": 1.9701410490785128e-05,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15050233900547028,
"step": 3695,
"valid_targets_mean": 1404.7,
"valid_targets_min": 641
},
{
"epoch": 3.8865546218487395,
"grad_norm": 0.8384924745171093,
"learning_rate": 1.9649031342829178e-05,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14834997057914734,
"step": 3700,
"valid_targets_mean": 1505.6,
"valid_targets_min": 818
},
{
"epoch": 3.8918067226890756,
"grad_norm": 0.904316575159625,
"learning_rate": 1.9596654602780398e-05,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14717188477516174,
"step": 3705,
"valid_targets_mean": 1389.2,
"valid_targets_min": 625
},
{
"epoch": 3.8970588235294117,
"grad_norm": 0.8089593091562093,
"learning_rate": 1.9544280629982364e-05,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16768889129161835,
"step": 3710,
"valid_targets_mean": 1636.1,
"valid_targets_min": 888
},
{
"epoch": 3.902310924369748,
"grad_norm": 1.1385386317837363,
"learning_rate": 1.949190978375966e-05,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1377800554037094,
"step": 3715,
"valid_targets_mean": 1567.6,
"valid_targets_min": 908
},
{
"epoch": 3.907563025210084,
"grad_norm": 0.7625175757891974,
"learning_rate": 1.9439542423415413e-05,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1343471109867096,
"step": 3720,
"valid_targets_mean": 1259.7,
"valid_targets_min": 522
},
{
"epoch": 3.91281512605042,
"grad_norm": 0.7881066764674685,
"learning_rate": 1.9387178908228838e-05,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1399286389350891,
"step": 3725,
"valid_targets_mean": 1342.3,
"valid_targets_min": 730
},
{
"epoch": 3.918067226890756,
"grad_norm": 0.7975143538194005,
"learning_rate": 1.933481959745276e-05,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13079893589019775,
"step": 3730,
"valid_targets_mean": 1350.1,
"valid_targets_min": 869
},
{
"epoch": 3.9233193277310923,
"grad_norm": 0.7958077340565655,
"learning_rate": 1.9282464850311184e-05,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14043010771274567,
"step": 3735,
"valid_targets_mean": 1477.9,
"valid_targets_min": 769
},
{
"epoch": 3.928571428571429,
"grad_norm": 0.8357581182064178,
"learning_rate": 1.9230115025996764e-05,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13817790150642395,
"step": 3740,
"valid_targets_mean": 1340.2,
"valid_targets_min": 716
},
{
"epoch": 3.9338235294117645,
"grad_norm": 0.7898072090831375,
"learning_rate": 1.9177770483668416e-05,
"loss": 0.1404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13853862881660461,
"step": 3745,
"valid_targets_mean": 1375.1,
"valid_targets_min": 707
},
{
"epoch": 3.939075630252101,
"grad_norm": 0.8156265634718887,
"learning_rate": 1.912543158244881e-05,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13628491759300232,
"step": 3750,
"valid_targets_mean": 1429.2,
"valid_targets_min": 964
},
{
"epoch": 3.9443277310924367,
"grad_norm": 0.8498119635524579,
"learning_rate": 1.9073098681421895e-05,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17182615399360657,
"step": 3755,
"valid_targets_mean": 1610.7,
"valid_targets_min": 793
},
{
"epoch": 3.9495798319327733,
"grad_norm": 0.7982935292914652,
"learning_rate": 1.902077213963048e-05,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1300593912601471,
"step": 3760,
"valid_targets_mean": 1399.4,
"valid_targets_min": 727
},
{
"epoch": 3.9548319327731094,
"grad_norm": 0.7854022510245628,
"learning_rate": 1.896845231607372e-05,
"loss": 0.1389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13969582319259644,
"step": 3765,
"valid_targets_mean": 1396.2,
"valid_targets_min": 734
},
{
"epoch": 3.9600840336134455,
"grad_norm": 0.5894392686560074,
"learning_rate": 1.8916139569704704e-05,
"loss": 0.1356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10743817687034607,
"step": 3770,
"valid_targets_mean": 2173.6,
"valid_targets_min": 917
},
{
"epoch": 3.9653361344537816,
"grad_norm": 0.7395136244392762,
"learning_rate": 1.886383425942795e-05,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1325417160987854,
"step": 3775,
"valid_targets_mean": 1583.9,
"valid_targets_min": 930
},
{
"epoch": 3.9705882352941178,
"grad_norm": 0.7865246777578737,
"learning_rate": 1.8811536744096956e-05,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13856448233127594,
"step": 3780,
"valid_targets_mean": 1454.1,
"valid_targets_min": 570
},
{
"epoch": 3.975840336134454,
"grad_norm": 0.7942309792805228,
"learning_rate": 1.8759247382511748e-05,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14219339191913605,
"step": 3785,
"valid_targets_mean": 1557.5,
"valid_targets_min": 870
},
{
"epoch": 3.98109243697479,
"grad_norm": 0.8125974018026644,
"learning_rate": 1.8706966533416413e-05,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14180970191955566,
"step": 3790,
"valid_targets_mean": 1599.9,
"valid_targets_min": 1070
},
{
"epoch": 3.986344537815126,
"grad_norm": 0.7872308732821972,
"learning_rate": 1.8654694555496624e-05,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15511301159858704,
"step": 3795,
"valid_targets_mean": 1596.4,
"valid_targets_min": 626
},
{
"epoch": 3.991596638655462,
"grad_norm": 0.8264202266884269,
"learning_rate": 1.860243180737721e-05,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13887375593185425,
"step": 3800,
"valid_targets_mean": 1423.5,
"valid_targets_min": 718
},
{
"epoch": 3.9968487394957983,
"grad_norm": 0.8547785642731142,
"learning_rate": 1.8550178647619664e-05,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14218434691429138,
"step": 3805,
"valid_targets_mean": 1343.2,
"valid_targets_min": 646
},
{
"epoch": 4.0021008403361344,
"grad_norm": 0.9794746439498689,
"learning_rate": 1.84979354347197e-05,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2445564717054367,
"step": 3810,
"valid_targets_mean": 3945.9,
"valid_targets_min": 1698
},
{
"epoch": 4.007352941176471,
"grad_norm": 0.6295029416310093,
"learning_rate": 1.8445702527104782e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21728411316871643,
"step": 3815,
"valid_targets_mean": 3601.0,
"valid_targets_min": 981
},
{
"epoch": 4.012605042016807,
"grad_norm": 0.6261229756084788,
"learning_rate": 1.8393480283131677e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2355230748653412,
"step": 3820,
"valid_targets_mean": 3562.5,
"valid_targets_min": 835
},
{
"epoch": 4.017857142857143,
"grad_norm": 0.5498474690761935,
"learning_rate": 1.8341269061083996e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23167270421981812,
"step": 3825,
"valid_targets_mean": 4304.1,
"valid_targets_min": 1201
},
{
"epoch": 4.023109243697479,
"grad_norm": 0.593694354846493,
"learning_rate": 1.8289069219169717e-05,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22287964820861816,
"step": 3830,
"valid_targets_mean": 3669.4,
"valid_targets_min": 980
},
{
"epoch": 4.0283613445378155,
"grad_norm": 0.6618298739900584,
"learning_rate": 1.8236881115518766e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2557893693447113,
"step": 3835,
"valid_targets_mean": 4120.9,
"valid_targets_min": 1512
},
{
"epoch": 4.033613445378151,
"grad_norm": 0.6142046700506524,
"learning_rate": 1.8184705108180516e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2090051770210266,
"step": 3840,
"valid_targets_mean": 3758.4,
"valid_targets_min": 1734
},
{
"epoch": 4.038865546218488,
"grad_norm": 0.5794721395589425,
"learning_rate": 1.8132541555121353e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2171669602394104,
"step": 3845,
"valid_targets_mean": 4416.4,
"valid_targets_min": 1381
},
{
"epoch": 4.044117647058823,
"grad_norm": 0.5873970760320343,
"learning_rate": 1.808039081422223e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23693841695785522,
"step": 3850,
"valid_targets_mean": 3650.9,
"valid_targets_min": 1024
},
{
"epoch": 4.04936974789916,
"grad_norm": 0.6544469337267305,
"learning_rate": 1.802825324327618e-05,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22341692447662354,
"step": 3855,
"valid_targets_mean": 3792.1,
"valid_targets_min": 2107
},
{
"epoch": 4.054621848739496,
"grad_norm": 0.6368703549214123,
"learning_rate": 1.7976129199985886e-05,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.216568723320961,
"step": 3860,
"valid_targets_mean": 3349.4,
"valid_targets_min": 802
},
{
"epoch": 4.059873949579832,
"grad_norm": 0.6024180533305669,
"learning_rate": 1.7924019041961228e-05,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22188133001327515,
"step": 3865,
"valid_targets_mean": 3829.7,
"valid_targets_min": 1597
},
{
"epoch": 4.065126050420168,
"grad_norm": 0.6323374001658106,
"learning_rate": 1.7871923126716827e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21390947699546814,
"step": 3870,
"valid_targets_mean": 2841.6,
"valid_targets_min": 1535
},
{
"epoch": 4.070378151260504,
"grad_norm": 0.5926408570492498,
"learning_rate": 1.7819841811669573e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23295366764068604,
"step": 3875,
"valid_targets_mean": 4229.0,
"valid_targets_min": 1385
},
{
"epoch": 4.07563025210084,
"grad_norm": 0.6456267570500575,
"learning_rate": 1.7767775454136194e-05,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24474671483039856,
"step": 3880,
"valid_targets_mean": 3543.5,
"valid_targets_min": 1451
},
{
"epoch": 4.080882352941177,
"grad_norm": 0.7628071822726314,
"learning_rate": 1.7715724411330806e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2485944777727127,
"step": 3885,
"valid_targets_mean": 2809.7,
"valid_targets_min": 1269
},
{
"epoch": 4.086134453781512,
"grad_norm": 0.6699354098606171,
"learning_rate": 1.7663689040362446e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23240669071674347,
"step": 3890,
"valid_targets_mean": 2924.8,
"valid_targets_min": 935
},
{
"epoch": 4.091386554621849,
"grad_norm": 0.6582143455705185,
"learning_rate": 1.761166969823262e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2368423342704773,
"step": 3895,
"valid_targets_mean": 3029.1,
"valid_targets_min": 1695
},
{
"epoch": 4.0966386554621845,
"grad_norm": 0.7189637917203952,
"learning_rate": 1.7559666741832896e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2396736443042755,
"step": 3900,
"valid_targets_mean": 3217.1,
"valid_targets_min": 671
},
{
"epoch": 4.101890756302521,
"grad_norm": 0.651225210749888,
"learning_rate": 1.750768052794239e-05,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23836606740951538,
"step": 3905,
"valid_targets_mean": 3716.9,
"valid_targets_min": 1020
},
{
"epoch": 4.107142857142857,
"grad_norm": 0.6518633827861082,
"learning_rate": 1.7455711413225372e-05,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.233098566532135,
"step": 3910,
"valid_targets_mean": 3237.8,
"valid_targets_min": 1889
},
{
"epoch": 4.112394957983193,
"grad_norm": 0.6876543636905016,
"learning_rate": 1.7403759754228794e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22473348677158356,
"step": 3915,
"valid_targets_mean": 2959.4,
"valid_targets_min": 1385
},
{
"epoch": 4.117647058823529,
"grad_norm": 0.7187642767454995,
"learning_rate": 1.7351825907379837e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25105470418930054,
"step": 3920,
"valid_targets_mean": 3390.4,
"valid_targets_min": 1588
},
{
"epoch": 4.1228991596638656,
"grad_norm": 0.6768076603434932,
"learning_rate": 1.7299910228983513e-05,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23110558092594147,
"step": 3925,
"valid_targets_mean": 3135.2,
"valid_targets_min": 699
},
{
"epoch": 4.128151260504202,
"grad_norm": 0.6753396109242978,
"learning_rate": 1.7248013075220128e-05,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22585970163345337,
"step": 3930,
"valid_targets_mean": 2970.0,
"valid_targets_min": 648
},
{
"epoch": 4.133403361344538,
"grad_norm": 0.6444337615377012,
"learning_rate": 1.7196134802142945e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2224642038345337,
"step": 3935,
"valid_targets_mean": 3744.2,
"valid_targets_min": 1934
},
{
"epoch": 4.138655462184874,
"grad_norm": 0.6792362480524322,
"learning_rate": 1.7144275765675673e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23104789853096008,
"step": 3940,
"valid_targets_mean": 3753.4,
"valid_targets_min": 863
},
{
"epoch": 4.14390756302521,
"grad_norm": 0.6240116424894049,
"learning_rate": 1.7092436321610042e-05,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2116166055202484,
"step": 3945,
"valid_targets_mean": 3309.5,
"valid_targets_min": 1410
},
{
"epoch": 4.149159663865547,
"grad_norm": 0.6706279698577615,
"learning_rate": 1.704061682560336e-05,
"loss": 0.23,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25118085741996765,
"step": 3950,
"valid_targets_mean": 4311.5,
"valid_targets_min": 2040
},
{
"epoch": 4.154411764705882,
"grad_norm": 0.7103731685784668,
"learning_rate": 1.698881763317609e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23094293475151062,
"step": 3955,
"valid_targets_mean": 2688.4,
"valid_targets_min": 1458
},
{
"epoch": 4.159663865546219,
"grad_norm": 0.6553558995778831,
"learning_rate": 1.69370390997094e-05,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2209138721227646,
"step": 3960,
"valid_targets_mean": 3155.8,
"valid_targets_min": 1110
},
{
"epoch": 4.1649159663865545,
"grad_norm": 0.6997001621889637,
"learning_rate": 1.6885281580442677e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22238752245903015,
"step": 3965,
"valid_targets_mean": 2572.8,
"valid_targets_min": 513
},
{
"epoch": 4.170168067226891,
"grad_norm": 2.385982583274398,
"learning_rate": 1.6833545430471194e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642630636692047,
"step": 3970,
"valid_targets_mean": 2760.3,
"valid_targets_min": 1636
},
{
"epoch": 4.175420168067227,
"grad_norm": 0.6281184165319054,
"learning_rate": 1.678183100474359e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23373137414455414,
"step": 3975,
"valid_targets_mean": 3912.6,
"valid_targets_min": 1801
},
{
"epoch": 4.180672268907563,
"grad_norm": 0.7646111653644774,
"learning_rate": 1.6730138658059448e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2311634123325348,
"step": 3980,
"valid_targets_mean": 3197.1,
"valid_targets_min": 924
},
{
"epoch": 4.185924369747899,
"grad_norm": 0.7085277743946552,
"learning_rate": 1.667846874506689e-05,
"loss": 0.2264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2161899358034134,
"step": 3985,
"valid_targets_mean": 2886.2,
"valid_targets_min": 1401
},
{
"epoch": 4.1911764705882355,
"grad_norm": 0.7229719956908336,
"learning_rate": 1.662682162026012e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24561478197574615,
"step": 3990,
"valid_targets_mean": 3041.9,
"valid_targets_min": 1265
},
{
"epoch": 4.196428571428571,
"grad_norm": 0.6233236849228904,
"learning_rate": 1.6575197637976995e-05,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20357422530651093,
"step": 3995,
"valid_targets_mean": 3318.8,
"valid_targets_min": 1648
},
{
"epoch": 4.201680672268908,
"grad_norm": 0.684658245418384,
"learning_rate": 1.652359715239661e-05,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21792471408843994,
"step": 4000,
"valid_targets_mean": 3989.8,
"valid_targets_min": 1844
},
{
"epoch": 4.206932773109243,
"grad_norm": 0.6398769831531746,
"learning_rate": 1.6472020517536828e-05,
"loss": 0.2161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2144005000591278,
"step": 4005,
"valid_targets_mean": 3636.7,
"valid_targets_min": 1261
},
{
"epoch": 4.21218487394958,
"grad_norm": 0.7341420848535544,
"learning_rate": 1.6420468087251907e-05,
"loss": 0.2205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20942559838294983,
"step": 4010,
"valid_targets_mean": 3165.4,
"valid_targets_min": 1294
},
{
"epoch": 4.217436974789916,
"grad_norm": 0.7202011687730974,
"learning_rate": 1.6368940215230026e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24036064743995667,
"step": 4015,
"valid_targets_mean": 3169.3,
"valid_targets_min": 1432
},
{
"epoch": 4.222689075630252,
"grad_norm": 0.6828224156387892,
"learning_rate": 1.6317437254990875e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23701542615890503,
"step": 4020,
"valid_targets_mean": 3107.8,
"valid_targets_min": 742
},
{
"epoch": 4.227941176470588,
"grad_norm": 0.6787140516821543,
"learning_rate": 1.626595955988325e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21809794008731842,
"step": 4025,
"valid_targets_mean": 3005.8,
"valid_targets_min": 988
},
{
"epoch": 4.233193277310924,
"grad_norm": 0.7166611868537497,
"learning_rate": 1.6214507483082593e-05,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.233636736869812,
"step": 4030,
"valid_targets_mean": 3192.8,
"valid_targets_min": 654
},
{
"epoch": 4.23844537815126,
"grad_norm": 0.6756135280787572,
"learning_rate": 1.6163081377588588e-05,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22536295652389526,
"step": 4035,
"valid_targets_mean": 3349.0,
"valid_targets_min": 1328
},
{
"epoch": 4.243697478991597,
"grad_norm": 0.6733677254055387,
"learning_rate": 1.6111681596222732e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2062094807624817,
"step": 4040,
"valid_targets_mean": 3037.0,
"valid_targets_min": 1302
},
{
"epoch": 4.248949579831933,
"grad_norm": 0.7009721818052325,
"learning_rate": 1.606030849162593e-05,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2229950726032257,
"step": 4045,
"valid_targets_mean": 3635.6,
"valid_targets_min": 1701
},
{
"epoch": 4.254201680672269,
"grad_norm": 0.6661284889755613,
"learning_rate": 1.600896241625605e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22747060656547546,
"step": 4050,
"valid_targets_mean": 3422.1,
"valid_targets_min": 1319
},
{
"epoch": 4.2594537815126055,
"grad_norm": 0.6094686088609381,
"learning_rate": 1.5957643722385532e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21023216843605042,
"step": 4055,
"valid_targets_mean": 3806.1,
"valid_targets_min": 1194
},
{
"epoch": 4.264705882352941,
"grad_norm": 0.6259994730524294,
"learning_rate": 1.590635276209896e-05,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20072561502456665,
"step": 4060,
"valid_targets_mean": 3004.6,
"valid_targets_min": 1453
},
{
"epoch": 4.269957983193278,
"grad_norm": 0.5928071676270973,
"learning_rate": 1.5855089887290634e-05,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2144814431667328,
"step": 4065,
"valid_targets_mean": 3975.1,
"valid_targets_min": 1743
},
{
"epoch": 4.275210084033613,
"grad_norm": 0.7034766602053386,
"learning_rate": 1.5803855449662175e-05,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23000982403755188,
"step": 4070,
"valid_targets_mean": 3192.5,
"valid_targets_min": 1234
},
{
"epoch": 4.28046218487395,
"grad_norm": 0.6797161663877974,
"learning_rate": 1.5752649800720096e-05,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2336946427822113,
"step": 4075,
"valid_targets_mean": 3073.8,
"valid_targets_min": 1188
},
{
"epoch": 4.285714285714286,
"grad_norm": 0.5845573966663017,
"learning_rate": 1.5701473291773395e-05,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2029433399438858,
"step": 4080,
"valid_targets_mean": 3894.5,
"valid_targets_min": 618
},
{
"epoch": 4.290966386554622,
"grad_norm": 0.9566677599879087,
"learning_rate": 1.5650326273931166e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21042492985725403,
"step": 4085,
"valid_targets_mean": 3189.6,
"valid_targets_min": 1364
},
{
"epoch": 4.296218487394958,
"grad_norm": 0.6929467596600297,
"learning_rate": 1.559920909810016e-05,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22422900795936584,
"step": 4090,
"valid_targets_mean": 3735.1,
"valid_targets_min": 1514
},
{
"epoch": 4.301470588235294,
"grad_norm": 0.7889834685287505,
"learning_rate": 1.5548122114982393e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22729304432868958,
"step": 4095,
"valid_targets_mean": 2972.1,
"valid_targets_min": 1073
},
{
"epoch": 4.30672268907563,
"grad_norm": 0.7145190034824895,
"learning_rate": 1.5497065675072728e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22352570295333862,
"step": 4100,
"valid_targets_mean": 2926.5,
"valid_targets_min": 1026
},
{
"epoch": 4.311974789915967,
"grad_norm": 0.6561593136868893,
"learning_rate": 1.5446040128656485e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19251301884651184,
"step": 4105,
"valid_targets_mean": 2859.4,
"valid_targets_min": 857
},
{
"epoch": 4.317226890756302,
"grad_norm": 0.6862200086122758,
"learning_rate": 1.539504582580704e-05,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21139201521873474,
"step": 4110,
"valid_targets_mean": 3083.8,
"valid_targets_min": 720
},
{
"epoch": 4.322478991596639,
"grad_norm": 0.776255577609975,
"learning_rate": 1.5344083116383395e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24367398023605347,
"step": 4115,
"valid_targets_mean": 3220.5,
"valid_targets_min": 1175
},
{
"epoch": 4.3277310924369745,
"grad_norm": 0.6825477266343268,
"learning_rate": 1.529315235002781e-05,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20516598224639893,
"step": 4120,
"valid_targets_mean": 3000.1,
"valid_targets_min": 1411
},
{
"epoch": 4.332983193277311,
"grad_norm": 0.6569828485036016,
"learning_rate": 1.5242253876163399e-05,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2060314565896988,
"step": 4125,
"valid_targets_mean": 3553.2,
"valid_targets_min": 1743
},
{
"epoch": 4.338235294117647,
"grad_norm": 0.7319933985960059,
"learning_rate": 1.5191388043991712e-05,
"loss": 0.2178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2330959588289261,
"step": 4130,
"valid_targets_mean": 3180.8,
"valid_targets_min": 1398
},
{
"epoch": 4.343487394957983,
"grad_norm": 0.6718430936496146,
"learning_rate": 1.5140555202490359e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20311537384986877,
"step": 4135,
"valid_targets_mean": 3596.6,
"valid_targets_min": 1767
},
{
"epoch": 4.348739495798319,
"grad_norm": 0.6541737718826137,
"learning_rate": 1.5089755700410602e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20354878902435303,
"step": 4140,
"valid_targets_mean": 3805.3,
"valid_targets_min": 1145
},
{
"epoch": 4.3539915966386555,
"grad_norm": 0.6642189302688583,
"learning_rate": 1.5038989886274992e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2232103943824768,
"step": 4145,
"valid_targets_mean": 3490.6,
"valid_targets_min": 1722
},
{
"epoch": 4.359243697478991,
"grad_norm": 0.6521008246137644,
"learning_rate": 1.498825810837492e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19541659951210022,
"step": 4150,
"valid_targets_mean": 3157.6,
"valid_targets_min": 1423
},
{
"epoch": 4.364495798319328,
"grad_norm": 0.6924321128175812,
"learning_rate": 1.4937560714768283e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22630862891674042,
"step": 4155,
"valid_targets_mean": 3276.0,
"valid_targets_min": 1426
},
{
"epoch": 4.369747899159664,
"grad_norm": 0.7066936740974944,
"learning_rate": 1.4886898053277086e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2139957845211029,
"step": 4160,
"valid_targets_mean": 3190.3,
"valid_targets_min": 538
},
{
"epoch": 4.375,
"grad_norm": 0.7759687498686932,
"learning_rate": 1.4836270471485029e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2279035598039627,
"step": 4165,
"valid_targets_mean": 2498.0,
"valid_targets_min": 537
},
{
"epoch": 4.380252100840336,
"grad_norm": 0.6772887664667172,
"learning_rate": 1.4785678316735144e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21676117181777954,
"step": 4170,
"valid_targets_mean": 3068.9,
"valid_targets_min": 721
},
{
"epoch": 4.385504201680672,
"grad_norm": 0.8980937779941081,
"learning_rate": 1.4735121936127406e-05,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24256817996501923,
"step": 4175,
"valid_targets_mean": 3478.7,
"valid_targets_min": 1625
},
{
"epoch": 4.390756302521009,
"grad_norm": 0.7329255290185969,
"learning_rate": 1.4684601676516366e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2386029064655304,
"step": 4180,
"valid_targets_mean": 3130.2,
"valid_targets_min": 1400
},
{
"epoch": 4.3960084033613445,
"grad_norm": 0.7786336588807071,
"learning_rate": 1.4634117884508738e-05,
"loss": 0.214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19800731539726257,
"step": 4185,
"valid_targets_mean": 3135.8,
"valid_targets_min": 1648
},
{
"epoch": 4.401260504201681,
"grad_norm": 0.7631967058787871,
"learning_rate": 1.458367090646105e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2008107602596283,
"step": 4190,
"valid_targets_mean": 2437.4,
"valid_targets_min": 648
},
{
"epoch": 4.406512605042017,
"grad_norm": 0.7191244352959169,
"learning_rate": 1.4533261088477257e-05,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20372244715690613,
"step": 4195,
"valid_targets_mean": 2783.8,
"valid_targets_min": 885
},
{
"epoch": 4.411764705882353,
"grad_norm": 0.7150862191687413,
"learning_rate": 1.448288877640637e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20869606733322144,
"step": 4200,
"valid_targets_mean": 3689.0,
"valid_targets_min": 1325
},
{
"epoch": 4.417016806722689,
"grad_norm": 0.716489559808733,
"learning_rate": 1.4432554315840082e-05,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20727670192718506,
"step": 4205,
"valid_targets_mean": 3362.6,
"valid_targets_min": 953
},
{
"epoch": 4.4222689075630255,
"grad_norm": 0.7087446848068543,
"learning_rate": 1.438225805211039e-05,
"loss": 0.2114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.224325031042099,
"step": 4210,
"valid_targets_mean": 3481.2,
"valid_targets_min": 1592
},
{
"epoch": 4.427521008403361,
"grad_norm": 0.6500807963798068,
"learning_rate": 1.4332000330287248e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20948271453380585,
"step": 4215,
"valid_targets_mean": 3169.1,
"valid_targets_min": 530
},
{
"epoch": 4.432773109243698,
"grad_norm": 0.6730778830395577,
"learning_rate": 1.428178149517617e-05,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2134353220462799,
"step": 4220,
"valid_targets_mean": 3418.1,
"valid_targets_min": 1066
},
{
"epoch": 4.438025210084033,
"grad_norm": 0.6727213761188319,
"learning_rate": 1.4231601891315876e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2243449091911316,
"step": 4225,
"valid_targets_mean": 4071.0,
"valid_targets_min": 1885
},
{
"epoch": 4.44327731092437,
"grad_norm": 0.7011377195102847,
"learning_rate": 1.418146186297594e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19244351983070374,
"step": 4230,
"valid_targets_mean": 3914.1,
"valid_targets_min": 852
},
{
"epoch": 4.448529411764706,
"grad_norm": 0.6685868237134905,
"learning_rate": 1.413136175415441e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22170649468898773,
"step": 4235,
"valid_targets_mean": 2790.1,
"valid_targets_min": 1025
},
{
"epoch": 4.453781512605042,
"grad_norm": 0.6475753723469297,
"learning_rate": 1.4081301908575457e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2239975482225418,
"step": 4240,
"valid_targets_mean": 4196.2,
"valid_targets_min": 1397
},
{
"epoch": 4.459033613445378,
"grad_norm": 0.8141488892094502,
"learning_rate": 1.4031282669687035e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19613388180732727,
"step": 4245,
"valid_targets_mean": 3816.1,
"valid_targets_min": 1920
},
{
"epoch": 4.464285714285714,
"grad_norm": 0.6806187299183513,
"learning_rate": 1.3981304380658474e-05,
"loss": 0.2048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20587432384490967,
"step": 4250,
"valid_targets_mean": 3625.5,
"valid_targets_min": 1687
},
{
"epoch": 4.46953781512605,
"grad_norm": 0.7502387892882345,
"learning_rate": 1.3931367384378183e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2327464073896408,
"step": 4255,
"valid_targets_mean": 3404.2,
"valid_targets_min": 1210
},
{
"epoch": 4.474789915966387,
"grad_norm": 0.6570388636908775,
"learning_rate": 1.3881472023451262e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1919768750667572,
"step": 4260,
"valid_targets_mean": 3334.3,
"valid_targets_min": 1360
},
{
"epoch": 4.480042016806722,
"grad_norm": 0.6969625105218161,
"learning_rate": 1.3831618640197153e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21205592155456543,
"step": 4265,
"valid_targets_mean": 3091.5,
"valid_targets_min": 1447
},
{
"epoch": 4.485294117647059,
"grad_norm": 0.7307640724228113,
"learning_rate": 1.3781807576647315e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.204860657453537,
"step": 4270,
"valid_targets_mean": 2715.1,
"valid_targets_min": 1243
},
{
"epoch": 4.4905462184873945,
"grad_norm": 0.7293687135782331,
"learning_rate": 1.373203917454285e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21605542302131653,
"step": 4275,
"valid_targets_mean": 2944.4,
"valid_targets_min": 897
},
{
"epoch": 4.495798319327731,
"grad_norm": 0.7287294839891085,
"learning_rate": 1.3682313775332186e-05,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2306896150112152,
"step": 4280,
"valid_targets_mean": 3085.3,
"valid_targets_min": 1312
},
{
"epoch": 4.501050420168067,
"grad_norm": 0.6982921140070419,
"learning_rate": 1.3632631720168705e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20665548741817474,
"step": 4285,
"valid_targets_mean": 3413.9,
"valid_targets_min": 1469
},
{
"epoch": 4.506302521008403,
"grad_norm": 0.7131094152829368,
"learning_rate": 1.358299334990842e-05,
"loss": 0.2055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2063906341791153,
"step": 4290,
"valid_targets_mean": 2992.4,
"valid_targets_min": 1593
},
{
"epoch": 4.51155462184874,
"grad_norm": 0.7372869299957252,
"learning_rate": 1.3533399005107635e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22824421525001526,
"step": 4295,
"valid_targets_mean": 3131.6,
"valid_targets_min": 1664
},
{
"epoch": 4.516806722689076,
"grad_norm": 0.6346433949828432,
"learning_rate": 1.3483849026020603e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19013050198554993,
"step": 4300,
"valid_targets_mean": 3709.5,
"valid_targets_min": 1605
},
{
"epoch": 4.522058823529412,
"grad_norm": 0.6754439443280119,
"learning_rate": 1.3434343752597199e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22575265169143677,
"step": 4305,
"valid_targets_mean": 3649.6,
"valid_targets_min": 1737
},
{
"epoch": 4.527310924369748,
"grad_norm": 0.6967616700028672,
"learning_rate": 1.3384883524480576e-05,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22875870764255524,
"step": 4310,
"valid_targets_mean": 3512.8,
"valid_targets_min": 1817
},
{
"epoch": 4.532563025210084,
"grad_norm": 0.6886827979081415,
"learning_rate": 1.333546868100486e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20903798937797546,
"step": 4315,
"valid_targets_mean": 3413.6,
"valid_targets_min": 2026
},
{
"epoch": 4.53781512605042,
"grad_norm": 0.660189404042565,
"learning_rate": 1.3286099561192784e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21688057482242584,
"step": 4320,
"valid_targets_mean": 3905.8,
"valid_targets_min": 1214
},
{
"epoch": 4.543067226890757,
"grad_norm": 0.8043966125939357,
"learning_rate": 1.3236776503753397e-05,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14316143095493317,
"step": 4325,
"valid_targets_mean": 1467.6,
"valid_targets_min": 715
},
{
"epoch": 4.548319327731092,
"grad_norm": 0.7841054688198438,
"learning_rate": 1.3187499847079713e-05,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14375540614128113,
"step": 4330,
"valid_targets_mean": 1573.2,
"valid_targets_min": 725
},
{
"epoch": 4.553571428571429,
"grad_norm": 0.8186335723421362,
"learning_rate": 1.3138269929246427e-05,
"loss": 0.1396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15070709586143494,
"step": 4335,
"valid_targets_mean": 1469.3,
"valid_targets_min": 714
},
{
"epoch": 4.5588235294117645,
"grad_norm": 0.8679170015389952,
"learning_rate": 1.308908708800753e-05,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14169779419898987,
"step": 4340,
"valid_targets_mean": 1390.9,
"valid_targets_min": 615
},
{
"epoch": 4.564075630252101,
"grad_norm": 0.9114994147726516,
"learning_rate": 1.3039951660794063e-05,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14317017793655396,
"step": 4345,
"valid_targets_mean": 1436.4,
"valid_targets_min": 715
},
{
"epoch": 4.569327731092437,
"grad_norm": 0.8898038163908437,
"learning_rate": 1.2990863984711773e-05,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17335724830627441,
"step": 4350,
"valid_targets_mean": 1576.6,
"valid_targets_min": 625
},
{
"epoch": 4.574579831932773,
"grad_norm": 0.785064729278413,
"learning_rate": 1.294182439653878e-05,
"loss": 0.1329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12577390670776367,
"step": 4355,
"valid_targets_mean": 1400.9,
"valid_targets_min": 761
},
{
"epoch": 4.579831932773109,
"grad_norm": 0.7745818948625097,
"learning_rate": 1.2892833232723297e-05,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21761628985404968,
"step": 4360,
"valid_targets_mean": 1609.2,
"valid_targets_min": 703
},
{
"epoch": 4.5850840336134455,
"grad_norm": 0.9711741060616659,
"learning_rate": 1.2843890829381303e-05,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14271649718284607,
"step": 4365,
"valid_targets_mean": 1564.4,
"valid_targets_min": 733
},
{
"epoch": 4.590336134453781,
"grad_norm": 0.8866160542903732,
"learning_rate": 1.2794997522294263e-05,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13775603473186493,
"step": 4370,
"valid_targets_mean": 1521.2,
"valid_targets_min": 835
},
{
"epoch": 4.595588235294118,
"grad_norm": 0.8231923650364629,
"learning_rate": 1.2746153646906766e-05,
"loss": 0.1282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13401484489440918,
"step": 4375,
"valid_targets_mean": 1525.2,
"valid_targets_min": 815
},
{
"epoch": 4.600840336134453,
"grad_norm": 0.8550257487811143,
"learning_rate": 1.2697359538324303e-05,
"loss": 0.1316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13395115733146667,
"step": 4380,
"valid_targets_mean": 1584.4,
"valid_targets_min": 797
},
{
"epoch": 4.60609243697479,
"grad_norm": 0.8426859205924878,
"learning_rate": 1.2648615531310907e-05,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12041187286376953,
"step": 4385,
"valid_targets_mean": 1384.5,
"valid_targets_min": 570
},
{
"epoch": 4.6113445378151265,
"grad_norm": 0.786905654669723,
"learning_rate": 1.259992196028688e-05,
"loss": 0.1232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11873074620962143,
"step": 4390,
"valid_targets_mean": 1481.8,
"valid_targets_min": 548
},
{
"epoch": 4.616596638655462,
"grad_norm": 0.8303948199867104,
"learning_rate": 1.2551279159326495e-05,
"loss": 0.1208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11647927761077881,
"step": 4395,
"valid_targets_mean": 1247.1,
"valid_targets_min": 682
},
{
"epoch": 4.621848739495798,
"grad_norm": 0.8753106179981709,
"learning_rate": 1.2502687462155709e-05,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1494443118572235,
"step": 4400,
"valid_targets_mean": 1686.6,
"valid_targets_min": 896
},
{
"epoch": 4.6271008403361344,
"grad_norm": 0.8050150714693087,
"learning_rate": 1.2454147202149865e-05,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12719589471817017,
"step": 4405,
"valid_targets_mean": 1415.3,
"valid_targets_min": 597
},
{
"epoch": 4.632352941176471,
"grad_norm": 0.8009830063907718,
"learning_rate": 1.2405658712331409e-05,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12356242537498474,
"step": 4410,
"valid_targets_mean": 1527.1,
"valid_targets_min": 706
},
{
"epoch": 4.637605042016807,
"grad_norm": 0.7347334443196466,
"learning_rate": 1.2357222325367604e-05,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11749774217605591,
"step": 4415,
"valid_targets_mean": 1439.2,
"valid_targets_min": 754
},
{
"epoch": 4.642857142857143,
"grad_norm": 0.8064940468859054,
"learning_rate": 1.2308838373568249e-05,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12089011818170547,
"step": 4420,
"valid_targets_mean": 1403.5,
"valid_targets_min": 785
},
{
"epoch": 4.648109243697479,
"grad_norm": 0.7972098191885254,
"learning_rate": 1.2260507188883395e-05,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12170597910881042,
"step": 4425,
"valid_targets_mean": 1499.6,
"valid_targets_min": 617
},
{
"epoch": 4.6533613445378155,
"grad_norm": 0.975037389066893,
"learning_rate": 1.2212229102901077e-05,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13412654399871826,
"step": 4430,
"valid_targets_mean": 1218.8,
"valid_targets_min": 648
},
{
"epoch": 4.658613445378151,
"grad_norm": 0.8641754817962347,
"learning_rate": 1.2164004446845037e-05,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13030359148979187,
"step": 4435,
"valid_targets_mean": 1603.4,
"valid_targets_min": 1184
},
{
"epoch": 4.663865546218488,
"grad_norm": 0.9180121006760533,
"learning_rate": 1.2115833551572438e-05,
"loss": 0.1216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12268111109733582,
"step": 4440,
"valid_targets_mean": 1407.5,
"valid_targets_min": 774
},
{
"epoch": 4.669117647058823,
"grad_norm": 0.8547903927275693,
"learning_rate": 1.2067716747571616e-05,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13655883073806763,
"step": 4445,
"valid_targets_mean": 1627.1,
"valid_targets_min": 734
},
{
"epoch": 4.67436974789916,
"grad_norm": 0.881631394330736,
"learning_rate": 1.201965436495978e-05,
"loss": 0.1273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12907208502292633,
"step": 4450,
"valid_targets_mean": 1424.6,
"valid_targets_min": 1004
},
{
"epoch": 4.679621848739496,
"grad_norm": 0.8063717130180919,
"learning_rate": 1.1971646733480784e-05,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13420622050762177,
"step": 4455,
"valid_targets_mean": 1478.4,
"valid_targets_min": 803
},
{
"epoch": 4.684873949579832,
"grad_norm": 0.8260967863457012,
"learning_rate": 1.1923694182502848e-05,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11544696986675262,
"step": 4460,
"valid_targets_mean": 1341.6,
"valid_targets_min": 782
},
{
"epoch": 4.690126050420168,
"grad_norm": 0.8029075297918149,
"learning_rate": 1.1875797041016286e-05,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12873606383800507,
"step": 4465,
"valid_targets_mean": 1627.8,
"valid_targets_min": 646
},
{
"epoch": 4.695378151260504,
"grad_norm": 0.8998520655105815,
"learning_rate": 1.1827955637631283e-05,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14146029949188232,
"step": 4470,
"valid_targets_mean": 1465.2,
"valid_targets_min": 591
},
{
"epoch": 4.70063025210084,
"grad_norm": 0.9673884965286654,
"learning_rate": 1.1780170300575602e-05,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15864944458007812,
"step": 4475,
"valid_targets_mean": 1623.8,
"valid_targets_min": 796
},
{
"epoch": 4.705882352941177,
"grad_norm": 0.8028753858678307,
"learning_rate": 1.1732441357692353e-05,
"loss": 0.1197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11006323993206024,
"step": 4480,
"valid_targets_mean": 1318.8,
"valid_targets_min": 848
},
{
"epoch": 4.711134453781512,
"grad_norm": 0.7757517539215945,
"learning_rate": 1.1684769136437742e-05,
"loss": 0.1238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1143508329987526,
"step": 4485,
"valid_targets_mean": 1281.6,
"valid_targets_min": 665
},
{
"epoch": 4.716386554621849,
"grad_norm": 0.8198556072030991,
"learning_rate": 1.1637153963878815e-05,
"loss": 0.1189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10272709280252457,
"step": 4490,
"valid_targets_mean": 1267.4,
"valid_targets_min": 640
},
{
"epoch": 4.7216386554621845,
"grad_norm": 0.993622221837871,
"learning_rate": 1.1589596166691231e-05,
"loss": 0.1259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14048606157302856,
"step": 4495,
"valid_targets_mean": 1505.4,
"valid_targets_min": 662
},
{
"epoch": 4.726890756302521,
"grad_norm": 0.9175391246008294,
"learning_rate": 1.1542096071157012e-05,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12400451302528381,
"step": 4500,
"valid_targets_mean": 1243.3,
"valid_targets_min": 724
},
{
"epoch": 4.732142857142857,
"grad_norm": 0.8780528943864113,
"learning_rate": 1.1494654003162285e-05,
"loss": 0.1243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12478488683700562,
"step": 4505,
"valid_targets_mean": 1371.4,
"valid_targets_min": 924
},
{
"epoch": 4.737394957983193,
"grad_norm": 1.0957377833225224,
"learning_rate": 1.1447270288195089e-05,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1323080062866211,
"step": 4510,
"valid_targets_mean": 1497.8,
"valid_targets_min": 773
},
{
"epoch": 4.742647058823529,
"grad_norm": 0.9093558038524169,
"learning_rate": 1.1399945251343114e-05,
"loss": 0.1237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14012199640274048,
"step": 4515,
"valid_targets_mean": 1446.2,
"valid_targets_min": 692
},
{
"epoch": 4.7478991596638656,
"grad_norm": 0.8399340996586211,
"learning_rate": 1.1352679217291457e-05,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10750658810138702,
"step": 4520,
"valid_targets_mean": 1165.6,
"valid_targets_min": 776
},
{
"epoch": 4.753151260504202,
"grad_norm": 0.8065610789721998,
"learning_rate": 1.1305472510320419e-05,
"loss": 0.1192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12666700780391693,
"step": 4525,
"valid_targets_mean": 1593.9,
"valid_targets_min": 634
},
{
"epoch": 4.758403361344538,
"grad_norm": 0.825002414616717,
"learning_rate": 1.1258325454303286e-05,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13277189433574677,
"step": 4530,
"valid_targets_mean": 1652.5,
"valid_targets_min": 573
},
{
"epoch": 4.7636554621848735,
"grad_norm": 0.8052034847245988,
"learning_rate": 1.1211238372704073e-05,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12504729628562927,
"step": 4535,
"valid_targets_mean": 1694.2,
"valid_targets_min": 754
},
{
"epoch": 4.76890756302521,
"grad_norm": 0.7944186688073329,
"learning_rate": 1.1164211588575339e-05,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11452824622392654,
"step": 4540,
"valid_targets_mean": 1335.4,
"valid_targets_min": 763
},
{
"epoch": 4.774159663865547,
"grad_norm": 0.9867441295496705,
"learning_rate": 1.1117245424555967e-05,
"loss": 0.1213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12596900761127472,
"step": 4545,
"valid_targets_mean": 1470.9,
"valid_targets_min": 956
},
{
"epoch": 4.779411764705882,
"grad_norm": 0.9111318412419092,
"learning_rate": 1.1070340202868915e-05,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12238766252994537,
"step": 4550,
"valid_targets_mean": 1322.6,
"valid_targets_min": 676
},
{
"epoch": 4.784663865546219,
"grad_norm": 0.9026375196081591,
"learning_rate": 1.1023496245319056e-05,
"loss": 0.1254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12969665229320526,
"step": 4555,
"valid_targets_mean": 1267.3,
"valid_targets_min": 780
},
{
"epoch": 4.7899159663865545,
"grad_norm": 0.8044017655815434,
"learning_rate": 1.0976713873290925e-05,
"loss": 0.1178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11323502659797668,
"step": 4560,
"valid_targets_mean": 1303.4,
"valid_targets_min": 677
},
{
"epoch": 4.795168067226891,
"grad_norm": 0.8200442636224358,
"learning_rate": 1.0929993407746543e-05,
"loss": 0.1178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10392217338085175,
"step": 4565,
"valid_targets_mean": 1200.9,
"valid_targets_min": 727
},
{
"epoch": 4.800420168067227,
"grad_norm": 0.839175470474291,
"learning_rate": 1.0883335169223212e-05,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13048666715621948,
"step": 4570,
"valid_targets_mean": 1514.3,
"valid_targets_min": 726
},
{
"epoch": 4.805672268907563,
"grad_norm": 0.8992567495172576,
"learning_rate": 1.0836739477831297e-05,
"loss": 0.1282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13388502597808838,
"step": 4575,
"valid_targets_mean": 1504.9,
"valid_targets_min": 669
},
{
"epoch": 4.810924369747899,
"grad_norm": 0.8667203247346105,
"learning_rate": 1.0790206653252055e-05,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12979502975940704,
"step": 4580,
"valid_targets_mean": 1499.6,
"valid_targets_min": 750
},
{
"epoch": 4.8161764705882355,
"grad_norm": 0.8236209984599626,
"learning_rate": 1.0743737014735434e-05,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11989112198352814,
"step": 4585,
"valid_targets_mean": 1397.2,
"valid_targets_min": 736
},
{
"epoch": 4.821428571428571,
"grad_norm": 0.8603157391015415,
"learning_rate": 1.0697330881097857e-05,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1339968591928482,
"step": 4590,
"valid_targets_mean": 1373.4,
"valid_targets_min": 694
},
{
"epoch": 4.826680672268908,
"grad_norm": 0.8846127818913729,
"learning_rate": 1.0650988570720077e-05,
"loss": 0.1246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13660481572151184,
"step": 4595,
"valid_targets_mean": 1546.9,
"valid_targets_min": 727
},
{
"epoch": 4.831932773109243,
"grad_norm": 0.8465612563420826,
"learning_rate": 1.0604710401544963e-05,
"loss": 0.1193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11273416876792908,
"step": 4600,
"valid_targets_mean": 1265.4,
"valid_targets_min": 809
},
{
"epoch": 4.83718487394958,
"grad_norm": 0.8108208139117962,
"learning_rate": 1.0558496691075318e-05,
"loss": 0.123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11026652157306671,
"step": 4605,
"valid_targets_mean": 1368.5,
"valid_targets_min": 684
},
{
"epoch": 4.842436974789916,
"grad_norm": 0.8597461483981371,
"learning_rate": 1.0512347756371726e-05,
"loss": 0.1148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12328451871871948,
"step": 4610,
"valid_targets_mean": 1360.0,
"valid_targets_min": 750
},
{
"epoch": 4.847689075630252,
"grad_norm": 0.8960809913992954,
"learning_rate": 1.0466263914050362e-05,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1297706663608551,
"step": 4615,
"valid_targets_mean": 1508.2,
"valid_targets_min": 818
},
{
"epoch": 4.852941176470588,
"grad_norm": 0.8624681465534092,
"learning_rate": 1.0420245480280804e-05,
"loss": 0.124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13054832816123962,
"step": 4620,
"valid_targets_mean": 1582.8,
"valid_targets_min": 665
},
{
"epoch": 4.858193277310924,
"grad_norm": 0.9437920037528255,
"learning_rate": 1.0374292770783891e-05,
"loss": 0.1205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14127075672149658,
"step": 4625,
"valid_targets_mean": 1475.8,
"valid_targets_min": 1093
},
{
"epoch": 4.86344537815126,
"grad_norm": 0.8557418798703278,
"learning_rate": 1.0328406100829542e-05,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1389474719762802,
"step": 4630,
"valid_targets_mean": 1493.8,
"valid_targets_min": 632
},
{
"epoch": 4.868697478991597,
"grad_norm": 0.87445714339707,
"learning_rate": 1.0282585785234578e-05,
"loss": 0.1263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13523709774017334,
"step": 4635,
"valid_targets_mean": 1507.4,
"valid_targets_min": 700
},
{
"epoch": 4.873949579831933,
"grad_norm": 0.8287344010980091,
"learning_rate": 1.023683213836061e-05,
"loss": 0.122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11704841256141663,
"step": 4640,
"valid_targets_mean": 1353.1,
"valid_targets_min": 810
},
{
"epoch": 4.879201680672269,
"grad_norm": 0.8509384511271177,
"learning_rate": 1.0191145474111823e-05,
"loss": 0.1225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11140401661396027,
"step": 4645,
"valid_targets_mean": 1293.3,
"valid_targets_min": 589
},
{
"epoch": 4.884453781512605,
"grad_norm": 0.9759630950705781,
"learning_rate": 1.0145526105932872e-05,
"loss": 0.1235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13949152827262878,
"step": 4650,
"valid_targets_mean": 1433.0,
"valid_targets_min": 750
},
{
"epoch": 4.889705882352941,
"grad_norm": 0.9316341415558835,
"learning_rate": 1.0099974346806714e-05,
"loss": 0.1242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12794744968414307,
"step": 4655,
"valid_targets_mean": 1385.1,
"valid_targets_min": 641
},
{
"epoch": 4.894957983193278,
"grad_norm": 0.8801743318163907,
"learning_rate": 1.0054490509252423e-05,
"loss": 0.1221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1252344250679016,
"step": 4660,
"valid_targets_mean": 1543.5,
"valid_targets_min": 701
},
{
"epoch": 4.900210084033613,
"grad_norm": 0.8895967821752813,
"learning_rate": 1.0009074905323118e-05,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12817296385765076,
"step": 4665,
"valid_targets_mean": 1708.4,
"valid_targets_min": 1202
},
{
"epoch": 4.90546218487395,
"grad_norm": 0.803668498672539,
"learning_rate": 9.963727846603784e-06,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12417686730623245,
"step": 4670,
"valid_targets_mean": 1497.2,
"valid_targets_min": 770
},
{
"epoch": 4.910714285714286,
"grad_norm": 0.8209572965038717,
"learning_rate": 9.918449644209087e-06,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11642634868621826,
"step": 4675,
"valid_targets_mean": 1333.4,
"valid_targets_min": 646
},
{
"epoch": 4.915966386554622,
"grad_norm": 0.9106589305140345,
"learning_rate": 9.873240608781341e-06,
"loss": 0.1266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.126824289560318,
"step": 4680,
"valid_targets_mean": 1260.1,
"valid_targets_min": 723
},
{
"epoch": 4.921218487394958,
"grad_norm": 0.8246969179034082,
"learning_rate": 9.828101050488308e-06,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11583910137414932,
"step": 4685,
"valid_targets_mean": 1421.8,
"valid_targets_min": 808
},
{
"epoch": 4.926470588235294,
"grad_norm": 0.9467345871410094,
"learning_rate": 9.783031279021063e-06,
"loss": 0.1272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.121206134557724,
"step": 4690,
"valid_targets_mean": 1255.4,
"valid_targets_min": 634
},
{
"epoch": 4.93172268907563,
"grad_norm": 0.8946786916723871,
"learning_rate": 9.738031603591926e-06,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12146471440792084,
"step": 4695,
"valid_targets_mean": 1334.6,
"valid_targets_min": 821
},
{
"epoch": 4.936974789915967,
"grad_norm": 0.8415482635056759,
"learning_rate": 9.69310233293227e-06,
"loss": 0.1194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12440873682498932,
"step": 4700,
"valid_targets_mean": 1562.7,
"valid_targets_min": 849
},
{
"epoch": 4.942226890756302,
"grad_norm": 0.8253084558385871,
"learning_rate": 9.648243775290476e-06,
"loss": 0.1203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12124086171388626,
"step": 4705,
"valid_targets_mean": 1435.9,
"valid_targets_min": 781
},
{
"epoch": 4.947478991596639,
"grad_norm": 0.8212423721287204,
"learning_rate": 9.60345623842974e-06,
"loss": 0.1296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10891197621822357,
"step": 4710,
"valid_targets_mean": 1341.2,
"valid_targets_min": 567
},
{
"epoch": 4.9527310924369745,
"grad_norm": 0.7441257737363668,
"learning_rate": 9.558740029626046e-06,
"loss": 0.12,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10063184797763824,
"step": 4715,
"valid_targets_mean": 1319.9,
"valid_targets_min": 810
},
{
"epoch": 4.957983193277311,
"grad_norm": 0.8222604138587376,
"learning_rate": 9.51409545566597e-06,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12508775293827057,
"step": 4720,
"valid_targets_mean": 1657.6,
"valid_targets_min": 868
},
{
"epoch": 4.963235294117647,
"grad_norm": 0.8441572887401301,
"learning_rate": 9.469522822844663e-06,
"loss": 0.1134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12001735717058182,
"step": 4725,
"valid_targets_mean": 1566.1,
"valid_targets_min": 682
},
{
"epoch": 4.968487394957983,
"grad_norm": 0.8622442317465762,
"learning_rate": 9.425022436963664e-06,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13704422116279602,
"step": 4730,
"valid_targets_mean": 1575.5,
"valid_targets_min": 797
},
{
"epoch": 4.973739495798319,
"grad_norm": 0.8300300731222955,
"learning_rate": 9.380594603328875e-06,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11850959062576294,
"step": 4735,
"valid_targets_mean": 1568.6,
"valid_targets_min": 639
},
{
"epoch": 4.9789915966386555,
"grad_norm": 0.8820976325913817,
"learning_rate": 9.336239626748432e-06,
"loss": 0.1199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12084612995386124,
"step": 4740,
"valid_targets_mean": 1482.9,
"valid_targets_min": 920
},
{
"epoch": 4.984243697478991,
"grad_norm": 0.8235056111823619,
"learning_rate": 9.291957811530602e-06,
"loss": 0.1149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11309683322906494,
"step": 4745,
"valid_targets_mean": 1354.8,
"valid_targets_min": 847
},
{
"epoch": 4.989495798319328,
"grad_norm": 0.8380994731336534,
"learning_rate": 9.247749461481712e-06,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12259923666715622,
"step": 4750,
"valid_targets_mean": 1451.1,
"valid_targets_min": 557
},
{
"epoch": 4.994747899159664,
"grad_norm": 0.9271264619980075,
"learning_rate": 9.203614879904083e-06,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12632964551448822,
"step": 4755,
"valid_targets_mean": 1332.4,
"valid_targets_min": 645
},
{
"epoch": 5.0,
"grad_norm": 0.7766606123712497,
"learning_rate": 9.159554369593901e-06,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11304584890604019,
"step": 4760,
"valid_targets_mean": 1721.1,
"valid_targets_min": 760
},
{
"epoch": 5.005252100840337,
"grad_norm": 1.0368311360471962,
"learning_rate": 9.115568232839193e-06,
"loss": 0.2281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2315981090068817,
"step": 4765,
"valid_targets_mean": 3398.8,
"valid_targets_min": 746
},
{
"epoch": 5.010504201680672,
"grad_norm": 0.6460571203150131,
"learning_rate": 9.071656771417721e-06,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17781823873519897,
"step": 4770,
"valid_targets_mean": 4347.4,
"valid_targets_min": 1651
},
{
"epoch": 5.015756302521009,
"grad_norm": 0.542133417895063,
"learning_rate": 9.027820286594902e-06,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1896631270647049,
"step": 4775,
"valid_targets_mean": 4633.2,
"valid_targets_min": 1560
},
{
"epoch": 5.0210084033613445,
"grad_norm": 0.6608510247217927,
"learning_rate": 8.984059079121785e-06,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19018647074699402,
"step": 4780,
"valid_targets_mean": 3938.1,
"valid_targets_min": 1841
},
{
"epoch": 5.026260504201681,
"grad_norm": 0.6358924043276708,
"learning_rate": 8.940373449232935e-06,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22464792430400848,
"step": 4785,
"valid_targets_mean": 3724.8,
"valid_targets_min": 1374
},
{
"epoch": 5.031512605042017,
"grad_norm": 0.6599880706584261,
"learning_rate": 8.896763696644405e-06,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18435746431350708,
"step": 4790,
"valid_targets_mean": 3264.8,
"valid_targets_min": 1089
},
{
"epoch": 5.036764705882353,
"grad_norm": 0.7096826802832755,
"learning_rate": 8.853230120551693e-06,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21627312898635864,
"step": 4795,
"valid_targets_mean": 3374.9,
"valid_targets_min": 627
},
{
"epoch": 5.042016806722689,
"grad_norm": 0.6612340433792787,
"learning_rate": 8.809773019627635e-06,
"loss": 0.2061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21441474556922913,
"step": 4800,
"valid_targets_mean": 3514.9,
"valid_targets_min": 1574
},
{
"epoch": 5.0472689075630255,
"grad_norm": 0.6216659402671705,
"learning_rate": 8.766392692020413e-06,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21736544370651245,
"step": 4805,
"valid_targets_mean": 3956.7,
"valid_targets_min": 1899
},
{
"epoch": 5.052521008403361,
"grad_norm": 0.6397951889136652,
"learning_rate": 8.723089435351497e-06,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.213152214884758,
"step": 4810,
"valid_targets_mean": 4397.6,
"valid_targets_min": 2261
},
{
"epoch": 5.057773109243698,
"grad_norm": 0.6827468645370026,
"learning_rate": 8.679863546713559e-06,
"loss": 0.2105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19350934028625488,
"step": 4815,
"valid_targets_mean": 3263.8,
"valid_targets_min": 1873
},
{
"epoch": 5.063025210084033,
"grad_norm": 0.6432078260343645,
"learning_rate": 8.636715322668498e-06,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2112460732460022,
"step": 4820,
"valid_targets_mean": 3430.2,
"valid_targets_min": 1013
},
{
"epoch": 5.06827731092437,
"grad_norm": 0.5998462380114775,
"learning_rate": 8.593645059245365e-06,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1965964436531067,
"step": 4825,
"valid_targets_mean": 4041.6,
"valid_targets_min": 1366
},
{
"epoch": 5.073529411764706,
"grad_norm": 0.6552876974701827,
"learning_rate": 8.550653051938333e-06,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2239168882369995,
"step": 4830,
"valid_targets_mean": 3515.2,
"valid_targets_min": 2050
},
{
"epoch": 5.078781512605042,
"grad_norm": 0.7164022528196604,
"learning_rate": 8.507739595704695e-06,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21687167882919312,
"step": 4835,
"valid_targets_mean": 3048.9,
"valid_targets_min": 746
},
{
"epoch": 5.084033613445378,
"grad_norm": 0.7024986732808598,
"learning_rate": 8.464904984962832e-06,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2093815803527832,
"step": 4840,
"valid_targets_mean": 2982.6,
"valid_targets_min": 855
},
{
"epoch": 5.089285714285714,
"grad_norm": 0.6486210855345914,
"learning_rate": 8.422149513590151e-06,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22854307293891907,
"step": 4845,
"valid_targets_mean": 3753.4,
"valid_targets_min": 2125
},
{
"epoch": 5.09453781512605,
"grad_norm": 0.7106124392970365,
"learning_rate": 8.37947347492115e-06,
"loss": 0.2146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20508921146392822,
"step": 4850,
"valid_targets_mean": 2946.8,
"valid_targets_min": 1173
},
{
"epoch": 5.099789915966387,
"grad_norm": 0.7291320506136616,
"learning_rate": 8.33687716174532e-06,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20715506374835968,
"step": 4855,
"valid_targets_mean": 3284.2,
"valid_targets_min": 1438
},
{
"epoch": 5.105042016806722,
"grad_norm": 0.667621729812997,
"learning_rate": 8.294360866305192e-06,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18001650273799896,
"step": 4860,
"valid_targets_mean": 3818.4,
"valid_targets_min": 1133
},
{
"epoch": 5.110294117647059,
"grad_norm": 0.6904135635931854,
"learning_rate": 8.251924880294317e-06,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1863369643688202,
"step": 4865,
"valid_targets_mean": 3339.8,
"valid_targets_min": 1051
},
{
"epoch": 5.1155462184873945,
"grad_norm": 0.708134359007726,
"learning_rate": 8.20956949485527e-06,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2200697362422943,
"step": 4870,
"valid_targets_mean": 3285.1,
"valid_targets_min": 1642
},
{
"epoch": 5.120798319327731,
"grad_norm": 0.6714863526693571,
"learning_rate": 8.167295000577622e-06,
"loss": 0.2061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19819751381874084,
"step": 4875,
"valid_targets_mean": 3340.8,
"valid_targets_min": 1747
},
{
"epoch": 5.126050420168067,
"grad_norm": 0.6991162613090433,
"learning_rate": 8.125101687496e-06,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2069099098443985,
"step": 4880,
"valid_targets_mean": 3218.2,
"valid_targets_min": 1765
},
{
"epoch": 5.131302521008403,
"grad_norm": 0.6933394799250305,
"learning_rate": 8.082989845088038e-06,
"loss": 0.2094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20274317264556885,
"step": 4885,
"valid_targets_mean": 3182.9,
"valid_targets_min": 1233
},
{
"epoch": 5.13655462184874,
"grad_norm": 0.7022583842802075,
"learning_rate": 8.040959762272441e-06,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19732248783111572,
"step": 4890,
"valid_targets_mean": 3020.8,
"valid_targets_min": 869
},
{
"epoch": 5.141806722689076,
"grad_norm": 0.6578222367990266,
"learning_rate": 7.999011727406995e-06,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1947716623544693,
"step": 4895,
"valid_targets_mean": 3269.2,
"valid_targets_min": 926
},
{
"epoch": 5.147058823529412,
"grad_norm": 0.6729734257141221,
"learning_rate": 7.957146028286524e-06,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1842532753944397,
"step": 4900,
"valid_targets_mean": 3256.4,
"valid_targets_min": 1016
},
{
"epoch": 5.152310924369748,
"grad_norm": 0.6998982376570767,
"learning_rate": 7.915362952141017e-06,
"loss": 0.2048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19443146884441376,
"step": 4905,
"valid_targets_mean": 3058.4,
"valid_targets_min": 1367
},
{
"epoch": 5.157563025210084,
"grad_norm": 0.6159690568204116,
"learning_rate": 7.873662785633594e-06,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1794825792312622,
"step": 4910,
"valid_targets_mean": 3513.8,
"valid_targets_min": 761
},
{
"epoch": 5.16281512605042,
"grad_norm": 0.718929827088859,
"learning_rate": 7.832045814858538e-06,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19105938076972961,
"step": 4915,
"valid_targets_mean": 2834.2,
"valid_targets_min": 1480
},
{
"epoch": 5.168067226890757,
"grad_norm": 0.6775963512647579,
"learning_rate": 7.790512325339367e-06,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18776269257068634,
"step": 4920,
"valid_targets_mean": 2854.1,
"valid_targets_min": 1229
},
{
"epoch": 5.173319327731092,
"grad_norm": 0.7289317859752761,
"learning_rate": 7.74906260202685e-06,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19116216897964478,
"step": 4925,
"valid_targets_mean": 3215.8,
"valid_targets_min": 1727
},
{
"epoch": 5.178571428571429,
"grad_norm": 0.6500227003936777,
"learning_rate": 7.707696929297053e-06,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1965217888355255,
"step": 4930,
"valid_targets_mean": 3578.9,
"valid_targets_min": 1860
},
{
"epoch": 5.1838235294117645,
"grad_norm": 0.7034986881633343,
"learning_rate": 7.666415590949382e-06,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20505331456661224,
"step": 4935,
"valid_targets_mean": 3121.1,
"valid_targets_min": 1145
},
{
"epoch": 5.189075630252101,
"grad_norm": 0.8145007649387389,
"learning_rate": 7.625218870204676e-06,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20866146683692932,
"step": 4940,
"valid_targets_mean": 2910.1,
"valid_targets_min": 1195
},
{
"epoch": 5.194327731092437,
"grad_norm": 0.6372684720958994,
"learning_rate": 7.584107049703195e-06,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17585617303848267,
"step": 4945,
"valid_targets_mean": 3215.2,
"valid_targets_min": 1087
},
{
"epoch": 5.199579831932773,
"grad_norm": 0.6712839739955457,
"learning_rate": 7.5430804115027615e-06,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19442957639694214,
"step": 4950,
"valid_targets_mean": 3842.3,
"valid_targets_min": 730
},
{
"epoch": 5.204831932773109,
"grad_norm": 0.7139371019585867,
"learning_rate": 7.502139237076744e-06,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18818247318267822,
"step": 4955,
"valid_targets_mean": 3112.6,
"valid_targets_min": 1097
},
{
"epoch": 5.2100840336134455,
"grad_norm": 0.6441054449323667,
"learning_rate": 7.461283807312194e-06,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20336642861366272,
"step": 4960,
"valid_targets_mean": 3587.6,
"valid_targets_min": 1833
},
{
"epoch": 5.215336134453781,
"grad_norm": 0.7139397353122559,
"learning_rate": 7.420514402507886e-06,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21995452046394348,
"step": 4965,
"valid_targets_mean": 3660.6,
"valid_targets_min": 1182
},
{
"epoch": 5.220588235294118,
"grad_norm": 0.6921935226344126,
"learning_rate": 7.379831302372389e-06,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2377263605594635,
"step": 4970,
"valid_targets_mean": 3839.4,
"valid_targets_min": 1586
},
{
"epoch": 5.225840336134453,
"grad_norm": 0.78550496353629,
"learning_rate": 7.3392347860221556e-06,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2115703821182251,
"step": 4975,
"valid_targets_mean": 3062.7,
"valid_targets_min": 1714
},
{
"epoch": 5.23109243697479,
"grad_norm": 0.717261721079846,
"learning_rate": 7.298725131979629e-06,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2131146639585495,
"step": 4980,
"valid_targets_mean": 3611.1,
"valid_targets_min": 1504
},
{
"epoch": 5.236344537815126,
"grad_norm": 0.6319115820709261,
"learning_rate": 7.258302618171287e-06,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1644587367773056,
"step": 4985,
"valid_targets_mean": 3457.1,
"valid_targets_min": 1170
},
{
"epoch": 5.241596638655462,
"grad_norm": 0.760031676694523,
"learning_rate": 7.217967521925775e-06,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20226861536502838,
"step": 4990,
"valid_targets_mean": 3089.3,
"valid_targets_min": 1436
},
{
"epoch": 5.246848739495798,
"grad_norm": 0.9470898190916125,
"learning_rate": 7.177720119971998e-06,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19645410776138306,
"step": 4995,
"valid_targets_mean": 3257.2,
"valid_targets_min": 1302
},
{
"epoch": 5.2521008403361344,
"grad_norm": 0.706018495456836,
"learning_rate": 7.137560688437184e-06,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21298207342624664,
"step": 5000,
"valid_targets_mean": 3425.1,
"valid_targets_min": 2023
},
{
"epoch": 5.257352941176471,
"grad_norm": 0.6165263612026762,
"learning_rate": 7.097489502845047e-06,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1659245491027832,
"step": 5005,
"valid_targets_mean": 3196.4,
"valid_targets_min": 809
},
{
"epoch": 5.262605042016807,
"grad_norm": 0.7663728544419008,
"learning_rate": 7.0575068381138525e-06,
"loss": 0.211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19875086843967438,
"step": 5010,
"valid_targets_mean": 3197.8,
"valid_targets_min": 1059
},
{
"epoch": 5.267857142857143,
"grad_norm": 0.6844105981294532,
"learning_rate": 7.0176129685545414e-06,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16719815135002136,
"step": 5015,
"valid_targets_mean": 3301.7,
"valid_targets_min": 964
},
{
"epoch": 5.273109243697479,
"grad_norm": 0.6796898164555453,
"learning_rate": 6.977808167868867e-06,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1949189305305481,
"step": 5020,
"valid_targets_mean": 3694.2,
"valid_targets_min": 1105
},
{
"epoch": 5.2783613445378155,
"grad_norm": 0.8023813457851872,
"learning_rate": 6.9380927091475085e-06,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20866572856903076,
"step": 5025,
"valid_targets_mean": 2612.6,
"valid_targets_min": 1491
},
{
"epoch": 5.283613445378151,
"grad_norm": 0.762817989942347,
"learning_rate": 6.898466864868165e-06,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20279455184936523,
"step": 5030,
"valid_targets_mean": 3110.5,
"valid_targets_min": 1091
},
{
"epoch": 5.288865546218488,
"grad_norm": 0.7866878344731686,
"learning_rate": 6.858930906893751e-06,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19141477346420288,
"step": 5035,
"valid_targets_mean": 3259.2,
"valid_targets_min": 1822
},
{
"epoch": 5.294117647058823,
"grad_norm": 0.7702679497523474,
"learning_rate": 6.819485106470454e-06,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1862347275018692,
"step": 5040,
"valid_targets_mean": 3547.6,
"valid_targets_min": 1625
},
{
"epoch": 5.29936974789916,
"grad_norm": 0.6629392322076868,
"learning_rate": 6.780129734225949e-06,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17328760027885437,
"step": 5045,
"valid_targets_mean": 3628.2,
"valid_targets_min": 1415
},
{
"epoch": 5.304621848739496,
"grad_norm": 0.7042102260307026,
"learning_rate": 6.740865060167483e-06,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19156163930892944,
"step": 5050,
"valid_targets_mean": 3398.9,
"valid_targets_min": 1460
},
{
"epoch": 5.309873949579832,
"grad_norm": 0.7519060990832099,
"learning_rate": 6.701691353680049e-06,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19511482119560242,
"step": 5055,
"valid_targets_mean": 2947.4,
"valid_targets_min": 1079
},
{
"epoch": 5.315126050420168,
"grad_norm": 0.727969914435581,
"learning_rate": 6.662608883524542e-06,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18351078033447266,
"step": 5060,
"valid_targets_mean": 3003.0,
"valid_targets_min": 1274
},
{
"epoch": 5.320378151260504,
"grad_norm": 0.8817302867844496,
"learning_rate": 6.6236179178359115e-06,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21124529838562012,
"step": 5065,
"valid_targets_mean": 3306.3,
"valid_targets_min": 914
},
{
"epoch": 5.32563025210084,
"grad_norm": 0.713024621019574,
"learning_rate": 6.5847187241213e-06,
"loss": 0.2055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19047285616397858,
"step": 5070,
"valid_targets_mean": 3332.2,
"valid_targets_min": 1312
},
{
"epoch": 5.330882352941177,
"grad_norm": 0.752933122434432,
"learning_rate": 6.5459115692582386e-06,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1971365213394165,
"step": 5075,
"valid_targets_mean": 2601.3,
"valid_targets_min": 987
},
{
"epoch": 5.336134453781512,
"grad_norm": 0.624699265138433,
"learning_rate": 6.507196719492819e-06,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1911473274230957,
"step": 5080,
"valid_targets_mean": 4341.5,
"valid_targets_min": 1856
},
{
"epoch": 5.341386554621849,
"grad_norm": 0.7283950240407708,
"learning_rate": 6.468574440437801e-06,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19926682114601135,
"step": 5085,
"valid_targets_mean": 3290.9,
"valid_targets_min": 1601
},
{
"epoch": 5.3466386554621845,
"grad_norm": 0.7710715895807497,
"learning_rate": 6.43004499707089e-06,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20834487676620483,
"step": 5090,
"valid_targets_mean": 3119.4,
"valid_targets_min": 1986
},
{
"epoch": 5.351890756302521,
"grad_norm": 0.7170439306426001,
"learning_rate": 6.3916086537328545e-06,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21489310264587402,
"step": 5095,
"valid_targets_mean": 3777.1,
"valid_targets_min": 974
},
{
"epoch": 5.357142857142857,
"grad_norm": 0.6744006460741591,
"learning_rate": 6.3532656741257145e-06,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16385085880756378,
"step": 5100,
"valid_targets_mean": 2878.0,
"valid_targets_min": 512
},
{
"epoch": 5.362394957983193,
"grad_norm": 0.673275766985947,
"learning_rate": 6.315016321310965e-06,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1753840446472168,
"step": 5105,
"valid_targets_mean": 3215.4,
"valid_targets_min": 1202
},
{
"epoch": 5.367647058823529,
"grad_norm": 0.7266719247932443,
"learning_rate": 6.276860857707727e-06,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20921765267848969,
"step": 5110,
"valid_targets_mean": 3693.1,
"valid_targets_min": 1455
},
{
"epoch": 5.3728991596638656,
"grad_norm": 0.6960543396247455,
"learning_rate": 6.238799545090994e-06,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18564675748348236,
"step": 5115,
"valid_targets_mean": 3477.5,
"valid_targets_min": 1571
},
{
"epoch": 5.378151260504202,
"grad_norm": 0.789570094298452,
"learning_rate": 6.20083264458981e-06,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22905242443084717,
"step": 5120,
"valid_targets_mean": 2912.1,
"valid_targets_min": 1450
},
{
"epoch": 5.383403361344538,
"grad_norm": 0.687911349078074,
"learning_rate": 6.162960416685469e-06,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18090611696243286,
"step": 5125,
"valid_targets_mean": 3323.0,
"valid_targets_min": 1431
},
{
"epoch": 5.388655462184874,
"grad_norm": 0.8129192543706223,
"learning_rate": 6.125183121209741e-06,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2075553834438324,
"step": 5130,
"valid_targets_mean": 3461.4,
"valid_targets_min": 1147
},
{
"epoch": 5.39390756302521,
"grad_norm": 0.7873625003498075,
"learning_rate": 6.087501017343107e-06,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2097611427307129,
"step": 5135,
"valid_targets_mean": 2641.6,
"valid_targets_min": 998
},
{
"epoch": 5.399159663865547,
"grad_norm": 0.7237167630580533,
"learning_rate": 6.0499143636129384e-06,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20370076596736908,
"step": 5140,
"valid_targets_mean": 3260.9,
"valid_targets_min": 614
},
{
"epoch": 5.404411764705882,
"grad_norm": 0.85938348372471,
"learning_rate": 6.012423417891766e-06,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20711749792099,
"step": 5145,
"valid_targets_mean": 2796.2,
"valid_targets_min": 1005
},
{
"epoch": 5.409663865546219,
"grad_norm": 0.6968015629432648,
"learning_rate": 5.975028437395493e-06,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2024056762456894,
"step": 5150,
"valid_targets_mean": 3183.6,
"valid_targets_min": 2298
},
{
"epoch": 5.4149159663865545,
"grad_norm": 0.7775633759987758,
"learning_rate": 5.937729678681612e-06,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20395274460315704,
"step": 5155,
"valid_targets_mean": 2821.2,
"valid_targets_min": 617
},
{
"epoch": 5.420168067226891,
"grad_norm": 0.7494510775854252,
"learning_rate": 5.9005273976474684e-06,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18208947777748108,
"step": 5160,
"valid_targets_mean": 3265.2,
"valid_targets_min": 1665
},
{
"epoch": 5.425420168067227,
"grad_norm": 0.824725420965561,
"learning_rate": 5.8634218495285126e-06,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20658603310585022,
"step": 5165,
"valid_targets_mean": 3019.3,
"valid_targets_min": 1076
},
{
"epoch": 5.430672268907563,
"grad_norm": 0.706863386587082,
"learning_rate": 5.8264132888965155e-06,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19833385944366455,
"step": 5170,
"valid_targets_mean": 3610.8,
"valid_targets_min": 790
},
{
"epoch": 5.435924369747899,
"grad_norm": 0.7103390006031945,
"learning_rate": 5.789501969657853e-06,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1992931365966797,
"step": 5175,
"valid_targets_mean": 3255.8,
"valid_targets_min": 1728
},
{
"epoch": 5.4411764705882355,
"grad_norm": 0.6848028235034054,
"learning_rate": 5.752688145051761e-06,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18287193775177002,
"step": 5180,
"valid_targets_mean": 3377.2,
"valid_targets_min": 981
},
{
"epoch": 5.446428571428571,
"grad_norm": 0.6806365974211747,
"learning_rate": 5.715972067648561e-06,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1667267084121704,
"step": 5185,
"valid_targets_mean": 2839.1,
"valid_targets_min": 1351
},
{
"epoch": 5.451680672268908,
"grad_norm": 0.6810171841346309,
"learning_rate": 5.679353989347989e-06,
"loss": 0.1968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20622935891151428,
"step": 5190,
"valid_targets_mean": 4396.7,
"valid_targets_min": 2416
},
{
"epoch": 5.456932773109243,
"grad_norm": 0.6886243059430002,
"learning_rate": 5.642834161377408e-06,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1882258951663971,
"step": 5195,
"valid_targets_mean": 4668.6,
"valid_targets_min": 1233
},
{
"epoch": 5.46218487394958,
"grad_norm": 0.660869505715319,
"learning_rate": 5.606412834290121e-06,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1740989089012146,
"step": 5200,
"valid_targets_mean": 3936.4,
"valid_targets_min": 1524
},
{
"epoch": 5.467436974789916,
"grad_norm": 0.6389923753551053,
"learning_rate": 5.570090257963645e-06,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18670515716075897,
"step": 5205,
"valid_targets_mean": 4389.3,
"valid_targets_min": 856
},
{
"epoch": 5.472689075630252,
"grad_norm": 0.7185606904022306,
"learning_rate": 5.533866681597981e-06,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18405769765377045,
"step": 5210,
"valid_targets_mean": 3241.3,
"valid_targets_min": 906
},
{
"epoch": 5.477941176470588,
"grad_norm": 0.796159259324853,
"learning_rate": 5.497742353713928e-06,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20212048292160034,
"step": 5215,
"valid_targets_mean": 3680.4,
"valid_targets_min": 832
},
{
"epoch": 5.483193277310924,
"grad_norm": 0.6843887461039875,
"learning_rate": 5.461717522151371e-06,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1704184114933014,
"step": 5220,
"valid_targets_mean": 3168.9,
"valid_targets_min": 1484
},
{
"epoch": 5.48844537815126,
"grad_norm": 0.81830636371663,
"learning_rate": 5.4257924340675535e-06,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18880800902843475,
"step": 5225,
"valid_targets_mean": 3667.5,
"valid_targets_min": 1440
},
{
"epoch": 5.493697478991597,
"grad_norm": 0.761192266055787,
"learning_rate": 5.389967335935429e-06,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2186485230922699,
"step": 5230,
"valid_targets_mean": 3025.6,
"valid_targets_min": 1349
},
{
"epoch": 5.498949579831933,
"grad_norm": 0.7532532316921411,
"learning_rate": 5.3542424735419306e-06,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1849045306444168,
"step": 5235,
"valid_targets_mean": 2935.8,
"valid_targets_min": 1156
},
{
"epoch": 5.504201680672269,
"grad_norm": 0.7266362371210848,
"learning_rate": 5.318618091986294e-06,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17571350932121277,
"step": 5240,
"valid_targets_mean": 3190.4,
"valid_targets_min": 993
},
{
"epoch": 5.509453781512605,
"grad_norm": 0.7883604048005873,
"learning_rate": 5.283094435678398e-06,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20258891582489014,
"step": 5245,
"valid_targets_mean": 2785.6,
"valid_targets_min": 1275
},
{
"epoch": 5.514705882352941,
"grad_norm": 0.738824710435114,
"learning_rate": 5.2476717483370685e-06,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1991308033466339,
"step": 5250,
"valid_targets_mean": 3266.8,
"valid_targets_min": 1669
},
{
"epoch": 5.519957983193278,
"grad_norm": 0.7925166684746748,
"learning_rate": 5.212350272988394e-06,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1969340294599533,
"step": 5255,
"valid_targets_mean": 3357.5,
"valid_targets_min": 1710
},
{
"epoch": 5.525210084033613,
"grad_norm": 0.6825177393092328,
"learning_rate": 5.177130251964088e-06,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18405650556087494,
"step": 5260,
"valid_targets_mean": 3468.1,
"valid_targets_min": 1685
},
{
"epoch": 5.53046218487395,
"grad_norm": 0.6591391403288339,
"learning_rate": 5.1420119268998085e-06,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19749081134796143,
"step": 5265,
"valid_targets_mean": 3659.6,
"valid_targets_min": 1931
},
{
"epoch": 5.535714285714286,
"grad_norm": 0.6736986111232942,
"learning_rate": 5.106995538733488e-06,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18770131468772888,
"step": 5270,
"valid_targets_mean": 3862.3,
"valid_targets_min": 2009
},
{
"epoch": 5.540966386554622,
"grad_norm": 0.8741377267243634,
"learning_rate": 5.07208132770372e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16808158159255981,
"step": 5275,
"valid_targets_mean": 1792.6,
"valid_targets_min": 777
},
{
"epoch": 5.546218487394958,
"grad_norm": 0.8019745661839314,
"learning_rate": 5.037269533348075e-06,
"loss": 0.1325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12899786233901978,
"step": 5280,
"valid_targets_mean": 1354.7,
"valid_targets_min": 705
},
{
"epoch": 5.551470588235294,
"grad_norm": 0.9281156697299153,
"learning_rate": 5.002560394501463e-06,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13236215710639954,
"step": 5285,
"valid_targets_mean": 1556.9,
"valid_targets_min": 914
},
{
"epoch": 5.55672268907563,
"grad_norm": 0.823501068446433,
"learning_rate": 4.9679541492945135e-06,
"loss": 0.1263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11238055676221848,
"step": 5290,
"valid_targets_mean": 1397.1,
"valid_targets_min": 680
},
{
"epoch": 5.561974789915967,
"grad_norm": 0.8106452499925574,
"learning_rate": 4.933451035151913e-06,
"loss": 0.1248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12909407913684845,
"step": 5295,
"valid_targets_mean": 1698.1,
"valid_targets_min": 819
},
{
"epoch": 5.567226890756302,
"grad_norm": 0.8991107502754927,
"learning_rate": 4.899051288790806e-06,
"loss": 0.1232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12105128914117813,
"step": 5300,
"valid_targets_mean": 1393.1,
"valid_targets_min": 734
},
{
"epoch": 5.572478991596639,
"grad_norm": 0.8395119193730466,
"learning_rate": 4.86475514621916e-06,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11696095764636993,
"step": 5305,
"valid_targets_mean": 1443.1,
"valid_targets_min": 655
},
{
"epoch": 5.5777310924369745,
"grad_norm": 1.0738907935762767,
"learning_rate": 4.830562842734112e-06,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11815018951892853,
"step": 5310,
"valid_targets_mean": 1392.2,
"valid_targets_min": 737
},
{
"epoch": 5.582983193277311,
"grad_norm": 0.8292783339611027,
"learning_rate": 4.796474612920421e-06,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11230309307575226,
"step": 5315,
"valid_targets_mean": 1386.6,
"valid_targets_min": 759
},
{
"epoch": 5.588235294117647,
"grad_norm": 0.9357218955051299,
"learning_rate": 4.762490690648813e-06,
"loss": 0.1191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12718072533607483,
"step": 5320,
"valid_targets_mean": 1442.9,
"valid_targets_min": 750
},
{
"epoch": 5.593487394957983,
"grad_norm": 0.8519534800000159,
"learning_rate": 4.728611309074374e-06,
"loss": 0.119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11761420965194702,
"step": 5325,
"valid_targets_mean": 1536.1,
"valid_targets_min": 780
},
{
"epoch": 5.598739495798319,
"grad_norm": 0.8547416140469031,
"learning_rate": 4.694836700634975e-06,
"loss": 0.1162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1196620911359787,
"step": 5330,
"valid_targets_mean": 1463.1,
"valid_targets_min": 679
},
{
"epoch": 5.6039915966386555,
"grad_norm": 1.0901335325216264,
"learning_rate": 4.661167097049668e-06,
"loss": 0.1227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12231962382793427,
"step": 5335,
"valid_targets_mean": 1292.8,
"valid_targets_min": 771
},
{
"epoch": 5.609243697478991,
"grad_norm": 0.9123241183930774,
"learning_rate": 4.62760272931708e-06,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11801913380622864,
"step": 5340,
"valid_targets_mean": 1542.4,
"valid_targets_min": 878
},
{
"epoch": 5.614495798319328,
"grad_norm": 0.8570929790691967,
"learning_rate": 4.594143827713844e-06,
"loss": 0.1095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10810776799917221,
"step": 5345,
"valid_targets_mean": 1506.8,
"valid_targets_min": 942
},
{
"epoch": 5.619747899159664,
"grad_norm": 0.9539604016186798,
"learning_rate": 4.56079062179303e-06,
"loss": 0.1107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11601479351520538,
"step": 5350,
"valid_targets_mean": 1401.9,
"valid_targets_min": 675
},
{
"epoch": 5.625,
"grad_norm": 0.9114757769971337,
"learning_rate": 4.527543340382538e-06,
"loss": 0.1171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11921755969524384,
"step": 5355,
"valid_targets_mean": 1483.8,
"valid_targets_min": 892
},
{
"epoch": 5.630252100840336,
"grad_norm": 0.9360433208438923,
"learning_rate": 4.494402211583569e-06,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11960253119468689,
"step": 5360,
"valid_targets_mean": 1356.3,
"valid_targets_min": 656
},
{
"epoch": 5.635504201680672,
"grad_norm": 0.8687564177093906,
"learning_rate": 4.461367462769009e-06,
"loss": 0.1185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10865601897239685,
"step": 5365,
"valid_targets_mean": 1340.6,
"valid_targets_min": 706
},
{
"epoch": 5.640756302521009,
"grad_norm": 0.8626601637005205,
"learning_rate": 4.428439320581923e-06,
"loss": 0.1201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.119922935962677,
"step": 5370,
"valid_targets_mean": 1528.6,
"valid_targets_min": 548
},
{
"epoch": 5.6460084033613445,
"grad_norm": 1.2286926999590546,
"learning_rate": 4.3956180109339705e-06,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10904563963413239,
"step": 5375,
"valid_targets_mean": 1268.9,
"valid_targets_min": 658
},
{
"epoch": 5.651260504201681,
"grad_norm": 0.8729368734062463,
"learning_rate": 4.362903759003849e-06,
"loss": 0.1132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1106632798910141,
"step": 5380,
"valid_targets_mean": 1360.1,
"valid_targets_min": 650
},
{
"epoch": 5.656512605042017,
"grad_norm": 0.8066508995038737,
"learning_rate": 4.33029678923576e-06,
"loss": 0.1136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11501973122358322,
"step": 5385,
"valid_targets_mean": 1452.3,
"valid_targets_min": 859
},
{
"epoch": 5.661764705882353,
"grad_norm": 0.8482374901140713,
"learning_rate": 4.297797325337889e-06,
"loss": 0.1051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11828213930130005,
"step": 5390,
"valid_targets_mean": 1391.3,
"valid_targets_min": 728
},
{
"epoch": 5.667016806722689,
"grad_norm": 0.826557032894644,
"learning_rate": 4.265405590280822e-06,
"loss": 0.1104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09589506685733795,
"step": 5395,
"valid_targets_mean": 1344.4,
"valid_targets_min": 686
},
{
"epoch": 5.6722689075630255,
"grad_norm": 0.941561782597229,
"learning_rate": 4.233121806296072e-06,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12858964502811432,
"step": 5400,
"valid_targets_mean": 1545.2,
"valid_targets_min": 697
},
{
"epoch": 5.677521008403361,
"grad_norm": 0.912093405528764,
"learning_rate": 4.200946194874514e-06,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10562796890735626,
"step": 5405,
"valid_targets_mean": 1354.6,
"valid_targets_min": 779
},
{
"epoch": 5.682773109243698,
"grad_norm": 0.9260849926734132,
"learning_rate": 4.168878976764872e-06,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11829014122486115,
"step": 5410,
"valid_targets_mean": 1434.1,
"valid_targets_min": 729
},
{
"epoch": 5.688025210084033,
"grad_norm": 0.826771685553631,
"learning_rate": 4.136920371972228e-06,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1030585840344429,
"step": 5415,
"valid_targets_mean": 1388.2,
"valid_targets_min": 868
},
{
"epoch": 5.69327731092437,
"grad_norm": 1.6999684647726199,
"learning_rate": 4.105070599756482e-06,
"loss": 0.1163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10433146357536316,
"step": 5420,
"valid_targets_mean": 1282.3,
"valid_targets_min": 765
},
{
"epoch": 5.698529411764706,
"grad_norm": 0.8817697258847107,
"learning_rate": 4.073329878630856e-06,
"loss": 0.1127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11964145302772522,
"step": 5425,
"valid_targets_mean": 1457.2,
"valid_targets_min": 793
},
{
"epoch": 5.703781512605042,
"grad_norm": 0.8518914261076463,
"learning_rate": 4.041698426360425e-06,
"loss": 0.1157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11360062658786774,
"step": 5430,
"valid_targets_mean": 1448.5,
"valid_targets_min": 806
},
{
"epoch": 5.709033613445378,
"grad_norm": 0.8301646651006851,
"learning_rate": 4.010176459960569e-06,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09808893501758575,
"step": 5435,
"valid_targets_mean": 1380.7,
"valid_targets_min": 803
},
{
"epoch": 5.714285714285714,
"grad_norm": 0.8473401775683042,
"learning_rate": 3.978764195695528e-06,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11080893129110336,
"step": 5440,
"valid_targets_mean": 1515.7,
"valid_targets_min": 660
},
{
"epoch": 5.71953781512605,
"grad_norm": 0.9100300218409771,
"learning_rate": 3.947461849076912e-06,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1048063337802887,
"step": 5445,
"valid_targets_mean": 1402.0,
"valid_targets_min": 837
},
{
"epoch": 5.724789915966387,
"grad_norm": 0.8889294607662074,
"learning_rate": 3.916269634862193e-06,
"loss": 0.1113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10396813601255417,
"step": 5450,
"valid_targets_mean": 1574.1,
"valid_targets_min": 719
},
{
"epoch": 5.730042016806722,
"grad_norm": 0.8903144486882467,
"learning_rate": 3.885187767053269e-06,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10951384902000427,
"step": 5455,
"valid_targets_mean": 1430.1,
"valid_targets_min": 765
},
{
"epoch": 5.735294117647059,
"grad_norm": 0.9031317882555354,
"learning_rate": 3.854216458894973e-06,
"loss": 0.1117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12100645154714584,
"step": 5460,
"valid_targets_mean": 1372.3,
"valid_targets_min": 727
},
{
"epoch": 5.740546218487395,
"grad_norm": 0.8606806374553407,
"learning_rate": 3.823355922873606e-06,
"loss": 0.1084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09598094969987869,
"step": 5465,
"valid_targets_mean": 1192.8,
"valid_targets_min": 655
},
{
"epoch": 5.745798319327731,
"grad_norm": 0.9625073380564342,
"learning_rate": 3.792606370715508e-06,
"loss": 0.1138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10911808162927628,
"step": 5470,
"valid_targets_mean": 1508.0,
"valid_targets_min": 669
},
{
"epoch": 5.751050420168067,
"grad_norm": 0.8921081945325963,
"learning_rate": 3.761968013385584e-06,
"loss": 0.1069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10961748659610748,
"step": 5475,
"valid_targets_mean": 1430.2,
"valid_targets_min": 1046
},
{
"epoch": 5.756302521008403,
"grad_norm": 0.9534472437981408,
"learning_rate": 3.731441061085843e-06,
"loss": 0.114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12638525664806366,
"step": 5480,
"valid_targets_mean": 1651.8,
"valid_targets_min": 692
},
{
"epoch": 5.76155462184874,
"grad_norm": 0.8796809522933133,
"learning_rate": 3.701025723253988e-06,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11247321218252182,
"step": 5485,
"valid_targets_mean": 1540.4,
"valid_targets_min": 846
},
{
"epoch": 5.766806722689076,
"grad_norm": 0.845414134902536,
"learning_rate": 3.67072220856197e-06,
"loss": 0.1172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10926534980535507,
"step": 5490,
"valid_targets_mean": 1455.1,
"valid_targets_min": 764
},
{
"epoch": 5.772058823529412,
"grad_norm": 0.8126469766696464,
"learning_rate": 3.640530724914517e-06,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10028908401727676,
"step": 5495,
"valid_targets_mean": 1497.4,
"valid_targets_min": 822
},
{
"epoch": 5.777310924369748,
"grad_norm": 0.8406164976266153,
"learning_rate": 3.61045147944777e-06,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11252301931381226,
"step": 5500,
"valid_targets_mean": 1543.8,
"valid_targets_min": 982
},
{
"epoch": 5.782563025210084,
"grad_norm": 0.9415916945254411,
"learning_rate": 3.5804846785278315e-06,
"loss": 0.1119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10923096537590027,
"step": 5505,
"valid_targets_mean": 1346.3,
"valid_targets_min": 713
},
{
"epoch": 5.78781512605042,
"grad_norm": 0.9260499456205905,
"learning_rate": 3.5506305277493326e-06,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10536296665668488,
"step": 5510,
"valid_targets_mean": 1395.7,
"valid_targets_min": 721
},
{
"epoch": 5.793067226890757,
"grad_norm": 0.8774386593252896,
"learning_rate": 3.520889231934057e-06,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10436506569385529,
"step": 5515,
"valid_targets_mean": 1290.6,
"valid_targets_min": 741
},
{
"epoch": 5.798319327731092,
"grad_norm": 0.8896778034184114,
"learning_rate": 3.4912609951295084e-06,
"loss": 0.1088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1191120520234108,
"step": 5520,
"valid_targets_mean": 1568.1,
"valid_targets_min": 734
},
{
"epoch": 5.803571428571429,
"grad_norm": 0.9421881494917845,
"learning_rate": 3.461746020607526e-06,
"loss": 0.1162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13356809318065643,
"step": 5525,
"valid_targets_mean": 1703.1,
"valid_targets_min": 744
},
{
"epoch": 5.8088235294117645,
"grad_norm": 0.9745264130361654,
"learning_rate": 3.432344510862895e-06,
"loss": 0.1158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12390495836734772,
"step": 5530,
"valid_targets_mean": 1652.8,
"valid_targets_min": 620
},
{
"epoch": 5.814075630252101,
"grad_norm": 0.8607153880999272,
"learning_rate": 3.403056667611917e-06,
"loss": 0.1093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10633715987205505,
"step": 5535,
"valid_targets_mean": 1481.8,
"valid_targets_min": 723
},
{
"epoch": 5.819327731092437,
"grad_norm": 0.9758519266902133,
"learning_rate": 3.373882691791088e-06,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10976162552833557,
"step": 5540,
"valid_targets_mean": 1686.5,
"valid_targets_min": 740
},
{
"epoch": 5.824579831932773,
"grad_norm": 0.8967263497321722,
"learning_rate": 3.344822783555679e-06,
"loss": 0.1078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10004294663667679,
"step": 5545,
"valid_targets_mean": 1345.1,
"valid_targets_min": 711
},
{
"epoch": 5.829831932773109,
"grad_norm": 1.0391240197314284,
"learning_rate": 3.315877142278363e-06,
"loss": 0.1144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11110391467809677,
"step": 5550,
"valid_targets_mean": 1619.1,
"valid_targets_min": 804
},
{
"epoch": 5.8350840336134455,
"grad_norm": 0.8413197113632568,
"learning_rate": 3.287045966547866e-06,
"loss": 0.1064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11233742535114288,
"step": 5555,
"valid_targets_mean": 1423.2,
"valid_targets_min": 674
},
{
"epoch": 5.840336134453781,
"grad_norm": 0.8505366043709849,
"learning_rate": 3.258329454167599e-06,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10158196091651917,
"step": 5560,
"valid_targets_mean": 1207.4,
"valid_targets_min": 567
},
{
"epoch": 5.845588235294118,
"grad_norm": 0.8995630860603766,
"learning_rate": 3.2297278021542833e-06,
"loss": 0.1047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11643253266811371,
"step": 5565,
"valid_targets_mean": 1542.4,
"valid_targets_min": 912
},
{
"epoch": 5.850840336134453,
"grad_norm": 0.8887960162735108,
"learning_rate": 3.201241206736614e-06,
"loss": 0.1131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11594435572624207,
"step": 5570,
"valid_targets_mean": 1591.0,
"valid_targets_min": 897
},
{
"epoch": 5.85609243697479,
"grad_norm": 1.1842033013727196,
"learning_rate": 3.1728698633539266e-06,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1004495844244957,
"step": 5575,
"valid_targets_mean": 1290.1,
"valid_targets_min": 773
},
{
"epoch": 5.8613445378151265,
"grad_norm": 0.8528216924870448,
"learning_rate": 3.1446139666548212e-06,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09786748886108398,
"step": 5580,
"valid_targets_mean": 1407.2,
"valid_targets_min": 679
},
{
"epoch": 5.866596638655462,
"grad_norm": 0.9063160104966684,
"learning_rate": 3.1164737104958707e-06,
"loss": 0.1159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11985988914966583,
"step": 5585,
"valid_targets_mean": 1600.2,
"valid_targets_min": 818
},
{
"epoch": 5.871848739495798,
"grad_norm": 0.8331809940510251,
"learning_rate": 3.0884492879402452e-06,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10528066009283066,
"step": 5590,
"valid_targets_mean": 1442.4,
"valid_targets_min": 790
},
{
"epoch": 5.8771008403361344,
"grad_norm": 0.8662258381631335,
"learning_rate": 3.0605408912564184e-06,
"loss": 0.1078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11069589108228683,
"step": 5595,
"valid_targets_mean": 1426.6,
"valid_targets_min": 592
},
{
"epoch": 5.882352941176471,
"grad_norm": 0.8059447911663884,
"learning_rate": 3.032748711916851e-06,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1017690896987915,
"step": 5600,
"valid_targets_mean": 1430.9,
"valid_targets_min": 662
},
{
"epoch": 5.887605042016807,
"grad_norm": 0.8787623158989677,
"learning_rate": 3.0050729405966495e-06,
"loss": 0.1123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11519140005111694,
"step": 5605,
"valid_targets_mean": 1412.6,
"valid_targets_min": 622
},
{
"epoch": 5.892857142857143,
"grad_norm": 1.0058669337260462,
"learning_rate": 2.9775137671722754e-06,
"loss": 0.1074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12139453738927841,
"step": 5610,
"valid_targets_mean": 1372.1,
"valid_targets_min": 667
},
{
"epoch": 5.898109243697479,
"grad_norm": 0.9818342504773482,
"learning_rate": 2.9500713807202565e-06,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1251143366098404,
"step": 5615,
"valid_targets_mean": 1628.1,
"valid_targets_min": 1012
},
{
"epoch": 5.9033613445378155,
"grad_norm": 1.0048701808002658,
"learning_rate": 2.9227459695158543e-06,
"loss": 0.1195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12856556475162506,
"step": 5620,
"valid_targets_mean": 1464.7,
"valid_targets_min": 635
},
{
"epoch": 5.908613445378151,
"grad_norm": 0.9524777797952462,
"learning_rate": 2.895537721031809e-06,
"loss": 0.1112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13392376899719238,
"step": 5625,
"valid_targets_mean": 1745.9,
"valid_targets_min": 689
},
{
"epoch": 5.913865546218488,
"grad_norm": 0.8360052998799868,
"learning_rate": 2.8684468219370364e-06,
"loss": 0.1099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09906312078237534,
"step": 5630,
"valid_targets_mean": 1129.1,
"valid_targets_min": 697
},
{
"epoch": 5.919117647058823,
"grad_norm": 0.9259328855340732,
"learning_rate": 2.841473458095334e-06,
"loss": 0.1092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12108924984931946,
"step": 5635,
"valid_targets_mean": 1624.6,
"valid_targets_min": 656
},
{
"epoch": 5.92436974789916,
"grad_norm": 0.9476207176974106,
"learning_rate": 2.8146178145641355e-06,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1358291506767273,
"step": 5640,
"valid_targets_mean": 1755.8,
"valid_targets_min": 697
},
{
"epoch": 5.929621848739496,
"grad_norm": 0.8733881430652086,
"learning_rate": 2.787880075593217e-06,
"loss": 0.1096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11107189953327179,
"step": 5645,
"valid_targets_mean": 1516.4,
"valid_targets_min": 820
},
{
"epoch": 5.934873949579832,
"grad_norm": 0.8803395218820865,
"learning_rate": 2.7612604246234355e-06,
"loss": 0.1058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10555368661880493,
"step": 5650,
"valid_targets_mean": 1391.4,
"valid_targets_min": 680
},
{
"epoch": 5.940126050420168,
"grad_norm": 0.8940529152418495,
"learning_rate": 2.7347590442854867e-06,
"loss": 0.1075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11712536960840225,
"step": 5655,
"valid_targets_mean": 1412.4,
"valid_targets_min": 778
},
{
"epoch": 5.945378151260504,
"grad_norm": 0.9009479204017542,
"learning_rate": 2.7083761163986433e-06,
"loss": 0.1185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12473637610673904,
"step": 5660,
"valid_targets_mean": 1599.6,
"valid_targets_min": 851
},
{
"epoch": 5.95063025210084,
"grad_norm": 0.8299195293692447,
"learning_rate": 2.682111821969493e-06,
"loss": 0.1072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10053186863660812,
"step": 5665,
"valid_targets_mean": 1398.4,
"valid_targets_min": 692
},
{
"epoch": 5.955882352941177,
"grad_norm": 0.8224894370809741,
"learning_rate": 2.6559663411907233e-06,
"loss": 0.1068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09880638122558594,
"step": 5670,
"valid_targets_mean": 1477.9,
"valid_targets_min": 741
},
{
"epoch": 5.961134453781512,
"grad_norm": 0.8446943544157789,
"learning_rate": 2.629939853439856e-06,
"loss": 0.1043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09644494950771332,
"step": 5675,
"valid_targets_mean": 1299.4,
"valid_targets_min": 639
},
{
"epoch": 5.966386554621849,
"grad_norm": 0.8887196740407839,
"learning_rate": 2.604032537278052e-06,
"loss": 0.1009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10244621336460114,
"step": 5680,
"valid_targets_mean": 1277.9,
"valid_targets_min": 743
},
{
"epoch": 5.9716386554621845,
"grad_norm": 0.8494276928184287,
"learning_rate": 2.5782445704488447e-06,
"loss": 0.1103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10847003012895584,
"step": 5685,
"valid_targets_mean": 1529.9,
"valid_targets_min": 610
},
{
"epoch": 5.976890756302521,
"grad_norm": 0.8658895151511194,
"learning_rate": 2.5525761298769515e-06,
"loss": 0.1061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10970406234264374,
"step": 5690,
"valid_targets_mean": 1331.6,
"valid_targets_min": 695
},
{
"epoch": 5.982142857142857,
"grad_norm": 0.9065356041104413,
"learning_rate": 2.527027391667054e-06,
"loss": 0.1048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10520265996456146,
"step": 5695,
"valid_targets_mean": 1581.9,
"valid_targets_min": 807
},
{
"epoch": 5.987394957983193,
"grad_norm": 0.9469535446284602,
"learning_rate": 2.501598531102587e-06,
"loss": 0.1059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10947225987911224,
"step": 5700,
"valid_targets_mean": 1327.6,
"valid_targets_min": 765
},
{
"epoch": 5.992647058823529,
"grad_norm": 0.9476175324156466,
"learning_rate": 2.47628972264452e-06,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11112868785858154,
"step": 5705,
"valid_targets_mean": 1346.4,
"valid_targets_min": 591
},
{
"epoch": 5.9978991596638656,
"grad_norm": 0.9233409415833587,
"learning_rate": 2.4511011399301944e-06,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10038024187088013,
"step": 5710,
"valid_targets_mean": 1483.2,
"valid_targets_min": 692
},
{
"epoch": 6.003151260504202,
"grad_norm": 1.1538573337023281,
"learning_rate": 2.4260329557721107e-06,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20704257488250732,
"step": 5715,
"valid_targets_mean": 4404.5,
"valid_targets_min": 1323
},
{
"epoch": 6.008403361344538,
"grad_norm": 1.1897027864306338,
"learning_rate": 2.4010853421567237e-06,
"loss": 0.2143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22920134663581848,
"step": 5720,
"valid_targets_mean": 4483.4,
"valid_targets_min": 1005
},
{
"epoch": 6.013655462184874,
"grad_norm": 0.8684521464937454,
"learning_rate": 2.376258470243309e-06,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19509011507034302,
"step": 5725,
"valid_targets_mean": 4502.1,
"valid_targets_min": 1509
},
{
"epoch": 6.01890756302521,
"grad_norm": 0.8037614431305709,
"learning_rate": 2.351552510362758e-06,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1814684271812439,
"step": 5730,
"valid_targets_mean": 3430.2,
"valid_targets_min": 1561
},
{
"epoch": 6.024159663865547,
"grad_norm": 0.7816962283075021,
"learning_rate": 2.326967632016406e-06,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18898342549800873,
"step": 5735,
"valid_targets_mean": 3385.4,
"valid_targets_min": 1184
},
{
"epoch": 6.029411764705882,
"grad_norm": 0.6426902354697276,
"learning_rate": 2.302504003874888e-06,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1760241985321045,
"step": 5740,
"valid_targets_mean": 3982.6,
"valid_targets_min": 1413
},
{
"epoch": 6.034663865546219,
"grad_norm": 0.632043071580013,
"learning_rate": 2.2781617937769675e-06,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19574542343616486,
"step": 5745,
"valid_targets_mean": 4911.7,
"valid_targets_min": 2160
},
{
"epoch": 6.0399159663865545,
"grad_norm": 0.7493769564211563,
"learning_rate": 2.2539411687283907e-06,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19801229238510132,
"step": 5750,
"valid_targets_mean": 3782.6,
"valid_targets_min": 1511
},
{
"epoch": 6.045168067226891,
"grad_norm": 0.7505509884796049,
"learning_rate": 2.229842294900744e-06,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20454156398773193,
"step": 5755,
"valid_targets_mean": 3030.0,
"valid_targets_min": 1462
},
{
"epoch": 6.050420168067227,
"grad_norm": 0.6430262170455331,
"learning_rate": 2.205865337630302e-06,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18196547031402588,
"step": 5760,
"valid_targets_mean": 3772.4,
"valid_targets_min": 874
},
{
"epoch": 6.055672268907563,
"grad_norm": 0.7098617069387976,
"learning_rate": 2.182010461416899e-06,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19023019075393677,
"step": 5765,
"valid_targets_mean": 3337.1,
"valid_targets_min": 953
},
{
"epoch": 6.060924369747899,
"grad_norm": 0.6552026128807007,
"learning_rate": 2.158277829922817e-06,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2095913290977478,
"step": 5770,
"valid_targets_mean": 4284.9,
"valid_targets_min": 1265
},
{
"epoch": 6.0661764705882355,
"grad_norm": 0.5640222204672125,
"learning_rate": 2.1346676059716253e-06,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19262853264808655,
"step": 5775,
"valid_targets_mean": 5010.6,
"valid_targets_min": 1596
},
{
"epoch": 6.071428571428571,
"grad_norm": 0.6700501160751591,
"learning_rate": 2.1111799515471066e-06,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2048107534646988,
"step": 5780,
"valid_targets_mean": 3490.4,
"valid_targets_min": 1759
},
{
"epoch": 6.076680672268908,
"grad_norm": 1.192594245087854,
"learning_rate": 2.0878150277921195e-06,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20699971914291382,
"step": 5785,
"valid_targets_mean": 3264.3,
"valid_targets_min": 1353
},
{
"epoch": 6.081932773109243,
"grad_norm": 0.6402893347468779,
"learning_rate": 2.064572995007492e-06,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17887401580810547,
"step": 5790,
"valid_targets_mean": 3814.6,
"valid_targets_min": 1643
},
{
"epoch": 6.08718487394958,
"grad_norm": 0.6836188652244888,
"learning_rate": 2.0414540126509274e-06,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17512783408164978,
"step": 5795,
"valid_targets_mean": 3166.1,
"valid_targets_min": 1269
},
{
"epoch": 6.092436974789916,
"grad_norm": 0.6778220747996802,
"learning_rate": 2.0184582393359253e-06,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20338422060012817,
"step": 5800,
"valid_targets_mean": 3617.4,
"valid_targets_min": 1681
},
{
"epoch": 6.097689075630252,
"grad_norm": 0.6622080466063627,
"learning_rate": 1.99558583283066e-06,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17835170030593872,
"step": 5805,
"valid_targets_mean": 3919.8,
"valid_targets_min": 1477
},
{
"epoch": 6.102941176470588,
"grad_norm": 0.7482662124846838,
"learning_rate": 1.9728369500569333e-06,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1978331208229065,
"step": 5810,
"valid_targets_mean": 3418.5,
"valid_targets_min": 662
},
{
"epoch": 6.108193277310924,
"grad_norm": 1.0158385440208195,
"learning_rate": 1.950211747089077e-06,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2101389467716217,
"step": 5815,
"valid_targets_mean": 3706.7,
"valid_targets_min": 2077
},
{
"epoch": 6.11344537815126,
"grad_norm": 0.7058981750753525,
"learning_rate": 1.927710379152881e-06,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1703696846961975,
"step": 5820,
"valid_targets_mean": 2878.1,
"valid_targets_min": 1505
},
{
"epoch": 6.118697478991597,
"grad_norm": 0.7508480855114319,
"learning_rate": 1.9053330006245452e-06,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21035335958003998,
"step": 5825,
"valid_targets_mean": 3418.0,
"valid_targets_min": 1957
},
{
"epoch": 6.123949579831933,
"grad_norm": 0.8433194225905101,
"learning_rate": 1.8830797650296006e-06,
"loss": 0.2058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25868695974349976,
"step": 5830,
"valid_targets_mean": 4106.4,
"valid_targets_min": 1704
},
{
"epoch": 6.129201680672269,
"grad_norm": 0.7590435573654869,
"learning_rate": 1.8609508250418628e-06,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2122974842786789,
"step": 5835,
"valid_targets_mean": 3046.9,
"valid_targets_min": 1422
},
{
"epoch": 6.1344537815126055,
"grad_norm": 0.685478517649954,
"learning_rate": 1.8389463324823986e-06,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1737407147884369,
"step": 5840,
"valid_targets_mean": 3447.4,
"valid_targets_min": 1603
},
{
"epoch": 6.139705882352941,
"grad_norm": 0.8161452603910854,
"learning_rate": 1.81706643831846e-06,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20304900407791138,
"step": 5845,
"valid_targets_mean": 2597.8,
"valid_targets_min": 1685
},
{
"epoch": 6.144957983193278,
"grad_norm": 0.7114292866383795,
"learning_rate": 1.7953112926624715e-06,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19642803072929382,
"step": 5850,
"valid_targets_mean": 3290.6,
"valid_targets_min": 1208
},
{
"epoch": 6.150210084033613,
"grad_norm": 0.7279693187875432,
"learning_rate": 1.7736810447709852e-06,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1854780614376068,
"step": 5855,
"valid_targets_mean": 2661.8,
"valid_targets_min": 1501
},
{
"epoch": 6.15546218487395,
"grad_norm": 0.7284805186121608,
"learning_rate": 1.7521758430436553e-06,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22248005867004395,
"step": 5860,
"valid_targets_mean": 3849.0,
"valid_targets_min": 1866
},
{
"epoch": 6.160714285714286,
"grad_norm": 0.641586434100809,
"learning_rate": 1.7307958350222366e-06,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1723538041114807,
"step": 5865,
"valid_targets_mean": 3397.9,
"valid_targets_min": 1239
},
{
"epoch": 6.165966386554622,
"grad_norm": 0.7494400065396022,
"learning_rate": 1.7095411673895545e-06,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20020216703414917,
"step": 5870,
"valid_targets_mean": 3155.5,
"valid_targets_min": 1177
},
{
"epoch": 6.171218487394958,
"grad_norm": 0.7120710111731775,
"learning_rate": 1.6884119859685034e-06,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18129676580429077,
"step": 5875,
"valid_targets_mean": 3594.5,
"valid_targets_min": 1270
},
{
"epoch": 6.176470588235294,
"grad_norm": 0.7012711548565949,
"learning_rate": 1.6674084357210562e-06,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18761314451694489,
"step": 5880,
"valid_targets_mean": 3571.2,
"valid_targets_min": 1216
},
{
"epoch": 6.18172268907563,
"grad_norm": 0.6937981892604655,
"learning_rate": 1.6465306607472608e-06,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18734653294086456,
"step": 5885,
"valid_targets_mean": 3290.8,
"valid_targets_min": 1184
},
{
"epoch": 6.186974789915967,
"grad_norm": 0.7223230217430263,
"learning_rate": 1.625778804284246e-06,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18657483160495758,
"step": 5890,
"valid_targets_mean": 2986.1,
"valid_targets_min": 1292
},
{
"epoch": 6.192226890756302,
"grad_norm": 0.703895451312637,
"learning_rate": 1.6051530087052558e-06,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18239927291870117,
"step": 5895,
"valid_targets_mean": 3485.4,
"valid_targets_min": 1639
},
{
"epoch": 6.197478991596639,
"grad_norm": 0.7220190947994646,
"learning_rate": 1.5846534155186511e-06,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19022542238235474,
"step": 5900,
"valid_targets_mean": 2959.4,
"valid_targets_min": 1394
},
{
"epoch": 6.2027310924369745,
"grad_norm": 0.7192311642483811,
"learning_rate": 1.564280165366956e-06,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20613990724086761,
"step": 5905,
"valid_targets_mean": 3428.9,
"valid_targets_min": 2280
},
{
"epoch": 6.207983193277311,
"grad_norm": 0.7691711026249906,
"learning_rate": 1.544033398025886e-06,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21603600680828094,
"step": 5910,
"valid_targets_mean": 3233.9,
"valid_targets_min": 810
},
{
"epoch": 6.213235294117647,
"grad_norm": 0.8449315953755364,
"learning_rate": 1.5239132524033951e-06,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18134553730487823,
"step": 5915,
"valid_targets_mean": 3211.6,
"valid_targets_min": 1654
},
{
"epoch": 6.218487394957983,
"grad_norm": 0.7395008703366813,
"learning_rate": 1.50391986653871e-06,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18029049038887024,
"step": 5920,
"valid_targets_mean": 3057.8,
"valid_targets_min": 584
},
{
"epoch": 6.223739495798319,
"grad_norm": 0.7120133644780183,
"learning_rate": 1.4840533776013954e-06,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20296408236026764,
"step": 5925,
"valid_targets_mean": 3572.6,
"valid_targets_min": 2498
},
{
"epoch": 6.2289915966386555,
"grad_norm": 0.752548834195417,
"learning_rate": 1.4643139218904035e-06,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18757691979408264,
"step": 5930,
"valid_targets_mean": 3161.1,
"valid_targets_min": 1350
},
{
"epoch": 6.234243697478991,
"grad_norm": 0.7837418288101413,
"learning_rate": 1.4447016348331477e-06,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19451862573623657,
"step": 5935,
"valid_targets_mean": 3486.1,
"valid_targets_min": 1624
},
{
"epoch": 6.239495798319328,
"grad_norm": 0.7679677373950752,
"learning_rate": 1.4252166509845777e-06,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16891759634017944,
"step": 5940,
"valid_targets_mean": 2769.6,
"valid_targets_min": 916
},
{
"epoch": 6.244747899159663,
"grad_norm": 0.6545085160769695,
"learning_rate": 1.4058591040262259e-06,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1811821609735489,
"step": 5945,
"valid_targets_mean": 3734.1,
"valid_targets_min": 2209
},
{
"epoch": 6.25,
"grad_norm": 0.7272522502400294,
"learning_rate": 1.3866291267653309e-06,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18539613485336304,
"step": 5950,
"valid_targets_mean": 3107.0,
"valid_targets_min": 1259
},
{
"epoch": 6.255252100840336,
"grad_norm": 0.6965968942209451,
"learning_rate": 1.3675268511339067e-06,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17434164881706238,
"step": 5955,
"valid_targets_mean": 3685.6,
"valid_targets_min": 1183
},
{
"epoch": 6.260504201680672,
"grad_norm": 0.7307769179047728,
"learning_rate": 1.3485524081878288e-06,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20974670350551605,
"step": 5960,
"valid_targets_mean": 3891.3,
"valid_targets_min": 1101
},
{
"epoch": 6.265756302521009,
"grad_norm": 0.7157157431884991,
"learning_rate": 1.3297059281059533e-06,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19651910662651062,
"step": 5965,
"valid_targets_mean": 3877.6,
"valid_targets_min": 1658
},
{
"epoch": 6.2710084033613445,
"grad_norm": 0.8654778291967979,
"learning_rate": 1.3109875401892146e-06,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19856885075569153,
"step": 5970,
"valid_targets_mean": 3050.1,
"valid_targets_min": 1423
},
{
"epoch": 6.276260504201681,
"grad_norm": 0.7591061487662136,
"learning_rate": 1.2923973728597373e-06,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18958264589309692,
"step": 5975,
"valid_targets_mean": 3202.4,
"valid_targets_min": 1185
},
{
"epoch": 6.281512605042017,
"grad_norm": 0.7845162142528881,
"learning_rate": 1.2739355536599508e-06,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2176717221736908,
"step": 5980,
"valid_targets_mean": 3779.1,
"valid_targets_min": 1091
},
{
"epoch": 6.286764705882353,
"grad_norm": 0.7274113285487317,
"learning_rate": 1.2556022092517362e-06,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1754409372806549,
"step": 5985,
"valid_targets_mean": 3628.9,
"valid_targets_min": 1352
},
{
"epoch": 6.292016806722689,
"grad_norm": 0.6322394750569781,
"learning_rate": 1.237397465415524e-06,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19616565108299255,
"step": 5990,
"valid_targets_mean": 4061.2,
"valid_targets_min": 1535
},
{
"epoch": 6.2972689075630255,
"grad_norm": 0.7257557508034214,
"learning_rate": 1.2193214470494664e-06,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.167373925447464,
"step": 5995,
"valid_targets_mean": 2753.1,
"valid_targets_min": 854
},
{
"epoch": 6.302521008403361,
"grad_norm": 0.7431922528740501,
"learning_rate": 1.201374278168541e-06,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16021127998828888,
"step": 6000,
"valid_targets_mean": 2942.5,
"valid_targets_min": 1179
},
{
"epoch": 6.307773109243698,
"grad_norm": 0.7197510596784839,
"learning_rate": 1.1835560819037429e-06,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1804109513759613,
"step": 6005,
"valid_targets_mean": 3598.9,
"valid_targets_min": 1290
},
{
"epoch": 6.313025210084033,
"grad_norm": 0.8045418304005293,
"learning_rate": 1.1658669805012112e-06,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1749718338251114,
"step": 6010,
"valid_targets_mean": 2332.6,
"valid_targets_min": 642
},
{
"epoch": 6.31827731092437,
"grad_norm": 0.7127205041558864,
"learning_rate": 1.1483070953213904e-06,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18035557866096497,
"step": 6015,
"valid_targets_mean": 3670.2,
"valid_targets_min": 1764
},
{
"epoch": 6.323529411764706,
"grad_norm": 0.8051860130698884,
"learning_rate": 1.130876546838211e-06,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2282528579235077,
"step": 6020,
"valid_targets_mean": 3528.6,
"valid_targets_min": 1410
},
{
"epoch": 6.328781512605042,
"grad_norm": 0.7625429310294065,
"learning_rate": 1.1135754546382627e-06,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19633427262306213,
"step": 6025,
"valid_targets_mean": 3147.7,
"valid_targets_min": 1683
},
{
"epoch": 6.334033613445378,
"grad_norm": 0.7138024696131663,
"learning_rate": 1.0964039374199564e-06,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19841980934143066,
"step": 6030,
"valid_targets_mean": 3632.5,
"valid_targets_min": 996
},
{
"epoch": 6.339285714285714,
"grad_norm": 0.7688382202900614,
"learning_rate": 1.07936211299273e-06,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18963909149169922,
"step": 6035,
"valid_targets_mean": 3135.3,
"valid_targets_min": 1349
},
{
"epoch": 6.34453781512605,
"grad_norm": 0.7341808809524797,
"learning_rate": 1.0624500982762376e-06,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2044352889060974,
"step": 6040,
"valid_targets_mean": 3391.6,
"valid_targets_min": 1248
},
{
"epoch": 6.349789915966387,
"grad_norm": 0.7221599296550733,
"learning_rate": 1.045668009299523e-06,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17875009775161743,
"step": 6045,
"valid_targets_mean": 3323.4,
"valid_targets_min": 1445
},
{
"epoch": 6.355042016806722,
"grad_norm": 0.7155618590130363,
"learning_rate": 1.029015961200266e-06,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17386895418167114,
"step": 6050,
"valid_targets_mean": 3134.3,
"valid_targets_min": 2000
},
{
"epoch": 6.360294117647059,
"grad_norm": 0.8696023819163883,
"learning_rate": 1.012494068223946e-06,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18593569099903107,
"step": 6055,
"valid_targets_mean": 2828.3,
"valid_targets_min": 1197
},
{
"epoch": 6.3655462184873945,
"grad_norm": 0.7145375703144178,
"learning_rate": 9.961024437230948e-07,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18828941881656647,
"step": 6060,
"valid_targets_mean": 3219.0,
"valid_targets_min": 1223
},
{
"epoch": 6.370798319327731,
"grad_norm": 0.7434045401240451,
"learning_rate": 9.798412001565038e-07,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17213355004787445,
"step": 6065,
"valid_targets_mean": 3199.2,
"valid_targets_min": 869
},
{
"epoch": 6.376050420168067,
"grad_norm": 0.760275705548783,
"learning_rate": 9.63710449088453e-07,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19253242015838623,
"step": 6070,
"valid_targets_mean": 2817.8,
"valid_targets_min": 1603
},
{
"epoch": 6.381302521008403,
"grad_norm": 0.729204870471661,
"learning_rate": 9.477103011879408e-07,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17323127388954163,
"step": 6075,
"valid_targets_mean": 2942.2,
"valid_targets_min": 1135
},
{
"epoch": 6.38655462184874,
"grad_norm": 0.7069419195201837,
"learning_rate": 9.318408662279399e-07,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21406994760036469,
"step": 6080,
"valid_targets_mean": 4077.0,
"valid_targets_min": 1994
},
{
"epoch": 6.391806722689076,
"grad_norm": 0.7466628023501196,
"learning_rate": 9.161022530846253e-07,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16813525557518005,
"step": 6085,
"valid_targets_mean": 3060.1,
"valid_targets_min": 1066
},
{
"epoch": 6.397058823529412,
"grad_norm": 0.7366467317633626,
"learning_rate": 9.004945697366452e-07,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20294198393821716,
"step": 6090,
"valid_targets_mean": 3687.4,
"valid_targets_min": 1211
},
{
"epoch": 6.402310924369748,
"grad_norm": 0.7660213872137742,
"learning_rate": 8.850179232643641e-07,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1757078468799591,
"step": 6095,
"valid_targets_mean": 2972.2,
"valid_targets_min": 1195
},
{
"epoch": 6.407563025210084,
"grad_norm": 0.8448238623784213,
"learning_rate": 8.696724198491369e-07,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18741391599178314,
"step": 6100,
"valid_targets_mean": 2429.5,
"valid_targets_min": 484
},
{
"epoch": 6.41281512605042,
"grad_norm": 0.7208665843891413,
"learning_rate": 8.544581647725825e-07,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2011285126209259,
"step": 6105,
"valid_targets_mean": 3851.9,
"valid_targets_min": 1257
},
{
"epoch": 6.418067226890757,
"grad_norm": 0.7164569848209156,
"learning_rate": 8.393752624158603e-07,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17893822491168976,
"step": 6110,
"valid_targets_mean": 3483.2,
"valid_targets_min": 1372
},
{
"epoch": 6.423319327731092,
"grad_norm": 0.7706889942916458,
"learning_rate": 8.244238162589435e-07,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19799582660198212,
"step": 6115,
"valid_targets_mean": 3186.8,
"valid_targets_min": 1769
},
{
"epoch": 6.428571428571429,
"grad_norm": 0.7885866860059115,
"learning_rate": 8.096039288799251e-07,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18775229156017303,
"step": 6120,
"valid_targets_mean": 3407.6,
"valid_targets_min": 1074
},
{
"epoch": 6.4338235294117645,
"grad_norm": 0.6919907540962501,
"learning_rate": 7.949157019543064e-07,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1812029927968979,
"step": 6125,
"valid_targets_mean": 3796.4,
"valid_targets_min": 980
},
{
"epoch": 6.439075630252101,
"grad_norm": 0.7918341376555602,
"learning_rate": 7.803592362542911e-07,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20236995816230774,
"step": 6130,
"valid_targets_mean": 2808.1,
"valid_targets_min": 793
},
{
"epoch": 6.444327731092437,
"grad_norm": 0.7965898165350053,
"learning_rate": 7.659346316481086e-07,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22702500224113464,
"step": 6135,
"valid_targets_mean": 3677.5,
"valid_targets_min": 1471
},
{
"epoch": 6.449579831932773,
"grad_norm": 0.7266460626729361,
"learning_rate": 7.516419870993296e-07,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16017696261405945,
"step": 6140,
"valid_targets_mean": 3032.6,
"valid_targets_min": 1353
},
{
"epoch": 6.454831932773109,
"grad_norm": 0.7762725308287282,
"learning_rate": 7.374814006661667e-07,
"loss": 0.1851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17704874277114868,
"step": 6145,
"valid_targets_mean": 2601.9,
"valid_targets_min": 1084
},
{
"epoch": 6.4600840336134455,
"grad_norm": 0.6779697306222039,
"learning_rate": 7.234529695008241e-07,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17760631442070007,
"step": 6150,
"valid_targets_mean": 3280.8,
"valid_targets_min": 1428
},
{
"epoch": 6.465336134453781,
"grad_norm": 0.8121257910719274,
"learning_rate": 7.095567898488175e-07,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1856568455696106,
"step": 6155,
"valid_targets_mean": 3229.4,
"valid_targets_min": 1193
},
{
"epoch": 6.470588235294118,
"grad_norm": 0.7371997769488223,
"learning_rate": 6.957929570483224e-07,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17043937742710114,
"step": 6160,
"valid_targets_mean": 3519.2,
"valid_targets_min": 1614
},
{
"epoch": 6.475840336134453,
"grad_norm": 0.6638062829293753,
"learning_rate": 6.821615655295155e-07,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16736310720443726,
"step": 6165,
"valid_targets_mean": 3699.1,
"valid_targets_min": 974
},
{
"epoch": 6.48109243697479,
"grad_norm": 0.7220475008819989,
"learning_rate": 6.686627088139253e-07,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14820286631584167,
"step": 6170,
"valid_targets_mean": 2730.4,
"valid_targets_min": 1575
},
{
"epoch": 6.486344537815126,
"grad_norm": 0.6962914540227392,
"learning_rate": 6.552964795137895e-07,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18003645539283752,
"step": 6175,
"valid_targets_mean": 3345.0,
"valid_targets_min": 1697
},
{
"epoch": 6.491596638655462,
"grad_norm": 0.7440882846707011,
"learning_rate": 6.420629693314317e-07,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19298087060451508,
"step": 6180,
"valid_targets_mean": 3602.2,
"valid_targets_min": 1970
},
{
"epoch": 6.496848739495798,
"grad_norm": 0.7715353825685302,
"learning_rate": 6.289622690586151e-07,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18994097411632538,
"step": 6185,
"valid_targets_mean": 3128.4,
"valid_targets_min": 887
},
{
"epoch": 6.5021008403361344,
"grad_norm": 0.8887946663567943,
"learning_rate": 6.159944685759289e-07,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1865498125553131,
"step": 6190,
"valid_targets_mean": 2712.2,
"valid_targets_min": 1279
},
{
"epoch": 6.507352941176471,
"grad_norm": 0.6867564122848154,
"learning_rate": 6.031596568521792e-07,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1672389805316925,
"step": 6195,
"valid_targets_mean": 3052.6,
"valid_targets_min": 1021
},
{
"epoch": 6.512605042016807,
"grad_norm": 0.8081151613494477,
"learning_rate": 5.904579219437567e-07,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1853436529636383,
"step": 6200,
"valid_targets_mean": 3352.1,
"valid_targets_min": 654
},
{
"epoch": 6.517857142857143,
"grad_norm": 0.8297017876682581,
"learning_rate": 5.778893509940497e-07,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2378537356853485,
"step": 6205,
"valid_targets_mean": 2860.6,
"valid_targets_min": 1039
},
{
"epoch": 6.523109243697479,
"grad_norm": 0.7037062721004519,
"learning_rate": 5.654540302328526e-07,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17788448929786682,
"step": 6210,
"valid_targets_mean": 3742.9,
"valid_targets_min": 2459
},
{
"epoch": 6.5283613445378155,
"grad_norm": 0.6751043734055584,
"learning_rate": 5.531520449757465e-07,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16557300090789795,
"step": 6215,
"valid_targets_mean": 3435.8,
"valid_targets_min": 1276
},
{
"epoch": 6.533613445378151,
"grad_norm": 0.6332717965969442,
"learning_rate": 5.409834796235447e-07,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17843201756477356,
"step": 6220,
"valid_targets_mean": 4335.8,
"valid_targets_min": 1572
},
{
"epoch": 6.538865546218488,
"grad_norm": 0.7540653616743905,
"learning_rate": 5.28948417661701e-07,
"loss": 0.1847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1931922882795334,
"step": 6225,
"valid_targets_mean": 2975.5,
"valid_targets_min": 791
},
{
"epoch": 6.544117647058823,
"grad_norm": 0.945825539132947,
"learning_rate": 5.170469416597223e-07,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1272469162940979,
"step": 6230,
"valid_targets_mean": 1444.9,
"valid_targets_min": 740
},
{
"epoch": 6.54936974789916,
"grad_norm": 0.9201038959571372,
"learning_rate": 5.05279133270633e-07,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12720605731010437,
"step": 6235,
"valid_targets_mean": 1456.5,
"valid_targets_min": 612
},
{
"epoch": 6.554621848739496,
"grad_norm": 0.9294548695403332,
"learning_rate": 4.936450732303866e-07,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12623611092567444,
"step": 6240,
"valid_targets_mean": 1432.6,
"valid_targets_min": 826
},
{
"epoch": 6.559873949579832,
"grad_norm": 0.81095763836755,
"learning_rate": 4.821448413573237e-07,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11129063367843628,
"step": 6245,
"valid_targets_mean": 1432.6,
"valid_targets_min": 742
},
{
"epoch": 6.565126050420168,
"grad_norm": 0.8336053499869773,
"learning_rate": 4.70778516551631e-07,
"loss": 0.123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11743263155221939,
"step": 6250,
"valid_targets_mean": 1387.0,
"valid_targets_min": 718
},
{
"epoch": 6.570378151260504,
"grad_norm": 0.8189714574359003,
"learning_rate": 4.595461767947829e-07,
"loss": 0.1256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12419360131025314,
"step": 6255,
"valid_targets_mean": 1527.4,
"valid_targets_min": 764
},
{
"epoch": 6.57563025210084,
"grad_norm": 0.8726128195536536,
"learning_rate": 4.484478991490249e-07,
"loss": 0.108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10007977485656738,
"step": 6260,
"valid_targets_mean": 1353.6,
"valid_targets_min": 725
},
{
"epoch": 6.580882352941177,
"grad_norm": 0.9528237066239539,
"learning_rate": 4.374837597568338e-07,
"loss": 0.1271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10588499903678894,
"step": 6265,
"valid_targets_mean": 1309.9,
"valid_targets_min": 610
},
{
"epoch": 6.586134453781512,
"grad_norm": 0.773375907639893,
"learning_rate": 4.266538338403936e-07,
"loss": 0.1134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1066712811589241,
"step": 6270,
"valid_targets_mean": 1465.4,
"valid_targets_min": 720
},
{
"epoch": 6.591386554621849,
"grad_norm": 0.7447038454026255,
"learning_rate": 4.159581957010894e-07,
"loss": 0.1176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10983015596866608,
"step": 6275,
"valid_targets_mean": 1379.4,
"valid_targets_min": 615
},
{
"epoch": 6.5966386554621845,
"grad_norm": 0.8705541079832045,
"learning_rate": 4.0539691871898545e-07,
"loss": 0.1092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10850921273231506,
"step": 6280,
"valid_targets_mean": 1158.2,
"valid_targets_min": 593
},
{
"epoch": 6.601890756302521,
"grad_norm": 0.9416604661089228,
"learning_rate": 3.949700753523344e-07,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1087367981672287,
"step": 6285,
"valid_targets_mean": 1543.1,
"valid_targets_min": 704
},
{
"epoch": 6.607142857142857,
"grad_norm": 0.7499389879872029,
"learning_rate": 3.8467773713707134e-07,
"loss": 0.1101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0929175540804863,
"step": 6290,
"valid_targets_mean": 1300.1,
"valid_targets_min": 722
},
{
"epoch": 6.612394957983193,
"grad_norm": 0.7928586147639457,
"learning_rate": 3.7451997468632486e-07,
"loss": 0.1076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10093091428279877,
"step": 6295,
"valid_targets_mean": 1401.3,
"valid_targets_min": 642
},
{
"epoch": 6.617647058823529,
"grad_norm": 0.9017571609664792,
"learning_rate": 3.6449685768993327e-07,
"loss": 0.1058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11259915679693222,
"step": 6300,
"valid_targets_mean": 1436.8,
"valid_targets_min": 518
},
{
"epoch": 6.6228991596638656,
"grad_norm": 0.8365779847032611,
"learning_rate": 3.5460845491396944e-07,
"loss": 0.1145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12376931309700012,
"step": 6305,
"valid_targets_mean": 1531.6,
"valid_targets_min": 728
},
{
"epoch": 6.628151260504202,
"grad_norm": 0.889104983252716,
"learning_rate": 3.448548342002589e-07,
"loss": 0.1106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1163712590932846,
"step": 6310,
"valid_targets_mean": 1469.6,
"valid_targets_min": 764
},
{
"epoch": 6.633403361344538,
"grad_norm": 0.8740557078182234,
"learning_rate": 3.352360624659312e-07,
"loss": 0.1176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12843522429466248,
"step": 6315,
"valid_targets_mean": 1437.8,
"valid_targets_min": 818
},
{
"epoch": 6.6386554621848735,
"grad_norm": 0.8792645901441288,
"learning_rate": 3.2575220570294276e-07,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11173952370882034,
"step": 6320,
"valid_targets_mean": 1327.3,
"valid_targets_min": 625
},
{
"epoch": 6.64390756302521,
"grad_norm": 0.8115595326058354,
"learning_rate": 3.164033289776369e-07,
"loss": 0.1138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12014767527580261,
"step": 6325,
"valid_targets_mean": 1685.2,
"valid_targets_min": 790
},
{
"epoch": 6.649159663865547,
"grad_norm": 0.9521276969718082,
"learning_rate": 3.071894964302935e-07,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12036529183387756,
"step": 6330,
"valid_targets_mean": 1595.3,
"valid_targets_min": 891
},
{
"epoch": 6.654411764705882,
"grad_norm": 0.7903280323515541,
"learning_rate": 2.981107712746867e-07,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09706208854913712,
"step": 6335,
"valid_targets_mean": 1381.1,
"valid_targets_min": 719
},
{
"epoch": 6.659663865546219,
"grad_norm": 0.8355498112239595,
"learning_rate": 2.891672157976522e-07,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10185357928276062,
"step": 6340,
"valid_targets_mean": 1345.7,
"valid_targets_min": 657
},
{
"epoch": 6.6649159663865545,
"grad_norm": 0.8948565870788178,
"learning_rate": 2.803588913586608e-07,
"loss": 0.1052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10712474584579468,
"step": 6345,
"valid_targets_mean": 1342.1,
"valid_targets_min": 783
},
{
"epoch": 6.670168067226891,
"grad_norm": 0.8221625640757199,
"learning_rate": 2.716858583894033e-07,
"loss": 0.1075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10669823735952377,
"step": 6350,
"valid_targets_mean": 1450.6,
"valid_targets_min": 629
},
{
"epoch": 6.675420168067227,
"grad_norm": 0.8413623877263701,
"learning_rate": 2.6314817639335964e-07,
"loss": 0.109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11155045032501221,
"step": 6355,
"valid_targets_mean": 1461.3,
"valid_targets_min": 678
},
{
"epoch": 6.680672268907563,
"grad_norm": 0.8587976871867034,
"learning_rate": 2.547459039454103e-07,
"loss": 0.1128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.120185486972332,
"step": 6360,
"valid_targets_mean": 1723.1,
"valid_targets_min": 1075
},
{
"epoch": 6.685924369747899,
"grad_norm": 0.92862789354394,
"learning_rate": 2.4647909869142117e-07,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1129080206155777,
"step": 6365,
"valid_targets_mean": 1669.1,
"valid_targets_min": 816
},
{
"epoch": 6.6911764705882355,
"grad_norm": 0.8365500928151788,
"learning_rate": 2.3834781734784817e-07,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11981870979070663,
"step": 6370,
"valid_targets_mean": 1521.4,
"valid_targets_min": 957
},
{
"epoch": 6.696428571428571,
"grad_norm": 0.8689676540452689,
"learning_rate": 2.3035211570135995e-07,
"loss": 0.1085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09756392240524292,
"step": 6375,
"valid_targets_mean": 1282.1,
"valid_targets_min": 643
},
{
"epoch": 6.701680672268908,
"grad_norm": 0.9369896336428621,
"learning_rate": 2.224920486084403e-07,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10868951678276062,
"step": 6380,
"valid_targets_mean": 1499.7,
"valid_targets_min": 726
},
{
"epoch": 6.706932773109243,
"grad_norm": 0.8236205446292434,
"learning_rate": 2.1476766999502408e-07,
"loss": 0.1034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11456996202468872,
"step": 6385,
"valid_targets_mean": 1621.1,
"valid_targets_min": 705
},
{
"epoch": 6.71218487394958,
"grad_norm": 0.8914772064174625,
"learning_rate": 2.071790328561152e-07,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11084552109241486,
"step": 6390,
"valid_targets_mean": 1390.9,
"valid_targets_min": 700
},
{
"epoch": 6.717436974789916,
"grad_norm": 0.847420104124652,
"learning_rate": 1.997261892554403e-07,
"loss": 0.0992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09959986060857773,
"step": 6395,
"valid_targets_mean": 1254.4,
"valid_targets_min": 627
},
{
"epoch": 6.722689075630252,
"grad_norm": 0.874119271608596,
"learning_rate": 1.9240919032506688e-07,
"loss": 0.1089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10325537621974945,
"step": 6400,
"valid_targets_mean": 1479.2,
"valid_targets_min": 817
},
{
"epoch": 6.727941176470588,
"grad_norm": 0.8485613033201405,
"learning_rate": 1.8522808626507683e-07,
"loss": 0.1064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11246100813150406,
"step": 6405,
"valid_targets_mean": 1464.4,
"valid_targets_min": 974
},
{
"epoch": 6.733193277310924,
"grad_norm": 0.8500768031572533,
"learning_rate": 1.781829263432111e-07,
"loss": 0.1057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10820727050304413,
"step": 6410,
"valid_targets_mean": 1381.2,
"valid_targets_min": 657
},
{
"epoch": 6.73844537815126,
"grad_norm": 1.0070862147853497,
"learning_rate": 1.7127375889452569e-07,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10374858230352402,
"step": 6415,
"valid_targets_mean": 1486.0,
"valid_targets_min": 746
},
{
"epoch": 6.743697478991597,
"grad_norm": 0.9783876731250509,
"learning_rate": 1.6450063132107396e-07,
"loss": 0.1081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11519736051559448,
"step": 6420,
"valid_targets_mean": 1459.7,
"valid_targets_min": 739
},
{
"epoch": 6.748949579831933,
"grad_norm": 0.8259991898073508,
"learning_rate": 1.5786359009156928e-07,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09908154606819153,
"step": 6425,
"valid_targets_mean": 1397.0,
"valid_targets_min": 682
},
{
"epoch": 6.754201680672269,
"grad_norm": 0.8592177771547324,
"learning_rate": 1.5136268074107398e-07,
"loss": 0.1029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10556816309690475,
"step": 6430,
"valid_targets_mean": 1288.8,
"valid_targets_min": 703
},
{
"epoch": 6.759453781512605,
"grad_norm": 0.876887343291053,
"learning_rate": 1.44997947870682e-07,
"loss": 0.1128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11252713203430176,
"step": 6435,
"valid_targets_mean": 1446.1,
"valid_targets_min": 864
},
{
"epoch": 6.764705882352941,
"grad_norm": 0.9653593171457929,
"learning_rate": 1.3876943514721465e-07,
"loss": 0.1151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14397484064102173,
"step": 6440,
"valid_targets_mean": 1673.2,
"valid_targets_min": 734
},
{
"epoch": 6.769957983193278,
"grad_norm": 0.8493841465052333,
"learning_rate": 1.3267718530292296e-07,
"loss": 0.1042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10939159989356995,
"step": 6445,
"valid_targets_mean": 1598.7,
"valid_targets_min": 607
},
{
"epoch": 6.775210084033613,
"grad_norm": 0.821915166356728,
"learning_rate": 1.267212401351925e-07,
"loss": 0.1029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10267669707536697,
"step": 6450,
"valid_targets_mean": 1445.2,
"valid_targets_min": 551
},
{
"epoch": 6.78046218487395,
"grad_norm": 0.9162688760398915,
"learning_rate": 1.2090164050625907e-07,
"loss": 0.1092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11637894809246063,
"step": 6455,
"valid_targets_mean": 1552.2,
"valid_targets_min": 791
},
{
"epoch": 6.785714285714286,
"grad_norm": 0.8967489554798673,
"learning_rate": 1.1521842634292013e-07,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10807375609874725,
"step": 6460,
"valid_targets_mean": 1511.6,
"valid_targets_min": 825
},
{
"epoch": 6.790966386554622,
"grad_norm": 0.8909809447006225,
"learning_rate": 1.0967163663627044e-07,
"loss": 0.1008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10812873393297195,
"step": 6465,
"valid_targets_mean": 1489.3,
"valid_targets_min": 859
},
{
"epoch": 6.796218487394958,
"grad_norm": 0.8597923475845829,
"learning_rate": 1.0426130944143353e-07,
"loss": 0.0978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09637298434972763,
"step": 6470,
"valid_targets_mean": 1356.9,
"valid_targets_min": 737
},
{
"epoch": 6.801470588235294,
"grad_norm": 0.8605974789325253,
"learning_rate": 9.898748187729513e-08,
"loss": 0.111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09894619882106781,
"step": 6475,
"valid_targets_mean": 1359.9,
"valid_targets_min": 791
},
{
"epoch": 6.80672268907563,
"grad_norm": 0.9100875928994199,
"learning_rate": 9.385019012625007e-08,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11625594645738602,
"step": 6480,
"valid_targets_mean": 1443.4,
"valid_targets_min": 724
},
{
"epoch": 6.811974789915967,
"grad_norm": 0.8583853259041662,
"learning_rate": 8.884946943395811e-08,
"loss": 0.1104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11173100769519806,
"step": 6485,
"valid_targets_mean": 1376.3,
"valid_targets_min": 944
},
{
"epoch": 6.817226890756302,
"grad_norm": 0.7696906815936799,
"learning_rate": 8.398535410910402e-08,
"loss": 0.1038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09793375432491302,
"step": 6490,
"valid_targets_mean": 1597.7,
"valid_targets_min": 802
},
{
"epoch": 6.822478991596639,
"grad_norm": 0.7990711794579531,
"learning_rate": 7.925787752314674e-08,
"loss": 0.1124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09811538457870483,
"step": 6495,
"valid_targets_mean": 1419.2,
"valid_targets_min": 740
},
{
"epoch": 6.8277310924369745,
"grad_norm": 0.7717945193131686,
"learning_rate": 7.466707211010838e-08,
"loss": 0.108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10290801525115967,
"step": 6500,
"valid_targets_mean": 1570.5,
"valid_targets_min": 881
},
{
"epoch": 6.832983193277311,
"grad_norm": 0.9330044417782807,
"learning_rate": 7.02129693663478e-08,
"loss": 0.102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10135114192962646,
"step": 6505,
"valid_targets_mean": 1177.1,
"valid_targets_min": 636
},
{
"epoch": 6.838235294117647,
"grad_norm": 0.885799823289419,
"learning_rate": 6.589559985033189e-08,
"loss": 0.1051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10052669793367386,
"step": 6510,
"valid_targets_mean": 1280.1,
"valid_targets_min": 814
},
{
"epoch": 6.843487394957983,
"grad_norm": 0.8895050648007775,
"learning_rate": 6.171499318244234e-08,
"loss": 0.0972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0963287502527237,
"step": 6515,
"valid_targets_mean": 1253.6,
"valid_targets_min": 604
},
{
"epoch": 6.848739495798319,
"grad_norm": 0.8626286788780626,
"learning_rate": 5.767117804476696e-08,
"loss": 0.108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0979156345129013,
"step": 6520,
"valid_targets_mean": 1232.8,
"valid_targets_min": 661
},
{
"epoch": 6.8539915966386555,
"grad_norm": 0.8311072710033767,
"learning_rate": 5.376418218089541e-08,
"loss": 0.109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1046762764453888,
"step": 6525,
"valid_targets_mean": 1484.8,
"valid_targets_min": 728
},
{
"epoch": 6.859243697478991,
"grad_norm": 0.9079288548187959,
"learning_rate": 4.99940323957393e-08,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11257081478834152,
"step": 6530,
"valid_targets_mean": 1383.6,
"valid_targets_min": 692
},
{
"epoch": 6.864495798319328,
"grad_norm": 0.8918440819640617,
"learning_rate": 4.63607545553435e-08,
"loss": 0.1065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10769190639257431,
"step": 6535,
"valid_targets_mean": 1386.2,
"valid_targets_min": 840
},
{
"epoch": 6.869747899159664,
"grad_norm": 0.9081288698653714,
"learning_rate": 4.2864373586706254e-08,
"loss": 0.1084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10562418401241302,
"step": 6540,
"valid_targets_mean": 1375.6,
"valid_targets_min": 772
},
{
"epoch": 6.875,
"grad_norm": 0.8331522601558252,
"learning_rate": 3.950491347761487e-08,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10698384046554565,
"step": 6545,
"valid_targets_mean": 1612.4,
"valid_targets_min": 670
},
{
"epoch": 6.880252100840336,
"grad_norm": 0.8223352044912656,
"learning_rate": 3.628239727647254e-08,
"loss": 0.1039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10564574599266052,
"step": 6550,
"valid_targets_mean": 1427.0,
"valid_targets_min": 750
},
{
"epoch": 6.885504201680672,
"grad_norm": 1.2026759527578401,
"learning_rate": 3.319684709215176e-08,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10793040692806244,
"step": 6555,
"valid_targets_mean": 1479.3,
"valid_targets_min": 766
},
{
"epoch": 6.890756302521009,
"grad_norm": 0.8039951616902973,
"learning_rate": 3.024828409383007e-08,
"loss": 0.1018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09126448631286621,
"step": 6560,
"valid_targets_mean": 1241.5,
"valid_targets_min": 729
},
{
"epoch": 6.8960084033613445,
"grad_norm": 0.8938242214668102,
"learning_rate": 2.743672851085233e-08,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11531618982553482,
"step": 6565,
"valid_targets_mean": 1410.9,
"valid_targets_min": 682
},
{
"epoch": 6.901260504201681,
"grad_norm": 0.891140302112469,
"learning_rate": 2.4762199632588634e-08,
"loss": 0.1181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11160510778427124,
"step": 6570,
"valid_targets_mean": 1569.1,
"valid_targets_min": 738
},
{
"epoch": 6.906512605042017,
"grad_norm": 0.8886137842875292,
"learning_rate": 2.2224715808309983e-08,
"loss": 0.1078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10890690982341766,
"step": 6575,
"valid_targets_mean": 1378.0,
"valid_targets_min": 731
},
{
"epoch": 6.911764705882353,
"grad_norm": 0.9367326463088681,
"learning_rate": 1.9824294447043923e-08,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13127145171165466,
"step": 6580,
"valid_targets_mean": 1620.0,
"valid_targets_min": 748
},
{
"epoch": 6.917016806722689,
"grad_norm": 0.838793196574803,
"learning_rate": 1.7560952017481313e-08,
"loss": 0.1025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09811349958181381,
"step": 6585,
"valid_targets_mean": 1355.1,
"valid_targets_min": 564
},
{
"epoch": 6.9222689075630255,
"grad_norm": 0.8347467550105157,
"learning_rate": 1.5434704047836424e-08,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09899817407131195,
"step": 6590,
"valid_targets_mean": 1419.1,
"valid_targets_min": 651
},
{
"epoch": 6.927521008403361,
"grad_norm": 0.8905919808272537,
"learning_rate": 1.344556512576256e-08,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10358569025993347,
"step": 6595,
"valid_targets_mean": 1291.7,
"valid_targets_min": 687
},
{
"epoch": 6.932773109243698,
"grad_norm": 0.8193427692652885,
"learning_rate": 1.1593548898236606e-08,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09667745232582092,
"step": 6600,
"valid_targets_mean": 1236.8,
"valid_targets_min": 703
},
{
"epoch": 6.938025210084033,
"grad_norm": 0.8054209308544474,
"learning_rate": 9.878668071474639e-09,
"loss": 0.101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08912120014429092,
"step": 6605,
"valid_targets_mean": 1258.9,
"valid_targets_min": 522
},
{
"epoch": 6.94327731092437,
"grad_norm": 0.8379632670512256,
"learning_rate": 8.3009344108409e-09,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10500848293304443,
"step": 6610,
"valid_targets_mean": 1495.5,
"valid_targets_min": 764
},
{
"epoch": 6.948529411764706,
"grad_norm": 0.9047510484875828,
"learning_rate": 6.860358740763406e-09,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12173473089933395,
"step": 6615,
"valid_targets_mean": 1421.0,
"valid_targets_min": 548
},
{
"epoch": 6.953781512605042,
"grad_norm": 0.8386152042305247,
"learning_rate": 5.55695094467179e-09,
"loss": 0.1013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11426173895597458,
"step": 6620,
"valid_targets_mean": 1487.2,
"valid_targets_min": 694
},
{
"epoch": 6.959033613445378,
"grad_norm": 0.8298195930802489,
"learning_rate": 4.3907199649151355e-09,
"loss": 0.105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10774379968643188,
"step": 6625,
"valid_targets_mean": 1512.4,
"valid_targets_min": 823
},
{
"epoch": 6.964285714285714,
"grad_norm": 0.7758294188223108,
"learning_rate": 3.361673802708687e-09,
"loss": 0.0926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08553959429264069,
"step": 6630,
"valid_targets_mean": 1375.4,
"valid_targets_min": 595
},
{
"epoch": 6.96953781512605,
"grad_norm": 0.9086042968946347,
"learning_rate": 2.469819518080563e-09,
"loss": 0.1032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11077478528022766,
"step": 6635,
"valid_targets_mean": 1401.2,
"valid_targets_min": 693
},
{
"epoch": 6.974789915966387,
"grad_norm": 1.0872068857891495,
"learning_rate": 1.7151632298140209e-09,
"loss": 0.1005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09122096002101898,
"step": 6640,
"valid_targets_mean": 1185.6,
"valid_targets_min": 720
},
{
"epoch": 6.980042016806722,
"grad_norm": 0.9264996959156637,
"learning_rate": 1.0977101154163727e-09,
"loss": 0.102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08891530334949493,
"step": 6645,
"valid_targets_mean": 1364.2,
"valid_targets_min": 685
},
{
"epoch": 6.985294117647059,
"grad_norm": 0.8282065868459698,
"learning_rate": 6.174644110767958e-10,
"loss": 0.0982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0922815352678299,
"step": 6650,
"valid_targets_mean": 1345.2,
"valid_targets_min": 658
},
{
"epoch": 6.990546218487395,
"grad_norm": 0.7963997364292627,
"learning_rate": 2.744294116419077e-10,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09688857197761536,
"step": 6655,
"valid_targets_mean": 1431.4,
"valid_targets_min": 686
},
{
"epoch": 6.995798319327731,
"grad_norm": 0.8692235718392078,
"learning_rate": 6.860747058468064e-11,
"loss": 0.1056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11209136247634888,
"step": 6660,
"valid_targets_mean": 1505.8,
"valid_targets_min": 713
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0974183976650238,
"step": 6664,
"total_flos": 1189064928198656.0,
"train_loss": 0.2180497848695996,
"train_runtime": 25724.8893,
"train_samples_per_second": 4.145,
"train_steps_per_second": 0.259,
"valid_targets_mean": 1721.1,
"valid_targets_min": 760
}
],
"logging_steps": 5,
"max_steps": 6664,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1189064928198656.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}