nl2bash-stack-undr3070 / trainer_state.json
hf-reset
Reset repository without checkpoints directories
1c387d8
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 5159,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0067842605156037995,
"grad_norm": 11.89448977442727,
"learning_rate": 3.1007751937984497e-07,
"loss": 0.7467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.753227710723877,
"step": 5,
"valid_targets_mean": 2444.9,
"valid_targets_min": 744
},
{
"epoch": 0.013568521031207599,
"grad_norm": 11.235151503546374,
"learning_rate": 6.976744186046513e-07,
"loss": 0.7355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7996399998664856,
"step": 10,
"valid_targets_mean": 2697.8,
"valid_targets_min": 1231
},
{
"epoch": 0.0203527815468114,
"grad_norm": 10.797290846276908,
"learning_rate": 1.0852713178294575e-06,
"loss": 0.7424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7481732368469238,
"step": 15,
"valid_targets_mean": 2544.7,
"valid_targets_min": 794
},
{
"epoch": 0.027137042062415198,
"grad_norm": 8.962671209264652,
"learning_rate": 1.4728682170542638e-06,
"loss": 0.721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.750222384929657,
"step": 20,
"valid_targets_mean": 2245.1,
"valid_targets_min": 869
},
{
"epoch": 0.033921302578018994,
"grad_norm": 5.830676916492257,
"learning_rate": 1.86046511627907e-06,
"loss": 0.7025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6887879371643066,
"step": 25,
"valid_targets_mean": 3070.0,
"valid_targets_min": 777
},
{
"epoch": 0.0407055630936228,
"grad_norm": 4.8564311609396285,
"learning_rate": 2.2480620155038763e-06,
"loss": 0.6958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6251484155654907,
"step": 30,
"valid_targets_mean": 2736.8,
"valid_targets_min": 721
},
{
"epoch": 0.04748982360922659,
"grad_norm": 3.646908378962616,
"learning_rate": 2.635658914728683e-06,
"loss": 0.6536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6334314942359924,
"step": 35,
"valid_targets_mean": 2762.1,
"valid_targets_min": 1005
},
{
"epoch": 0.054274084124830396,
"grad_norm": 2.9965745618812183,
"learning_rate": 3.0232558139534885e-06,
"loss": 0.612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6031469106674194,
"step": 40,
"valid_targets_mean": 2219.0,
"valid_targets_min": 584
},
{
"epoch": 0.06105834464043419,
"grad_norm": 2.746946360828467,
"learning_rate": 3.4108527131782946e-06,
"loss": 0.5748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5974681973457336,
"step": 45,
"valid_targets_mean": 2428.1,
"valid_targets_min": 819
},
{
"epoch": 0.06784260515603799,
"grad_norm": 1.5002667732002524,
"learning_rate": 3.798449612403101e-06,
"loss": 0.5401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.528899073600769,
"step": 50,
"valid_targets_mean": 2882.4,
"valid_targets_min": 924
},
{
"epoch": 0.07462686567164178,
"grad_norm": 1.1607016531427559,
"learning_rate": 4.186046511627907e-06,
"loss": 0.5035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5087602734565735,
"step": 55,
"valid_targets_mean": 2938.0,
"valid_targets_min": 1086
},
{
"epoch": 0.0814111261872456,
"grad_norm": 0.9535068201891985,
"learning_rate": 4.573643410852713e-06,
"loss": 0.4885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4569432735443115,
"step": 60,
"valid_targets_mean": 2973.9,
"valid_targets_min": 627
},
{
"epoch": 0.08819538670284939,
"grad_norm": 1.1135265052091592,
"learning_rate": 4.9612403100775195e-06,
"loss": 0.5046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5376325845718384,
"step": 65,
"valid_targets_mean": 2420.6,
"valid_targets_min": 876
},
{
"epoch": 0.09497964721845319,
"grad_norm": 0.9604258885113336,
"learning_rate": 5.348837209302326e-06,
"loss": 0.4622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44064652919769287,
"step": 70,
"valid_targets_mean": 2443.4,
"valid_targets_min": 904
},
{
"epoch": 0.10176390773405698,
"grad_norm": 0.7991192270229877,
"learning_rate": 5.736434108527133e-06,
"loss": 0.4649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4826815724372864,
"step": 75,
"valid_targets_mean": 3380.5,
"valid_targets_min": 908
},
{
"epoch": 0.10854816824966079,
"grad_norm": 0.769158116469445,
"learning_rate": 6.124031007751938e-06,
"loss": 0.4427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44103240966796875,
"step": 80,
"valid_targets_mean": 3035.8,
"valid_targets_min": 1083
},
{
"epoch": 0.11533242876526459,
"grad_norm": 0.7875257411449904,
"learning_rate": 6.511627906976745e-06,
"loss": 0.4481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4029495120048523,
"step": 85,
"valid_targets_mean": 2706.4,
"valid_targets_min": 854
},
{
"epoch": 0.12211668928086838,
"grad_norm": 0.8473139007291898,
"learning_rate": 6.899224806201551e-06,
"loss": 0.4384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45044875144958496,
"step": 90,
"valid_targets_mean": 2473.2,
"valid_targets_min": 777
},
{
"epoch": 0.12890094979647218,
"grad_norm": 0.7757846680357573,
"learning_rate": 7.286821705426357e-06,
"loss": 0.4459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4469519853591919,
"step": 95,
"valid_targets_mean": 2856.1,
"valid_targets_min": 819
},
{
"epoch": 0.13568521031207598,
"grad_norm": 0.8491234814195904,
"learning_rate": 7.674418604651164e-06,
"loss": 0.4352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.439635306596756,
"step": 100,
"valid_targets_mean": 2584.4,
"valid_targets_min": 998
},
{
"epoch": 0.14246947082767977,
"grad_norm": 0.7130925742464007,
"learning_rate": 8.06201550387597e-06,
"loss": 0.4203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4034441113471985,
"step": 105,
"valid_targets_mean": 3170.1,
"valid_targets_min": 719
},
{
"epoch": 0.14925373134328357,
"grad_norm": 0.8093168817770919,
"learning_rate": 8.449612403100775e-06,
"loss": 0.4547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4224606156349182,
"step": 110,
"valid_targets_mean": 2654.3,
"valid_targets_min": 740
},
{
"epoch": 0.1560379918588874,
"grad_norm": 0.8309738324960866,
"learning_rate": 8.837209302325582e-06,
"loss": 0.4215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43095940351486206,
"step": 115,
"valid_targets_mean": 2718.1,
"valid_targets_min": 918
},
{
"epoch": 0.1628222523744912,
"grad_norm": 0.793319858169495,
"learning_rate": 9.224806201550389e-06,
"loss": 0.4186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43605878949165344,
"step": 120,
"valid_targets_mean": 2385.8,
"valid_targets_min": 571
},
{
"epoch": 0.16960651289009498,
"grad_norm": 1.0230399253622091,
"learning_rate": 9.612403100775196e-06,
"loss": 0.4211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3982701897621155,
"step": 125,
"valid_targets_mean": 1617.4,
"valid_targets_min": 683
},
{
"epoch": 0.17639077340569878,
"grad_norm": 0.8209896026771017,
"learning_rate": 1e-05,
"loss": 0.4032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4078044891357422,
"step": 130,
"valid_targets_mean": 2368.6,
"valid_targets_min": 700
},
{
"epoch": 0.18317503392130258,
"grad_norm": 0.7095946770161736,
"learning_rate": 1.0387596899224808e-05,
"loss": 0.414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3884209394454956,
"step": 135,
"valid_targets_mean": 2926.9,
"valid_targets_min": 882
},
{
"epoch": 0.18995929443690637,
"grad_norm": 0.6958216140407364,
"learning_rate": 1.0775193798449613e-05,
"loss": 0.4256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37612026929855347,
"step": 140,
"valid_targets_mean": 3520.8,
"valid_targets_min": 1095
},
{
"epoch": 0.19674355495251017,
"grad_norm": 0.8291040584046291,
"learning_rate": 1.116279069767442e-05,
"loss": 0.4085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4283609986305237,
"step": 145,
"valid_targets_mean": 2811.3,
"valid_targets_min": 1326
},
{
"epoch": 0.20352781546811397,
"grad_norm": 0.8093278558733981,
"learning_rate": 1.1550387596899227e-05,
"loss": 0.4014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4302545189857483,
"step": 150,
"valid_targets_mean": 2660.5,
"valid_targets_min": 874
},
{
"epoch": 0.21031207598371776,
"grad_norm": 0.7238386266854082,
"learning_rate": 1.193798449612403e-05,
"loss": 0.4173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37872761487960815,
"step": 155,
"valid_targets_mean": 2928.2,
"valid_targets_min": 1407
},
{
"epoch": 0.21709633649932158,
"grad_norm": 0.7853375198765415,
"learning_rate": 1.2325581395348838e-05,
"loss": 0.4018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40379324555397034,
"step": 160,
"valid_targets_mean": 2898.9,
"valid_targets_min": 1279
},
{
"epoch": 0.22388059701492538,
"grad_norm": 0.7686517468969368,
"learning_rate": 1.2713178294573645e-05,
"loss": 0.4011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4392387270927429,
"step": 165,
"valid_targets_mean": 2946.6,
"valid_targets_min": 597
},
{
"epoch": 0.23066485753052918,
"grad_norm": 0.7993134466572939,
"learning_rate": 1.3100775193798451e-05,
"loss": 0.3991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41066741943359375,
"step": 170,
"valid_targets_mean": 2813.2,
"valid_targets_min": 1002
},
{
"epoch": 0.23744911804613297,
"grad_norm": 0.6677659446481017,
"learning_rate": 1.3488372093023257e-05,
"loss": 0.3902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3710253834724426,
"step": 175,
"valid_targets_mean": 3316.8,
"valid_targets_min": 1334
},
{
"epoch": 0.24423337856173677,
"grad_norm": 0.7909997170086058,
"learning_rate": 1.3875968992248064e-05,
"loss": 0.3856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41473937034606934,
"step": 180,
"valid_targets_mean": 2416.4,
"valid_targets_min": 715
},
{
"epoch": 0.2510176390773406,
"grad_norm": 0.8792540068344556,
"learning_rate": 1.426356589147287e-05,
"loss": 0.3846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3967583477497101,
"step": 185,
"valid_targets_mean": 2736.9,
"valid_targets_min": 640
},
{
"epoch": 0.25780189959294436,
"grad_norm": 0.7958264159408515,
"learning_rate": 1.4651162790697674e-05,
"loss": 0.4017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40616077184677124,
"step": 190,
"valid_targets_mean": 2568.8,
"valid_targets_min": 623
},
{
"epoch": 0.2645861601085482,
"grad_norm": 0.7604022300459651,
"learning_rate": 1.5038759689922481e-05,
"loss": 0.3754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33513033390045166,
"step": 195,
"valid_targets_mean": 2750.9,
"valid_targets_min": 791
},
{
"epoch": 0.27137042062415195,
"grad_norm": 0.8244610679195269,
"learning_rate": 1.542635658914729e-05,
"loss": 0.3939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38060298562049866,
"step": 200,
"valid_targets_mean": 2832.4,
"valid_targets_min": 1334
},
{
"epoch": 0.2781546811397558,
"grad_norm": 0.729183257219207,
"learning_rate": 1.5813953488372095e-05,
"loss": 0.3801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36861342191696167,
"step": 205,
"valid_targets_mean": 2902.9,
"valid_targets_min": 1030
},
{
"epoch": 0.28493894165535955,
"grad_norm": 0.8051272259035377,
"learning_rate": 1.62015503875969e-05,
"loss": 0.391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4003250300884247,
"step": 210,
"valid_targets_mean": 2374.9,
"valid_targets_min": 572
},
{
"epoch": 0.29172320217096337,
"grad_norm": 0.7887590950471755,
"learning_rate": 1.6589147286821706e-05,
"loss": 0.3754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3678756356239319,
"step": 215,
"valid_targets_mean": 3166.3,
"valid_targets_min": 1348
},
{
"epoch": 0.29850746268656714,
"grad_norm": 0.8029733763158426,
"learning_rate": 1.697674418604651e-05,
"loss": 0.3681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3723628520965576,
"step": 220,
"valid_targets_mean": 2474.6,
"valid_targets_min": 518
},
{
"epoch": 0.30529172320217096,
"grad_norm": 0.7343226056865998,
"learning_rate": 1.736434108527132e-05,
"loss": 0.3632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38321518898010254,
"step": 225,
"valid_targets_mean": 3262.1,
"valid_targets_min": 1123
},
{
"epoch": 0.3120759837177748,
"grad_norm": 0.7607257346962287,
"learning_rate": 1.7751937984496125e-05,
"loss": 0.3715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34952956438064575,
"step": 230,
"valid_targets_mean": 2810.3,
"valid_targets_min": 1113
},
{
"epoch": 0.31886024423337855,
"grad_norm": 0.8227068076920964,
"learning_rate": 1.813953488372093e-05,
"loss": 0.3819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3929305970668793,
"step": 235,
"valid_targets_mean": 2834.8,
"valid_targets_min": 1701
},
{
"epoch": 0.3256445047489824,
"grad_norm": 0.6827841124705409,
"learning_rate": 1.852713178294574e-05,
"loss": 0.3618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3641515374183655,
"step": 240,
"valid_targets_mean": 3186.5,
"valid_targets_min": 898
},
{
"epoch": 0.33242876526458615,
"grad_norm": 0.7602966954331676,
"learning_rate": 1.8914728682170544e-05,
"loss": 0.3751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3500159978866577,
"step": 245,
"valid_targets_mean": 2656.6,
"valid_targets_min": 618
},
{
"epoch": 0.33921302578018997,
"grad_norm": 0.7668023931379694,
"learning_rate": 1.9302325581395353e-05,
"loss": 0.3739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4043837785720825,
"step": 250,
"valid_targets_mean": 3122.2,
"valid_targets_min": 1390
},
{
"epoch": 0.34599728629579374,
"grad_norm": 0.7093670546464718,
"learning_rate": 1.9689922480620155e-05,
"loss": 0.3778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38684576749801636,
"step": 255,
"valid_targets_mean": 3311.2,
"valid_targets_min": 869
},
{
"epoch": 0.35278154681139756,
"grad_norm": 0.6761466382547776,
"learning_rate": 2.0077519379844963e-05,
"loss": 0.3692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34655070304870605,
"step": 260,
"valid_targets_mean": 3112.8,
"valid_targets_min": 754
},
{
"epoch": 0.35956580732700133,
"grad_norm": 0.6694834479453904,
"learning_rate": 2.046511627906977e-05,
"loss": 0.356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3410634398460388,
"step": 265,
"valid_targets_mean": 3315.6,
"valid_targets_min": 1369
},
{
"epoch": 0.36635006784260515,
"grad_norm": 0.8155424962452198,
"learning_rate": 2.0852713178294577e-05,
"loss": 0.3685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35310614109039307,
"step": 270,
"valid_targets_mean": 2339.4,
"valid_targets_min": 614
},
{
"epoch": 0.373134328358209,
"grad_norm": 0.9070653857602943,
"learning_rate": 2.1240310077519383e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3375753164291382,
"step": 275,
"valid_targets_mean": 3212.9,
"valid_targets_min": 746
},
{
"epoch": 0.37991858887381275,
"grad_norm": 0.7447980160423101,
"learning_rate": 2.1627906976744188e-05,
"loss": 0.3549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3524802327156067,
"step": 280,
"valid_targets_mean": 2781.6,
"valid_targets_min": 1074
},
{
"epoch": 0.38670284938941657,
"grad_norm": 0.910428084386681,
"learning_rate": 2.2015503875968993e-05,
"loss": 0.3546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34246036410331726,
"step": 285,
"valid_targets_mean": 2999.9,
"valid_targets_min": 656
},
{
"epoch": 0.39348710990502034,
"grad_norm": 0.6635427507067181,
"learning_rate": 2.2403100775193802e-05,
"loss": 0.3692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35911792516708374,
"step": 290,
"valid_targets_mean": 3345.4,
"valid_targets_min": 882
},
{
"epoch": 0.40027137042062416,
"grad_norm": 0.8108891809655495,
"learning_rate": 2.2790697674418607e-05,
"loss": 0.3676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36157429218292236,
"step": 295,
"valid_targets_mean": 2752.9,
"valid_targets_min": 776
},
{
"epoch": 0.40705563093622793,
"grad_norm": 0.7092963268541641,
"learning_rate": 2.3178294573643412e-05,
"loss": 0.357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3586769700050354,
"step": 300,
"valid_targets_mean": 3229.6,
"valid_targets_min": 644
},
{
"epoch": 0.41383989145183175,
"grad_norm": 0.8313919502710964,
"learning_rate": 2.356589147286822e-05,
"loss": 0.369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40778008103370667,
"step": 305,
"valid_targets_mean": 3072.8,
"valid_targets_min": 714
},
{
"epoch": 0.4206241519674355,
"grad_norm": 0.8521822829383703,
"learning_rate": 2.3953488372093023e-05,
"loss": 0.3571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38653799891471863,
"step": 310,
"valid_targets_mean": 2318.4,
"valid_targets_min": 882
},
{
"epoch": 0.42740841248303935,
"grad_norm": 0.7709743279914623,
"learning_rate": 2.434108527131783e-05,
"loss": 0.3515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36175817251205444,
"step": 315,
"valid_targets_mean": 2692.5,
"valid_targets_min": 783
},
{
"epoch": 0.43419267299864317,
"grad_norm": 0.7913741131309853,
"learning_rate": 2.4728682170542637e-05,
"loss": 0.3564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34055837988853455,
"step": 320,
"valid_targets_mean": 2549.1,
"valid_targets_min": 700
},
{
"epoch": 0.44097693351424694,
"grad_norm": 0.7251245992538848,
"learning_rate": 2.5116279069767445e-05,
"loss": 0.3424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3071543574333191,
"step": 325,
"valid_targets_mean": 2746.8,
"valid_targets_min": 1022
},
{
"epoch": 0.44776119402985076,
"grad_norm": 0.877109135791174,
"learning_rate": 2.550387596899225e-05,
"loss": 0.3515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3644331395626068,
"step": 330,
"valid_targets_mean": 2258.4,
"valid_targets_min": 731
},
{
"epoch": 0.45454545454545453,
"grad_norm": 0.7463994697165139,
"learning_rate": 2.589147286821706e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3452218770980835,
"step": 335,
"valid_targets_mean": 2618.1,
"valid_targets_min": 1032
},
{
"epoch": 0.46132971506105835,
"grad_norm": 0.826153332286381,
"learning_rate": 2.627906976744186e-05,
"loss": 0.3557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3592166006565094,
"step": 340,
"valid_targets_mean": 2649.8,
"valid_targets_min": 648
},
{
"epoch": 0.4681139755766621,
"grad_norm": 0.7556466009720993,
"learning_rate": 2.6666666666666667e-05,
"loss": 0.3796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4219163656234741,
"step": 345,
"valid_targets_mean": 2855.0,
"valid_targets_min": 721
},
{
"epoch": 0.47489823609226595,
"grad_norm": 0.7276710198296943,
"learning_rate": 2.7054263565891475e-05,
"loss": 0.3541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.333509236574173,
"step": 350,
"valid_targets_mean": 2856.6,
"valid_targets_min": 754
},
{
"epoch": 0.4816824966078697,
"grad_norm": 0.8103248615360679,
"learning_rate": 2.744186046511628e-05,
"loss": 0.3502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3477519452571869,
"step": 355,
"valid_targets_mean": 2232.4,
"valid_targets_min": 712
},
{
"epoch": 0.48846675712347354,
"grad_norm": 0.9073845669791214,
"learning_rate": 2.782945736434109e-05,
"loss": 0.3475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36534401774406433,
"step": 360,
"valid_targets_mean": 2373.4,
"valid_targets_min": 1054
},
{
"epoch": 0.49525101763907736,
"grad_norm": 0.8050927376280175,
"learning_rate": 2.8217054263565894e-05,
"loss": 0.3677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3501133620738983,
"step": 365,
"valid_targets_mean": 2434.8,
"valid_targets_min": 694
},
{
"epoch": 0.5020352781546812,
"grad_norm": 0.7660020717643617,
"learning_rate": 2.8604651162790703e-05,
"loss": 0.3492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3313218355178833,
"step": 370,
"valid_targets_mean": 2836.5,
"valid_targets_min": 1353
},
{
"epoch": 0.508819538670285,
"grad_norm": 0.7443344419339243,
"learning_rate": 2.8992248062015505e-05,
"loss": 0.3423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33690541982650757,
"step": 375,
"valid_targets_mean": 2837.2,
"valid_targets_min": 890
},
{
"epoch": 0.5156037991858887,
"grad_norm": 0.779004361301433,
"learning_rate": 2.937984496124031e-05,
"loss": 0.3473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34115269780158997,
"step": 380,
"valid_targets_mean": 2826.7,
"valid_targets_min": 662
},
{
"epoch": 0.5223880597014925,
"grad_norm": 0.9341133562668817,
"learning_rate": 2.976744186046512e-05,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3078441023826599,
"step": 385,
"valid_targets_mean": 1897.9,
"valid_targets_min": 537
},
{
"epoch": 0.5291723202170964,
"grad_norm": 0.9049226382408442,
"learning_rate": 3.0155038759689924e-05,
"loss": 0.3555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34988129138946533,
"step": 390,
"valid_targets_mean": 3014.6,
"valid_targets_min": 937
},
{
"epoch": 0.5359565807327001,
"grad_norm": 0.8125257555203335,
"learning_rate": 3.054263565891473e-05,
"loss": 0.3505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3929121792316437,
"step": 395,
"valid_targets_mean": 2705.0,
"valid_targets_min": 1179
},
{
"epoch": 0.5427408412483039,
"grad_norm": 0.7384330929303173,
"learning_rate": 3.093023255813954e-05,
"loss": 0.324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30182796716690063,
"step": 400,
"valid_targets_mean": 3520.5,
"valid_targets_min": 764
},
{
"epoch": 0.5495251017639078,
"grad_norm": 0.9344307339860809,
"learning_rate": 3.1317829457364343e-05,
"loss": 0.3489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37407636642456055,
"step": 405,
"valid_targets_mean": 2585.3,
"valid_targets_min": 1025
},
{
"epoch": 0.5563093622795116,
"grad_norm": 0.706765156270403,
"learning_rate": 3.170542635658915e-05,
"loss": 0.3633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3846889138221741,
"step": 410,
"valid_targets_mean": 3670.8,
"valid_targets_min": 1083
},
{
"epoch": 0.5630936227951153,
"grad_norm": 0.7091546038528599,
"learning_rate": 3.2093023255813954e-05,
"loss": 0.3388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2954094111919403,
"step": 415,
"valid_targets_mean": 2686.8,
"valid_targets_min": 933
},
{
"epoch": 0.5698778833107191,
"grad_norm": 0.720646680324316,
"learning_rate": 3.248062015503876e-05,
"loss": 0.359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36445194482803345,
"step": 420,
"valid_targets_mean": 3180.9,
"valid_targets_min": 978
},
{
"epoch": 0.576662143826323,
"grad_norm": 0.7561273241851728,
"learning_rate": 3.286821705426357e-05,
"loss": 0.3382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.330274760723114,
"step": 425,
"valid_targets_mean": 2636.8,
"valid_targets_min": 816
},
{
"epoch": 0.5834464043419267,
"grad_norm": 0.8694755557547249,
"learning_rate": 3.3255813953488377e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3319804072380066,
"step": 430,
"valid_targets_mean": 2225.6,
"valid_targets_min": 1286
},
{
"epoch": 0.5902306648575305,
"grad_norm": 0.68772821314539,
"learning_rate": 3.364341085271318e-05,
"loss": 0.3435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33189690113067627,
"step": 435,
"valid_targets_mean": 3022.4,
"valid_targets_min": 837
},
{
"epoch": 0.5970149253731343,
"grad_norm": 0.9588382883930207,
"learning_rate": 3.403100775193799e-05,
"loss": 0.3443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3494105339050293,
"step": 440,
"valid_targets_mean": 2476.9,
"valid_targets_min": 800
},
{
"epoch": 0.6037991858887382,
"grad_norm": 0.7838789395466246,
"learning_rate": 3.441860465116279e-05,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32996422052383423,
"step": 445,
"valid_targets_mean": 2342.1,
"valid_targets_min": 1149
},
{
"epoch": 0.6105834464043419,
"grad_norm": 0.7416365052685329,
"learning_rate": 3.48062015503876e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3227633237838745,
"step": 450,
"valid_targets_mean": 3124.1,
"valid_targets_min": 1365
},
{
"epoch": 0.6173677069199457,
"grad_norm": 0.6258235950313648,
"learning_rate": 3.51937984496124e-05,
"loss": 0.3313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29047924280166626,
"step": 455,
"valid_targets_mean": 3342.6,
"valid_targets_min": 878
},
{
"epoch": 0.6241519674355496,
"grad_norm": 0.6880630346475627,
"learning_rate": 3.5581395348837215e-05,
"loss": 0.3664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.352108359336853,
"step": 460,
"valid_targets_mean": 3073.2,
"valid_targets_min": 1075
},
{
"epoch": 0.6309362279511533,
"grad_norm": 0.7002916188745265,
"learning_rate": 3.596899224806202e-05,
"loss": 0.3412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33518415689468384,
"step": 465,
"valid_targets_mean": 2779.1,
"valid_targets_min": 1072
},
{
"epoch": 0.6377204884667571,
"grad_norm": 0.7760406431300181,
"learning_rate": 3.6356589147286826e-05,
"loss": 0.3503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32304704189300537,
"step": 470,
"valid_targets_mean": 2418.1,
"valid_targets_min": 1143
},
{
"epoch": 0.6445047489823609,
"grad_norm": 0.81128665595444,
"learning_rate": 3.674418604651163e-05,
"loss": 0.3423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35187655687332153,
"step": 475,
"valid_targets_mean": 2206.1,
"valid_targets_min": 849
},
{
"epoch": 0.6512890094979648,
"grad_norm": 0.6699530012511279,
"learning_rate": 3.7131782945736436e-05,
"loss": 0.3289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30837348103523254,
"step": 480,
"valid_targets_mean": 3204.2,
"valid_targets_min": 933
},
{
"epoch": 0.6580732700135685,
"grad_norm": 0.8161088245962455,
"learning_rate": 3.751937984496124e-05,
"loss": 0.341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3431815803050995,
"step": 485,
"valid_targets_mean": 2313.1,
"valid_targets_min": 680
},
{
"epoch": 0.6648575305291723,
"grad_norm": 0.6636433541876118,
"learning_rate": 3.7906976744186053e-05,
"loss": 0.3527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3255542516708374,
"step": 490,
"valid_targets_mean": 3133.2,
"valid_targets_min": 702
},
{
"epoch": 0.6716417910447762,
"grad_norm": 0.7193982612960406,
"learning_rate": 3.829457364341086e-05,
"loss": 0.3413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3598499894142151,
"step": 495,
"valid_targets_mean": 2609.6,
"valid_targets_min": 758
},
{
"epoch": 0.6784260515603799,
"grad_norm": 0.7893940888720667,
"learning_rate": 3.8682170542635664e-05,
"loss": 0.3461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3467223644256592,
"step": 500,
"valid_targets_mean": 2836.8,
"valid_targets_min": 1106
},
{
"epoch": 0.6852103120759837,
"grad_norm": 0.7057772565861374,
"learning_rate": 3.906976744186047e-05,
"loss": 0.3299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3372578024864197,
"step": 505,
"valid_targets_mean": 2930.9,
"valid_targets_min": 654
},
{
"epoch": 0.6919945725915875,
"grad_norm": 0.6963494863151088,
"learning_rate": 3.9457364341085275e-05,
"loss": 0.3462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3436594605445862,
"step": 510,
"valid_targets_mean": 3018.2,
"valid_targets_min": 717
},
{
"epoch": 0.6987788331071914,
"grad_norm": 0.7394424529088445,
"learning_rate": 3.984496124031008e-05,
"loss": 0.3466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3247559666633606,
"step": 515,
"valid_targets_mean": 2679.7,
"valid_targets_min": 728
},
{
"epoch": 0.7055630936227951,
"grad_norm": 0.6838375834791657,
"learning_rate": 3.9999958795491475e-05,
"loss": 0.3409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3312002420425415,
"step": 520,
"valid_targets_mean": 3034.2,
"valid_targets_min": 754
},
{
"epoch": 0.7123473541383989,
"grad_norm": 0.6067455993466966,
"learning_rate": 3.999970699077645e-05,
"loss": 0.3146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3216730058193207,
"step": 525,
"valid_targets_mean": 3705.9,
"valid_targets_min": 739
},
{
"epoch": 0.7191316146540027,
"grad_norm": 0.6985270320464033,
"learning_rate": 3.9999226275618605e-05,
"loss": 0.3366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33391982316970825,
"step": 530,
"valid_targets_mean": 2748.6,
"valid_targets_min": 869
},
{
"epoch": 0.7259158751696065,
"grad_norm": 0.7662978798224946,
"learning_rate": 3.9998516655520055e-05,
"loss": 0.3397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3417017459869385,
"step": 535,
"valid_targets_mean": 2394.5,
"valid_targets_min": 730
},
{
"epoch": 0.7327001356852103,
"grad_norm": 0.669919043363021,
"learning_rate": 3.999757813860289e-05,
"loss": 0.336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31267890334129333,
"step": 540,
"valid_targets_mean": 3009.2,
"valid_targets_min": 1030
},
{
"epoch": 0.7394843962008141,
"grad_norm": 0.7274166571678258,
"learning_rate": 3.999641073560909e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31356334686279297,
"step": 545,
"valid_targets_mean": 2435.3,
"valid_targets_min": 544
},
{
"epoch": 0.746268656716418,
"grad_norm": 0.7210784987955194,
"learning_rate": 3.999501445990039e-05,
"loss": 0.3518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.358939528465271,
"step": 550,
"valid_targets_mean": 2823.4,
"valid_targets_min": 814
},
{
"epoch": 0.7530529172320217,
"grad_norm": 0.7953791505748733,
"learning_rate": 3.9993389327458125e-05,
"loss": 0.3391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3532836139202118,
"step": 555,
"valid_targets_mean": 2465.7,
"valid_targets_min": 958
},
{
"epoch": 0.7598371777476255,
"grad_norm": 0.8035999831102332,
"learning_rate": 3.9991535356883055e-05,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3166276812553406,
"step": 560,
"valid_targets_mean": 2324.9,
"valid_targets_min": 698
},
{
"epoch": 0.7666214382632293,
"grad_norm": 0.8057221319350136,
"learning_rate": 3.9989452569395154e-05,
"loss": 0.3283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37396541237831116,
"step": 565,
"valid_targets_mean": 2373.8,
"valid_targets_min": 919
},
{
"epoch": 0.7734056987788331,
"grad_norm": 0.8130298785771777,
"learning_rate": 3.9987140988833355e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32148557901382446,
"step": 570,
"valid_targets_mean": 2525.6,
"valid_targets_min": 629
},
{
"epoch": 0.7801899592944369,
"grad_norm": 0.7048055789019534,
"learning_rate": 3.9984600641655305e-05,
"loss": 0.334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3230056166648865,
"step": 575,
"valid_targets_mean": 2960.2,
"valid_targets_min": 1018
},
{
"epoch": 0.7869742198100407,
"grad_norm": 0.7505005839634938,
"learning_rate": 3.998183155693702e-05,
"loss": 0.3561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36198025941848755,
"step": 580,
"valid_targets_mean": 2640.8,
"valid_targets_min": 720
},
{
"epoch": 0.7937584803256446,
"grad_norm": 0.5953296109502596,
"learning_rate": 3.997883376637258e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35237035155296326,
"step": 585,
"valid_targets_mean": 4056.9,
"valid_targets_min": 1333
},
{
"epoch": 0.8005427408412483,
"grad_norm": 0.6965335680749082,
"learning_rate": 3.997560730427379e-05,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.349098265171051,
"step": 590,
"valid_targets_mean": 2842.4,
"valid_targets_min": 740
},
{
"epoch": 0.8073270013568521,
"grad_norm": 0.8417459794727778,
"learning_rate": 3.99721522075697e-05,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3189961016178131,
"step": 595,
"valid_targets_mean": 2172.4,
"valid_targets_min": 584
},
{
"epoch": 0.8141112618724559,
"grad_norm": 0.8232217865179002,
"learning_rate": 3.99684685158063e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35521090030670166,
"step": 600,
"valid_targets_mean": 3057.4,
"valid_targets_min": 924
},
{
"epoch": 0.8208955223880597,
"grad_norm": 0.6415450067556615,
"learning_rate": 3.996455627114598e-05,
"loss": 0.3267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30212873220443726,
"step": 605,
"valid_targets_mean": 3003.2,
"valid_targets_min": 989
},
{
"epoch": 0.8276797829036635,
"grad_norm": 0.7030806565946134,
"learning_rate": 3.996041551836707e-05,
"loss": 0.3382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34246373176574707,
"step": 610,
"valid_targets_mean": 2909.0,
"valid_targets_min": 819
},
{
"epoch": 0.8344640434192673,
"grad_norm": 0.6504343613445783,
"learning_rate": 3.9956046304863354e-05,
"loss": 0.3362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3366634249687195,
"step": 615,
"valid_targets_mean": 3280.8,
"valid_targets_min": 563
},
{
"epoch": 0.841248303934871,
"grad_norm": 0.8323739984409763,
"learning_rate": 3.9951448680643485e-05,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31927552819252014,
"step": 620,
"valid_targets_mean": 2005.1,
"valid_targets_min": 656
},
{
"epoch": 0.8480325644504749,
"grad_norm": 0.7434853063494745,
"learning_rate": 3.994662269833044e-05,
"loss": 0.3414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33908501267433167,
"step": 625,
"valid_targets_mean": 2536.9,
"valid_targets_min": 665
},
{
"epoch": 0.8548168249660787,
"grad_norm": 0.6740114975827273,
"learning_rate": 3.994156841316093e-05,
"loss": 0.322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3202781677246094,
"step": 630,
"valid_targets_mean": 2874.8,
"valid_targets_min": 801
},
{
"epoch": 0.8616010854816825,
"grad_norm": 0.7855713565247058,
"learning_rate": 3.9936285882984723e-05,
"loss": 0.3335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34169870615005493,
"step": 635,
"valid_targets_mean": 2232.2,
"valid_targets_min": 740
},
{
"epoch": 0.8683853459972863,
"grad_norm": 0.6561553473826617,
"learning_rate": 3.993077516826403e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3322102427482605,
"step": 640,
"valid_targets_mean": 2907.2,
"valid_targets_min": 805
},
{
"epoch": 0.8751696065128901,
"grad_norm": 0.7829492620549515,
"learning_rate": 3.9925036332072775e-05,
"loss": 0.3253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32236772775650024,
"step": 645,
"valid_targets_mean": 2319.2,
"valid_targets_min": 981
},
{
"epoch": 0.8819538670284939,
"grad_norm": 0.7216603888066516,
"learning_rate": 3.99190694400959e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35016581416130066,
"step": 650,
"valid_targets_mean": 2640.7,
"valid_targets_min": 828
},
{
"epoch": 0.8887381275440976,
"grad_norm": 0.6378166749356016,
"learning_rate": 3.991287456062861e-05,
"loss": 0.3396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34149160981178284,
"step": 655,
"valid_targets_mean": 3447.8,
"valid_targets_min": 1261
},
{
"epoch": 0.8955223880597015,
"grad_norm": 0.7082789982684017,
"learning_rate": 3.9906451764575544e-05,
"loss": 0.3388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.348561555147171,
"step": 660,
"valid_targets_mean": 2913.9,
"valid_targets_min": 723
},
{
"epoch": 0.9023066485753053,
"grad_norm": 0.7353124573695241,
"learning_rate": 3.989980112545007e-05,
"loss": 0.315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3169977068901062,
"step": 665,
"valid_targets_mean": 2372.2,
"valid_targets_min": 893
},
{
"epoch": 0.9090909090909091,
"grad_norm": 0.6779717293015843,
"learning_rate": 3.989292271937332e-05,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3415604531764984,
"step": 670,
"valid_targets_mean": 3224.8,
"valid_targets_min": 1172
},
{
"epoch": 0.9158751696065129,
"grad_norm": 0.6802704573331115,
"learning_rate": 3.988581662507339e-05,
"loss": 0.3256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3390202820301056,
"step": 675,
"valid_targets_mean": 2996.1,
"valid_targets_min": 464
},
{
"epoch": 0.9226594301221167,
"grad_norm": 0.7137326701115103,
"learning_rate": 3.987848292388445e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3149383068084717,
"step": 680,
"valid_targets_mean": 2476.1,
"valid_targets_min": 770
},
{
"epoch": 0.9294436906377205,
"grad_norm": 0.7976853977114939,
"learning_rate": 3.987092169974576e-05,
"loss": 0.3385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34196972846984863,
"step": 685,
"valid_targets_mean": 2134.6,
"valid_targets_min": 722
},
{
"epoch": 0.9362279511533242,
"grad_norm": 0.7571960144185641,
"learning_rate": 3.986313303920074e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31737232208251953,
"step": 690,
"valid_targets_mean": 2642.4,
"valid_targets_min": 1254
},
{
"epoch": 0.9430122116689281,
"grad_norm": 0.7686352923550949,
"learning_rate": 3.985511703139599e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30339232087135315,
"step": 695,
"valid_targets_mean": 2095.3,
"valid_targets_min": 714
},
{
"epoch": 0.9497964721845319,
"grad_norm": 0.6986874211530488,
"learning_rate": 3.984687376808025e-05,
"loss": 0.3319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34129583835601807,
"step": 700,
"valid_targets_mean": 2803.9,
"valid_targets_min": 744
},
{
"epoch": 0.9565807327001357,
"grad_norm": 0.7610343107451978,
"learning_rate": 3.983840334360336e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33215272426605225,
"step": 705,
"valid_targets_mean": 2625.3,
"valid_targets_min": 1206
},
{
"epoch": 0.9633649932157394,
"grad_norm": 0.6276014942943633,
"learning_rate": 3.982970585491516e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128705620765686,
"step": 710,
"valid_targets_mean": 3215.4,
"valid_targets_min": 1391
},
{
"epoch": 0.9701492537313433,
"grad_norm": 0.6798894086802646,
"learning_rate": 3.982078140156441e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2989204525947571,
"step": 715,
"valid_targets_mean": 2666.4,
"valid_targets_min": 593
},
{
"epoch": 0.9769335142469471,
"grad_norm": 0.7410349510063327,
"learning_rate": 3.981163008569764e-05,
"loss": 0.3355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31131139397621155,
"step": 720,
"valid_targets_mean": 3063.8,
"valid_targets_min": 612
},
{
"epoch": 0.9837177747625508,
"grad_norm": 0.6643176359530586,
"learning_rate": 3.9802252012057974e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3558084964752197,
"step": 725,
"valid_targets_mean": 3521.2,
"valid_targets_min": 619
},
{
"epoch": 0.9905020352781547,
"grad_norm": 0.7267283614828455,
"learning_rate": 3.979264728798392e-05,
"loss": 0.3334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3494442105293274,
"step": 730,
"valid_targets_mean": 2547.4,
"valid_targets_min": 837
},
{
"epoch": 0.9972862957937585,
"grad_norm": 0.6814846127090516,
"learning_rate": 3.9782816023408194e-05,
"loss": 0.3327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3272936940193176,
"step": 735,
"valid_targets_mean": 2686.4,
"valid_targets_min": 960
},
{
"epoch": 1.0040705563093624,
"grad_norm": 0.6861216126300802,
"learning_rate": 3.977275833085638e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31268030405044556,
"step": 740,
"valid_targets_mean": 2643.2,
"valid_targets_min": 776
},
{
"epoch": 1.010854816824966,
"grad_norm": 0.6898996438799597,
"learning_rate": 3.976247432544571e-05,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911531925201416,
"step": 745,
"valid_targets_mean": 2797.4,
"valid_targets_min": 793
},
{
"epoch": 1.01763907734057,
"grad_norm": 0.8254261194413537,
"learning_rate": 3.9751964124883735e-05,
"loss": 0.3147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192952275276184,
"step": 750,
"valid_targets_mean": 2253.1,
"valid_targets_min": 692
},
{
"epoch": 1.0244233378561738,
"grad_norm": 0.7754318957680647,
"learning_rate": 3.974122784946694e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27857261896133423,
"step": 755,
"valid_targets_mean": 2432.6,
"valid_targets_min": 767
},
{
"epoch": 1.0312075983717774,
"grad_norm": 0.7881514631070836,
"learning_rate": 3.97302656220794e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320145845413208,
"step": 760,
"valid_targets_mean": 2445.4,
"valid_targets_min": 748
},
{
"epoch": 1.0379918588873813,
"grad_norm": 0.6506473704894072,
"learning_rate": 3.9719077568191376e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28449857234954834,
"step": 765,
"valid_targets_mean": 3023.9,
"valid_targets_min": 901
},
{
"epoch": 1.044776119402985,
"grad_norm": 0.8042677555990032,
"learning_rate": 3.970766381585786e-05,
"loss": 0.2826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26466116309165955,
"step": 770,
"valid_targets_mean": 2212.1,
"valid_targets_min": 820
},
{
"epoch": 1.0515603799185889,
"grad_norm": 0.676421887365203,
"learning_rate": 3.969602449571712e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29949331283569336,
"step": 775,
"valid_targets_mean": 3120.0,
"valid_targets_min": 652
},
{
"epoch": 1.0583446404341927,
"grad_norm": 0.7474747697048539,
"learning_rate": 3.96841597409892e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30292749404907227,
"step": 780,
"valid_targets_mean": 2577.1,
"valid_targets_min": 844
},
{
"epoch": 1.0651289009497964,
"grad_norm": 0.7960660690648608,
"learning_rate": 3.9672069687474415e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28914356231689453,
"step": 785,
"valid_targets_mean": 2216.7,
"valid_targets_min": 656
},
{
"epoch": 1.0719131614654003,
"grad_norm": 0.6763388576498762,
"learning_rate": 3.965975447355176e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30142050981521606,
"step": 790,
"valid_targets_mean": 2811.3,
"valid_targets_min": 1151
},
{
"epoch": 1.0786974219810042,
"grad_norm": 0.8330584303910075,
"learning_rate": 3.964721424017735e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.303778737783432,
"step": 795,
"valid_targets_mean": 2451.8,
"valid_targets_min": 521
},
{
"epoch": 1.0854816824966078,
"grad_norm": 0.7262140518757996,
"learning_rate": 3.963444913088281e-05,
"loss": 0.2993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3419913649559021,
"step": 800,
"valid_targets_mean": 3062.5,
"valid_targets_min": 678
},
{
"epoch": 1.0922659430122117,
"grad_norm": 0.701846588477317,
"learning_rate": 3.9621459291773626e-05,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3039608597755432,
"step": 805,
"valid_targets_mean": 2721.3,
"valid_targets_min": 649
},
{
"epoch": 1.0990502035278156,
"grad_norm": 0.764825483304104,
"learning_rate": 3.960824487152746e-05,
"loss": 0.3129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3330846428871155,
"step": 810,
"valid_targets_mean": 2494.1,
"valid_targets_min": 704
},
{
"epoch": 1.1058344640434192,
"grad_norm": 0.8702738985222226,
"learning_rate": 3.959480602139247e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2918407917022705,
"step": 815,
"valid_targets_mean": 2434.2,
"valid_targets_min": 759
},
{
"epoch": 1.112618724559023,
"grad_norm": 0.6076347441974812,
"learning_rate": 3.958114289518557e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2711153030395508,
"step": 820,
"valid_targets_mean": 3189.2,
"valid_targets_min": 809
},
{
"epoch": 1.1194029850746268,
"grad_norm": 0.6404883109837152,
"learning_rate": 3.956725564929066e-05,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2949562072753906,
"step": 825,
"valid_targets_mean": 3202.6,
"valid_targets_min": 1170
},
{
"epoch": 1.1261872455902306,
"grad_norm": 0.6942618107302919,
"learning_rate": 3.955314444265685e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29515475034713745,
"step": 830,
"valid_targets_mean": 2622.8,
"valid_targets_min": 753
},
{
"epoch": 1.1329715061058345,
"grad_norm": 0.7378195219174956,
"learning_rate": 3.9538809436796635e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31367671489715576,
"step": 835,
"valid_targets_mean": 2731.7,
"valid_targets_min": 1299
},
{
"epoch": 1.1397557666214382,
"grad_norm": 0.7537202284076141,
"learning_rate": 3.952425079578405e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3013504147529602,
"step": 840,
"valid_targets_mean": 2165.1,
"valid_targets_min": 675
},
{
"epoch": 1.146540027137042,
"grad_norm": 0.7523754539948808,
"learning_rate": 3.9509468686252776e-05,
"loss": 0.3017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2941988706588745,
"step": 845,
"valid_targets_mean": 2384.8,
"valid_targets_min": 835
},
{
"epoch": 1.153324287652646,
"grad_norm": 0.5769173901162691,
"learning_rate": 3.9494463277394256e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2812822461128235,
"step": 850,
"valid_targets_mean": 3832.6,
"valid_targets_min": 944
},
{
"epoch": 1.1601085481682496,
"grad_norm": 0.6902875767301633,
"learning_rate": 3.947923474095575e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2795878052711487,
"step": 855,
"valid_targets_mean": 2588.9,
"valid_targets_min": 937
},
{
"epoch": 1.1668928086838535,
"grad_norm": 0.6932765985873842,
"learning_rate": 3.946378325123836e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29586702585220337,
"step": 860,
"valid_targets_mean": 2557.6,
"valid_targets_min": 1059
},
{
"epoch": 1.1736770691994574,
"grad_norm": 0.8142184847264059,
"learning_rate": 3.9448108985095036e-05,
"loss": 0.3229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3577713966369629,
"step": 865,
"valid_targets_mean": 2609.6,
"valid_targets_min": 1031
},
{
"epoch": 1.180461329715061,
"grad_norm": 0.6535181326922942,
"learning_rate": 3.943221212192859e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3148359954357147,
"step": 870,
"valid_targets_mean": 3229.5,
"valid_targets_min": 1220
},
{
"epoch": 1.187245590230665,
"grad_norm": 0.6505841244224432,
"learning_rate": 3.941609284368956e-05,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2802058458328247,
"step": 875,
"valid_targets_mean": 3026.5,
"valid_targets_min": 858
},
{
"epoch": 1.1940298507462686,
"grad_norm": 0.6960891267075039,
"learning_rate": 3.939975133487422e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3029175400733948,
"step": 880,
"valid_targets_mean": 2756.3,
"valid_targets_min": 611
},
{
"epoch": 1.2008141112618724,
"grad_norm": 0.6800823657754136,
"learning_rate": 3.938318778252241e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29470711946487427,
"step": 885,
"valid_targets_mean": 3122.9,
"valid_targets_min": 1028
},
{
"epoch": 1.2075983717774763,
"grad_norm": 0.7814295994587976,
"learning_rate": 3.9366402376215405e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31138426065444946,
"step": 890,
"valid_targets_mean": 2320.1,
"valid_targets_min": 714
},
{
"epoch": 1.21438263229308,
"grad_norm": 0.7335457886775086,
"learning_rate": 3.934939530807376e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2950824797153473,
"step": 895,
"valid_targets_mean": 2272.6,
"valid_targets_min": 623
},
{
"epoch": 1.2211668928086838,
"grad_norm": 0.7406055989848646,
"learning_rate": 3.933216677275512e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30795565247535706,
"step": 900,
"valid_targets_mean": 2708.2,
"valid_targets_min": 618
},
{
"epoch": 1.2279511533242877,
"grad_norm": 0.7271310816643761,
"learning_rate": 3.931471696745194e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3034670650959015,
"step": 905,
"valid_targets_mean": 2719.8,
"valid_targets_min": 1144
},
{
"epoch": 1.2347354138398914,
"grad_norm": 0.6098483261250427,
"learning_rate": 3.929704609188927e-05,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30650919675827026,
"step": 910,
"valid_targets_mean": 3541.2,
"valid_targets_min": 837
},
{
"epoch": 1.2415196743554953,
"grad_norm": 0.6695184378675495,
"learning_rate": 3.9279154348322495e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29480671882629395,
"step": 915,
"valid_targets_mean": 2631.8,
"valid_targets_min": 627
},
{
"epoch": 1.2483039348710991,
"grad_norm": 0.6364092125880288,
"learning_rate": 3.926104194153495e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2782565951347351,
"step": 920,
"valid_targets_mean": 2974.1,
"valid_targets_min": 881
},
{
"epoch": 1.2550881953867028,
"grad_norm": 0.8301944651771248,
"learning_rate": 3.924270907883562e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2791467607021332,
"step": 925,
"valid_targets_mean": 2883.7,
"valid_targets_min": 703
},
{
"epoch": 1.2618724559023067,
"grad_norm": 0.8022627958583087,
"learning_rate": 3.922415597005677e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.281793475151062,
"step": 930,
"valid_targets_mean": 1910.9,
"valid_targets_min": 643
},
{
"epoch": 1.2686567164179103,
"grad_norm": 0.6363883403354091,
"learning_rate": 3.920538282755153e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2905217707157135,
"step": 935,
"valid_targets_mean": 3314.0,
"valid_targets_min": 1133
},
{
"epoch": 1.2754409769335142,
"grad_norm": 0.637738645846229,
"learning_rate": 3.918638986619146e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2899988889694214,
"step": 940,
"valid_targets_mean": 3262.2,
"valid_targets_min": 807
},
{
"epoch": 1.282225237449118,
"grad_norm": 0.6487116870961588,
"learning_rate": 3.9167177303364115e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3026847243309021,
"step": 945,
"valid_targets_mean": 3640.3,
"valid_targets_min": 1299
},
{
"epoch": 1.289009497964722,
"grad_norm": 0.7490100317858217,
"learning_rate": 3.9147745358970524e-05,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28088971972465515,
"step": 950,
"valid_targets_mean": 2377.6,
"valid_targets_min": 909
},
{
"epoch": 1.2957937584803256,
"grad_norm": 0.7137946081945997,
"learning_rate": 3.9128094255422696e-05,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2796930968761444,
"step": 955,
"valid_targets_mean": 2555.9,
"valid_targets_min": 631
},
{
"epoch": 1.3025780189959295,
"grad_norm": 0.5993098074500324,
"learning_rate": 3.910822421764106e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2874249219894409,
"step": 960,
"valid_targets_mean": 3206.5,
"valid_targets_min": 1560
},
{
"epoch": 1.3093622795115332,
"grad_norm": 0.9231815200437856,
"learning_rate": 3.9088135473051914e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33113178610801697,
"step": 965,
"valid_targets_mean": 2220.5,
"valid_targets_min": 484
},
{
"epoch": 1.316146540027137,
"grad_norm": 0.6697716973175908,
"learning_rate": 3.906782825158479e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.285530149936676,
"step": 970,
"valid_targets_mean": 2935.3,
"valid_targets_min": 1225
},
{
"epoch": 1.322930800542741,
"grad_norm": 0.7281815877744984,
"learning_rate": 3.904730278566986e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3005235493183136,
"step": 975,
"valid_targets_mean": 2603.3,
"valid_targets_min": 768
},
{
"epoch": 1.3297150610583446,
"grad_norm": 0.748646343253343,
"learning_rate": 3.9026559310235234e-05,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2904489040374756,
"step": 980,
"valid_targets_mean": 2551.4,
"valid_targets_min": 1193
},
{
"epoch": 1.3364993215739485,
"grad_norm": 0.6174464137752114,
"learning_rate": 3.900559806270429e-05,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24410629272460938,
"step": 985,
"valid_targets_mean": 2941.9,
"valid_targets_min": 692
},
{
"epoch": 1.3432835820895521,
"grad_norm": 0.7452637300432898,
"learning_rate": 3.898441928299297e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30062615871429443,
"step": 990,
"valid_targets_mean": 2270.9,
"valid_targets_min": 937
},
{
"epoch": 1.350067842605156,
"grad_norm": 0.6464889713515524,
"learning_rate": 3.896302321350702e-05,
"loss": 0.313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2945151925086975,
"step": 995,
"valid_targets_mean": 3044.5,
"valid_targets_min": 1167
},
{
"epoch": 1.3568521031207599,
"grad_norm": 0.7017509437824359,
"learning_rate": 3.894141009913921e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29814016819000244,
"step": 1000,
"valid_targets_mean": 2468.2,
"valid_targets_min": 530
},
{
"epoch": 1.3636363636363638,
"grad_norm": 0.6780559700998617,
"learning_rate": 3.891958018726655e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28629612922668457,
"step": 1005,
"valid_targets_mean": 2853.8,
"valid_targets_min": 807
},
{
"epoch": 1.3704206241519674,
"grad_norm": 0.8191037771052176,
"learning_rate": 3.8897533727747434e-05,
"loss": 0.2924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3040386438369751,
"step": 1010,
"valid_targets_mean": 2648.5,
"valid_targets_min": 740
},
{
"epoch": 1.3772048846675713,
"grad_norm": 0.668502617185383,
"learning_rate": 3.88752709729188e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31058913469314575,
"step": 1015,
"valid_targets_mean": 3066.1,
"valid_targets_min": 1388
},
{
"epoch": 1.383989145183175,
"grad_norm": 0.7094563085559425,
"learning_rate": 3.885279217759324e-05,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27286526560783386,
"step": 1020,
"valid_targets_mean": 2670.2,
"valid_targets_min": 698
},
{
"epoch": 1.3907734056987788,
"grad_norm": 0.6912293288922038,
"learning_rate": 3.883009759905607e-05,
"loss": 0.2901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29000505805015564,
"step": 1025,
"valid_targets_mean": 3009.6,
"valid_targets_min": 635
},
{
"epoch": 1.3975576662143827,
"grad_norm": 0.598939732528779,
"learning_rate": 3.8807187497062394e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27007484436035156,
"step": 1030,
"valid_targets_mean": 3264.9,
"valid_targets_min": 637
},
{
"epoch": 1.4043419267299864,
"grad_norm": 0.6399031295655998,
"learning_rate": 3.8784062133834136e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30463242530822754,
"step": 1035,
"valid_targets_mean": 2838.9,
"valid_targets_min": 957
},
{
"epoch": 1.4111261872455902,
"grad_norm": 0.6746984691711082,
"learning_rate": 3.876072177405703e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3121001720428467,
"step": 1040,
"valid_targets_mean": 2916.5,
"valid_targets_min": 956
},
{
"epoch": 1.417910447761194,
"grad_norm": 0.7284630600724608,
"learning_rate": 3.8737166684877596e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644261121749878,
"step": 1045,
"valid_targets_mean": 2068.2,
"valid_targets_min": 671
},
{
"epoch": 1.4246947082767978,
"grad_norm": 0.6562294087271845,
"learning_rate": 3.871339713590007e-05,
"loss": 0.2954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642728388309479,
"step": 1050,
"valid_targets_mean": 2884.8,
"valid_targets_min": 920
},
{
"epoch": 1.4314789687924017,
"grad_norm": 0.6478250945987496,
"learning_rate": 3.868941339918335e-05,
"loss": 0.2929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32172685861587524,
"step": 1055,
"valid_targets_mean": 3082.5,
"valid_targets_min": 1197
},
{
"epoch": 1.4382632293080055,
"grad_norm": 0.644202603849787,
"learning_rate": 3.866521574923784e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31228554248809814,
"step": 1060,
"valid_targets_mean": 3175.8,
"valid_targets_min": 1451
},
{
"epoch": 1.4450474898236092,
"grad_norm": 0.661879013668605,
"learning_rate": 3.864080446302234e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3252270519733429,
"step": 1065,
"valid_targets_mean": 3194.7,
"valid_targets_min": 711
},
{
"epoch": 1.451831750339213,
"grad_norm": 0.6549935813841651,
"learning_rate": 3.8616179819940857e-05,
"loss": 0.3017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28648945689201355,
"step": 1070,
"valid_targets_mean": 2721.0,
"valid_targets_min": 1331
},
{
"epoch": 1.4586160108548167,
"grad_norm": 0.6531723880805292,
"learning_rate": 3.859134210183941e-05,
"loss": 0.3165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31207776069641113,
"step": 1075,
"valid_targets_mean": 2777.7,
"valid_targets_min": 676
},
{
"epoch": 1.4654002713704206,
"grad_norm": 0.6716764880355328,
"learning_rate": 3.856629159300283e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32089391350746155,
"step": 1080,
"valid_targets_mean": 3052.2,
"valid_targets_min": 690
},
{
"epoch": 1.4721845318860245,
"grad_norm": 0.6655307018039186,
"learning_rate": 3.8541028580151465e-05,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26921534538269043,
"step": 1085,
"valid_targets_mean": 2680.0,
"valid_targets_min": 889
},
{
"epoch": 1.4789687924016282,
"grad_norm": 0.7389639492671433,
"learning_rate": 3.8515553352437927e-05,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28306636214256287,
"step": 1090,
"valid_targets_mean": 2348.4,
"valid_targets_min": 737
},
{
"epoch": 1.485753052917232,
"grad_norm": 0.6679028777069137,
"learning_rate": 3.848986620144376e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26913198828697205,
"step": 1095,
"valid_targets_mean": 2657.7,
"valid_targets_min": 1243
},
{
"epoch": 1.4925373134328357,
"grad_norm": 0.6297786728759884,
"learning_rate": 3.846396742117614e-05,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31999313831329346,
"step": 1100,
"valid_targets_mean": 3368.2,
"valid_targets_min": 1524
},
{
"epoch": 1.4993215739484396,
"grad_norm": 0.6149463581344302,
"learning_rate": 3.843785730806447e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29018402099609375,
"step": 1105,
"valid_targets_mean": 3319.4,
"valid_targets_min": 1354
},
{
"epoch": 1.5061058344640434,
"grad_norm": 0.809702645817836,
"learning_rate": 3.8411536160957004e-05,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29155030846595764,
"step": 1110,
"valid_targets_mean": 2079.1,
"valid_targets_min": 939
},
{
"epoch": 1.5128900949796473,
"grad_norm": 0.6375577416325251,
"learning_rate": 3.8385004281117425e-05,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26376283168792725,
"step": 1115,
"valid_targets_mean": 3094.1,
"valid_targets_min": 951
},
{
"epoch": 1.519674355495251,
"grad_norm": 0.7117061338880089,
"learning_rate": 3.83582619722214e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32851043343544006,
"step": 1120,
"valid_targets_mean": 2709.3,
"valid_targets_min": 1321
},
{
"epoch": 1.5264586160108549,
"grad_norm": 0.7195810818077915,
"learning_rate": 3.833130954035311e-05,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29876279830932617,
"step": 1125,
"valid_targets_mean": 2322.1,
"valid_targets_min": 728
},
{
"epoch": 1.5332428765264585,
"grad_norm": 0.6893087648021691,
"learning_rate": 3.830414729400172e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32284027338027954,
"step": 1130,
"valid_targets_mean": 2666.9,
"valid_targets_min": 882
},
{
"epoch": 1.5400271370420624,
"grad_norm": 0.6375253452820985,
"learning_rate": 3.8276775544057886e-05,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2919315695762634,
"step": 1135,
"valid_targets_mean": 3260.2,
"valid_targets_min": 754
},
{
"epoch": 1.5468113975576663,
"grad_norm": 0.7850898957886953,
"learning_rate": 3.824919460381016e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2958727180957794,
"step": 1140,
"valid_targets_mean": 3326.9,
"valid_targets_min": 1021
},
{
"epoch": 1.5535956580732702,
"grad_norm": 0.6951131898750251,
"learning_rate": 3.822140478894143e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3108687102794647,
"step": 1145,
"valid_targets_mean": 2787.1,
"valid_targets_min": 842
},
{
"epoch": 1.5603799185888738,
"grad_norm": 0.733903133533046,
"learning_rate": 3.8193406417525304e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3235079050064087,
"step": 1150,
"valid_targets_mean": 2633.2,
"valid_targets_min": 1181
},
{
"epoch": 1.5671641791044775,
"grad_norm": 0.731200133367719,
"learning_rate": 3.816519981002245e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2996997535228729,
"step": 1155,
"valid_targets_mean": 2690.8,
"valid_targets_min": 1251
},
{
"epoch": 1.5739484396200814,
"grad_norm": 0.6385315926667753,
"learning_rate": 3.8136785289276953e-05,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27406877279281616,
"step": 1160,
"valid_targets_mean": 3035.6,
"valid_targets_min": 1429
},
{
"epoch": 1.5807327001356852,
"grad_norm": 0.7362793886550267,
"learning_rate": 3.81081631805126e-05,
"loss": 0.2901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34110113978385925,
"step": 1165,
"valid_targets_mean": 2940.3,
"valid_targets_min": 805
},
{
"epoch": 1.587516960651289,
"grad_norm": 0.7349732590117125,
"learning_rate": 3.807933381132917e-05,
"loss": 0.3104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2936994135379791,
"step": 1170,
"valid_targets_mean": 2527.9,
"valid_targets_min": 746
},
{
"epoch": 1.5943012211668928,
"grad_norm": 0.7064877699762256,
"learning_rate": 3.805029751169869e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29555004835128784,
"step": 1175,
"valid_targets_mean": 2654.1,
"valid_targets_min": 650
},
{
"epoch": 1.6010854816824966,
"grad_norm": 0.6447256804044132,
"learning_rate": 3.802105461396163e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31151026487350464,
"step": 1180,
"valid_targets_mean": 2946.4,
"valid_targets_min": 738
},
{
"epoch": 1.6078697421981003,
"grad_norm": 0.5108082252163869,
"learning_rate": 3.799160545282312e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2245091050863266,
"step": 1185,
"valid_targets_mean": 3714.3,
"valid_targets_min": 846
},
{
"epoch": 1.6146540027137042,
"grad_norm": 0.6878930154133356,
"learning_rate": 3.796195036534914e-05,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2854118049144745,
"step": 1190,
"valid_targets_mean": 2541.6,
"valid_targets_min": 772
},
{
"epoch": 1.621438263229308,
"grad_norm": 0.8006673353310524,
"learning_rate": 3.793208969096261e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28456225991249084,
"step": 1195,
"valid_targets_mean": 2468.4,
"valid_targets_min": 700
},
{
"epoch": 1.628222523744912,
"grad_norm": 0.7653832467394758,
"learning_rate": 3.790202377143956e-05,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31006136536598206,
"step": 1200,
"valid_targets_mean": 2955.1,
"valid_targets_min": 1195
},
{
"epoch": 1.6350067842605156,
"grad_norm": 0.7315864774837488,
"learning_rate": 3.7871752950905174e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3193378448486328,
"step": 1205,
"valid_targets_mean": 2490.4,
"valid_targets_min": 612
},
{
"epoch": 1.6417910447761193,
"grad_norm": 0.7643610632774577,
"learning_rate": 3.784127757582987e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3098391592502594,
"step": 1210,
"valid_targets_mean": 2237.9,
"valid_targets_min": 662
},
{
"epoch": 1.6485753052917231,
"grad_norm": 0.6008604291150627,
"learning_rate": 3.7810597995025336e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2691340446472168,
"step": 1215,
"valid_targets_mean": 2998.4,
"valid_targets_min": 685
},
{
"epoch": 1.655359565807327,
"grad_norm": 0.6364039836954427,
"learning_rate": 3.7779714559640555e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29183879494667053,
"step": 1220,
"valid_targets_mean": 3299.7,
"valid_targets_min": 768
},
{
"epoch": 1.662143826322931,
"grad_norm": 0.8360956147817608,
"learning_rate": 3.774862762315772e-05,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30887937545776367,
"step": 1225,
"valid_targets_mean": 2721.2,
"valid_targets_min": 467
},
{
"epoch": 1.6689280868385346,
"grad_norm": 0.6028843978675598,
"learning_rate": 3.771733754138829e-05,
"loss": 0.2873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2811635732650757,
"step": 1230,
"valid_targets_mean": 3361.2,
"valid_targets_min": 839
},
{
"epoch": 1.6757123473541384,
"grad_norm": 0.7428753179701643,
"learning_rate": 3.768584467246883e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30133670568466187,
"step": 1235,
"valid_targets_mean": 3111.6,
"valid_targets_min": 683
},
{
"epoch": 1.682496607869742,
"grad_norm": 0.7569776252384394,
"learning_rate": 3.765414937685695e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3009093999862671,
"step": 1240,
"valid_targets_mean": 2188.5,
"valid_targets_min": 697
},
{
"epoch": 1.689280868385346,
"grad_norm": 0.5814940877820675,
"learning_rate": 3.762225201732715e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26204395294189453,
"step": 1245,
"valid_targets_mean": 3493.9,
"valid_targets_min": 800
},
{
"epoch": 1.6960651289009498,
"grad_norm": 0.726614967916978,
"learning_rate": 3.7590152958966745e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.321370929479599,
"step": 1250,
"valid_targets_mean": 2850.1,
"valid_targets_min": 715
},
{
"epoch": 1.7028493894165537,
"grad_norm": 0.7426123839264059,
"learning_rate": 3.7557852569171585e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2817172110080719,
"step": 1255,
"valid_targets_mean": 2224.9,
"valid_targets_min": 754
},
{
"epoch": 1.7096336499321574,
"grad_norm": 0.8799943306194825,
"learning_rate": 3.7525351217641915e-05,
"loss": 0.3085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3357008993625641,
"step": 1260,
"valid_targets_mean": 3111.0,
"valid_targets_min": 578
},
{
"epoch": 1.716417910447761,
"grad_norm": 0.6111490118620997,
"learning_rate": 3.7492649276378124e-05,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2888554632663727,
"step": 1265,
"valid_targets_mean": 3284.9,
"valid_targets_min": 1267
},
{
"epoch": 1.723202170963365,
"grad_norm": 0.6589094616205049,
"learning_rate": 3.7459747119676484e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30003267526626587,
"step": 1270,
"valid_targets_mean": 2895.2,
"valid_targets_min": 1178
},
{
"epoch": 1.7299864314789688,
"grad_norm": 0.640067102221961,
"learning_rate": 3.742664512412488e-05,
"loss": 0.3087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31731560826301575,
"step": 1275,
"valid_targets_mean": 3285.7,
"valid_targets_min": 1465
},
{
"epoch": 1.7367706919945727,
"grad_norm": 0.6939365904317435,
"learning_rate": 3.7393343668598495e-05,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2893563210964203,
"step": 1280,
"valid_targets_mean": 2671.6,
"valid_targets_min": 1204
},
{
"epoch": 1.7435549525101763,
"grad_norm": 0.6861699873490201,
"learning_rate": 3.735984313425544e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3145902156829834,
"step": 1285,
"valid_targets_mean": 2858.2,
"valid_targets_min": 1055
},
{
"epoch": 1.7503392130257802,
"grad_norm": 0.5893287065962871,
"learning_rate": 3.732614390453245e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2815445065498352,
"step": 1290,
"valid_targets_mean": 3251.5,
"valid_targets_min": 760
},
{
"epoch": 1.7571234735413839,
"grad_norm": 0.6605129026405406,
"learning_rate": 3.729224636514046e-05,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28478604555130005,
"step": 1295,
"valid_targets_mean": 2549.3,
"valid_targets_min": 961
},
{
"epoch": 1.7639077340569878,
"grad_norm": 0.7080612755113385,
"learning_rate": 3.7258150904060184e-05,
"loss": 0.2862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30780327320098877,
"step": 1300,
"valid_targets_mean": 2727.4,
"valid_targets_min": 1274
},
{
"epoch": 1.7706919945725916,
"grad_norm": 0.6157145299604274,
"learning_rate": 3.72238579115377e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31349170207977295,
"step": 1305,
"valid_targets_mean": 3526.4,
"valid_targets_min": 911
},
{
"epoch": 1.7774762550881955,
"grad_norm": 0.6628037819653686,
"learning_rate": 3.7189367780079956e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30656638741493225,
"step": 1310,
"valid_targets_mean": 2991.2,
"valid_targets_min": 815
},
{
"epoch": 1.7842605156037992,
"grad_norm": 0.7303577186056781,
"learning_rate": 3.7154680904450306e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25550299882888794,
"step": 1315,
"valid_targets_mean": 2137.6,
"valid_targets_min": 780
},
{
"epoch": 1.7910447761194028,
"grad_norm": 0.7432172204712651,
"learning_rate": 3.711979768166397e-05,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2851966619491577,
"step": 1320,
"valid_targets_mean": 2175.0,
"valid_targets_min": 782
},
{
"epoch": 1.7978290366350067,
"grad_norm": 0.6101418921075195,
"learning_rate": 3.708471851098349e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29730525612831116,
"step": 1325,
"valid_targets_mean": 3097.9,
"valid_targets_min": 819
},
{
"epoch": 1.8046132971506106,
"grad_norm": 0.6995136361312011,
"learning_rate": 3.704944379391418e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28219103813171387,
"step": 1330,
"valid_targets_mean": 2626.4,
"valid_targets_min": 963
},
{
"epoch": 1.8113975576662145,
"grad_norm": 0.7747003781816696,
"learning_rate": 3.70139739341995e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2927844226360321,
"step": 1335,
"valid_targets_mean": 2138.4,
"valid_targets_min": 1030
},
{
"epoch": 1.8181818181818183,
"grad_norm": 0.6296472975547316,
"learning_rate": 3.6978309337816475e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2978728413581848,
"step": 1340,
"valid_targets_mean": 2901.1,
"valid_targets_min": 1269
},
{
"epoch": 1.824966078697422,
"grad_norm": 0.6529444503372535,
"learning_rate": 3.6942450412971006e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2776811420917511,
"step": 1345,
"valid_targets_mean": 2990.2,
"valid_targets_min": 1290
},
{
"epoch": 1.8317503392130257,
"grad_norm": 0.6073872705332342,
"learning_rate": 3.690639757009322e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2847082316875458,
"step": 1350,
"valid_targets_mean": 3336.8,
"valid_targets_min": 1011
},
{
"epoch": 1.8385345997286295,
"grad_norm": 0.6726342078161094,
"learning_rate": 3.687015122183278e-05,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31284165382385254,
"step": 1355,
"valid_targets_mean": 3056.4,
"valid_targets_min": 878
},
{
"epoch": 1.8453188602442334,
"grad_norm": 0.6570381591584823,
"learning_rate": 3.6833711783054146e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27733927965164185,
"step": 1360,
"valid_targets_mean": 2751.9,
"valid_targets_min": 627
},
{
"epoch": 1.8521031207598373,
"grad_norm": 0.7873750592257918,
"learning_rate": 3.6797079670831835e-05,
"loss": 0.307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2843400537967682,
"step": 1365,
"valid_targets_mean": 2333.1,
"valid_targets_min": 1105
},
{
"epoch": 1.858887381275441,
"grad_norm": 0.6324090204988919,
"learning_rate": 3.676025530444563e-05,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2516278326511383,
"step": 1370,
"valid_targets_mean": 2830.2,
"valid_targets_min": 739
},
{
"epoch": 1.8656716417910446,
"grad_norm": 0.7359610094620258,
"learning_rate": 3.672323910537581e-05,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31318145990371704,
"step": 1375,
"valid_targets_mean": 2449.1,
"valid_targets_min": 627
},
{
"epoch": 1.8724559023066485,
"grad_norm": 0.6497309545854958,
"learning_rate": 3.668603149729832e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26779574155807495,
"step": 1380,
"valid_targets_mean": 2840.0,
"valid_targets_min": 1094
},
{
"epoch": 1.8792401628222524,
"grad_norm": 0.6267804873051095,
"learning_rate": 3.664863290607989e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28004786372184753,
"step": 1385,
"valid_targets_mean": 2897.0,
"valid_targets_min": 929
},
{
"epoch": 1.8860244233378562,
"grad_norm": 0.6879680447864663,
"learning_rate": 3.6611043759773195e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31352704763412476,
"step": 1390,
"valid_targets_mean": 2756.0,
"valid_targets_min": 928
},
{
"epoch": 1.8928086838534601,
"grad_norm": 0.6301096600514708,
"learning_rate": 3.6573264488611944e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3064451217651367,
"step": 1395,
"valid_targets_mean": 3032.6,
"valid_targets_min": 791
},
{
"epoch": 1.8995929443690638,
"grad_norm": 0.6958211841970261,
"learning_rate": 3.6535295525005964e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2943972647190094,
"step": 1400,
"valid_targets_mean": 2836.4,
"valid_targets_min": 648
},
{
"epoch": 1.9063772048846674,
"grad_norm": 0.7887387389485876,
"learning_rate": 3.649713730353623e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28154975175857544,
"step": 1405,
"valid_targets_mean": 2262.3,
"valid_targets_min": 916
},
{
"epoch": 1.9131614654002713,
"grad_norm": 1.5313410215337464,
"learning_rate": 3.645879026094991e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29764658212661743,
"step": 1410,
"valid_targets_mean": 2811.7,
"valid_targets_min": 821
},
{
"epoch": 1.9199457259158752,
"grad_norm": 0.7151356767653663,
"learning_rate": 3.642025483615536e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3090359568595886,
"step": 1415,
"valid_targets_mean": 2566.2,
"valid_targets_min": 659
},
{
"epoch": 1.926729986431479,
"grad_norm": 0.7117696747551553,
"learning_rate": 3.6381531470217095e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32978102564811707,
"step": 1420,
"valid_targets_mean": 2933.4,
"valid_targets_min": 1166
},
{
"epoch": 1.9335142469470827,
"grad_norm": 0.7645454065347908,
"learning_rate": 3.634262060635075e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31343501806259155,
"step": 1425,
"valid_targets_mean": 2486.8,
"valid_targets_min": 706
},
{
"epoch": 1.9402985074626866,
"grad_norm": 0.6774335342238738,
"learning_rate": 3.6303522689918015e-05,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2950223684310913,
"step": 1430,
"valid_targets_mean": 2928.6,
"valid_targets_min": 713
},
{
"epoch": 1.9470827679782903,
"grad_norm": 0.6640212258014019,
"learning_rate": 3.6264238168421505e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2745462656021118,
"step": 1435,
"valid_targets_mean": 2628.1,
"valid_targets_min": 1206
},
{
"epoch": 1.9538670284938942,
"grad_norm": 0.6832788009297351,
"learning_rate": 3.622476749149967e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2921183705329895,
"step": 1440,
"valid_targets_mean": 2838.4,
"valid_targets_min": 617
},
{
"epoch": 1.960651289009498,
"grad_norm": 1.02465763567763,
"learning_rate": 3.618511111092164e-05,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30975252389907837,
"step": 1445,
"valid_targets_mean": 2425.6,
"valid_targets_min": 1024
},
{
"epoch": 1.967435549525102,
"grad_norm": 0.853915586974603,
"learning_rate": 3.6145269480582035e-05,
"loss": 0.309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3293916583061218,
"step": 1450,
"valid_targets_mean": 3230.9,
"valid_targets_min": 1358
},
{
"epoch": 1.9742198100407056,
"grad_norm": 0.7500252855517454,
"learning_rate": 3.61052430564958e-05,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.285286545753479,
"step": 1455,
"valid_targets_mean": 1947.4,
"valid_targets_min": 848
},
{
"epoch": 1.9810040705563092,
"grad_norm": 0.6777810077646718,
"learning_rate": 3.606503229679299e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30354389548301697,
"step": 1460,
"valid_targets_mean": 2624.3,
"valid_targets_min": 1035
},
{
"epoch": 1.987788331071913,
"grad_norm": 0.7750533185261688,
"learning_rate": 3.6024637661713463e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2793115973472595,
"step": 1465,
"valid_targets_mean": 2612.2,
"valid_targets_min": 941
},
{
"epoch": 1.994572591587517,
"grad_norm": 0.7919665782855059,
"learning_rate": 3.59840596136017e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27840328216552734,
"step": 1470,
"valid_targets_mean": 2205.1,
"valid_targets_min": 992
},
{
"epoch": 2.001356852103121,
"grad_norm": 0.6677080223559784,
"learning_rate": 3.5943298616901434e-05,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252011239528656,
"step": 1475,
"valid_targets_mean": 3309.2,
"valid_targets_min": 1337
},
{
"epoch": 2.0081411126187247,
"grad_norm": 0.7207007939374871,
"learning_rate": 3.590235513815041e-05,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2334105670452118,
"step": 1480,
"valid_targets_mean": 2218.1,
"valid_targets_min": 739
},
{
"epoch": 2.014925373134328,
"grad_norm": 0.7632243131847694,
"learning_rate": 3.586122964597499e-05,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2754613161087036,
"step": 1485,
"valid_targets_mean": 2588.3,
"valid_targets_min": 678
},
{
"epoch": 2.021709633649932,
"grad_norm": 0.7149262249272994,
"learning_rate": 3.581992261108478e-05,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22789128124713898,
"step": 1490,
"valid_targets_mean": 2391.2,
"valid_targets_min": 791
},
{
"epoch": 2.028493894165536,
"grad_norm": 0.7021382513288259,
"learning_rate": 3.577843450626729e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2544996738433838,
"step": 1495,
"valid_targets_mean": 3086.4,
"valid_targets_min": 1196
},
{
"epoch": 2.03527815468114,
"grad_norm": 0.6740781431872369,
"learning_rate": 3.573676580638252e-05,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2830080986022949,
"step": 1500,
"valid_targets_mean": 3231.4,
"valid_targets_min": 820
},
{
"epoch": 2.0420624151967437,
"grad_norm": 0.6625091780634826,
"learning_rate": 3.569491698835747e-05,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644336223602295,
"step": 1505,
"valid_targets_mean": 3546.1,
"valid_targets_min": 790
},
{
"epoch": 2.0488466757123476,
"grad_norm": 0.772346491835651,
"learning_rate": 3.565288853118073e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25193676352500916,
"step": 1510,
"valid_targets_mean": 2011.5,
"valid_targets_min": 692
},
{
"epoch": 2.055630936227951,
"grad_norm": 0.7015358520017895,
"learning_rate": 3.561068091589699e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2524373531341553,
"step": 1515,
"valid_targets_mean": 2833.7,
"valid_targets_min": 1076
},
{
"epoch": 2.062415196743555,
"grad_norm": 0.6819591135273353,
"learning_rate": 3.556829462560152e-05,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2732108533382416,
"step": 1520,
"valid_targets_mean": 3037.2,
"valid_targets_min": 544
},
{
"epoch": 2.0691994572591588,
"grad_norm": 0.7308638462885366,
"learning_rate": 3.552573014543465e-05,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24330492317676544,
"step": 1525,
"valid_targets_mean": 2520.2,
"valid_targets_min": 965
},
{
"epoch": 2.0759837177747626,
"grad_norm": 0.7835094284328342,
"learning_rate": 3.548298796257623e-05,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2812742590904236,
"step": 1530,
"valid_targets_mean": 2378.4,
"valid_targets_min": 512
},
{
"epoch": 2.0827679782903665,
"grad_norm": 0.6968412144913585,
"learning_rate": 3.5440068566240006e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25412964820861816,
"step": 1535,
"valid_targets_mean": 2384.0,
"valid_targets_min": 972
},
{
"epoch": 2.08955223880597,
"grad_norm": 0.7616955455624203,
"learning_rate": 3.539697244766809e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29562467336654663,
"step": 1540,
"valid_targets_mean": 2267.1,
"valid_targets_min": 777
},
{
"epoch": 2.096336499321574,
"grad_norm": 0.7131875884565378,
"learning_rate": 3.5353700100125285e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2696763873100281,
"step": 1545,
"valid_targets_mean": 2582.3,
"valid_targets_min": 909
},
{
"epoch": 2.1031207598371777,
"grad_norm": 0.7768997711520144,
"learning_rate": 3.531025201889346e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27121901512145996,
"step": 1550,
"valid_targets_mean": 2734.2,
"valid_targets_min": 684
},
{
"epoch": 2.1099050203527816,
"grad_norm": 0.5972671434746235,
"learning_rate": 3.526662870126588e-05,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21913185715675354,
"step": 1555,
"valid_targets_mean": 3436.5,
"valid_targets_min": 880
},
{
"epoch": 2.1166892808683855,
"grad_norm": 0.8928905338020054,
"learning_rate": 3.5222830646541495e-05,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2423502504825592,
"step": 1560,
"valid_targets_mean": 3034.4,
"valid_targets_min": 1466
},
{
"epoch": 2.123473541383989,
"grad_norm": 0.7792302275809843,
"learning_rate": 3.517885835601927e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23429229855537415,
"step": 1565,
"valid_targets_mean": 2170.3,
"valid_targets_min": 656
},
{
"epoch": 2.130257801899593,
"grad_norm": 0.6637166367797426,
"learning_rate": 3.5134712332992396e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2654414474964142,
"step": 1570,
"valid_targets_mean": 3309.1,
"valid_targets_min": 783
},
{
"epoch": 2.1370420624151967,
"grad_norm": 0.7708919189354086,
"learning_rate": 3.5090393082742555e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26184701919555664,
"step": 1575,
"valid_targets_mean": 2298.2,
"valid_targets_min": 737
},
{
"epoch": 2.1438263229308006,
"grad_norm": 0.7215973806908841,
"learning_rate": 3.504590111253414e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27381983399391174,
"step": 1580,
"valid_targets_mean": 2703.3,
"valid_targets_min": 1289
},
{
"epoch": 2.1506105834464044,
"grad_norm": 0.8043249601230251,
"learning_rate": 3.5001236931608446e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2702006995677948,
"step": 1585,
"valid_targets_mean": 2177.4,
"valid_targets_min": 793
},
{
"epoch": 2.1573948439620083,
"grad_norm": 0.6914069724407004,
"learning_rate": 3.495640105117784e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27623242139816284,
"step": 1590,
"valid_targets_mean": 2991.8,
"valid_targets_min": 1354
},
{
"epoch": 2.1641791044776117,
"grad_norm": 0.8082050307344478,
"learning_rate": 3.491139398441989e-05,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2768654525279999,
"step": 1595,
"valid_targets_mean": 2209.0,
"valid_targets_min": 740
},
{
"epoch": 2.1709633649932156,
"grad_norm": 0.7574042859615202,
"learning_rate": 3.4866216246471536e-05,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28827136754989624,
"step": 1600,
"valid_targets_mean": 2482.6,
"valid_targets_min": 746
},
{
"epoch": 2.1777476255088195,
"grad_norm": 0.6561439016270234,
"learning_rate": 3.482086835442313e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2732161581516266,
"step": 1605,
"valid_targets_mean": 3250.7,
"valid_targets_min": 819
},
{
"epoch": 2.1845318860244234,
"grad_norm": 0.6444399840162086,
"learning_rate": 3.47753508273126e-05,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27326977252960205,
"step": 1610,
"valid_targets_mean": 2993.8,
"valid_targets_min": 997
},
{
"epoch": 2.1913161465400273,
"grad_norm": 0.6624015010390857,
"learning_rate": 3.472966418611944e-05,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2766575217247009,
"step": 1615,
"valid_targets_mean": 3185.8,
"valid_targets_min": 728
},
{
"epoch": 2.198100407055631,
"grad_norm": 0.6436526455011548,
"learning_rate": 3.468380895375876e-05,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2507815957069397,
"step": 1620,
"valid_targets_mean": 3060.2,
"valid_targets_min": 933
},
{
"epoch": 2.2048846675712346,
"grad_norm": 0.6752004219899516,
"learning_rate": 3.463778565507536e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24225379526615143,
"step": 1625,
"valid_targets_mean": 2709.7,
"valid_targets_min": 758
},
{
"epoch": 2.2116689280868385,
"grad_norm": 0.6096818559003151,
"learning_rate": 3.45915948168376e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24749873578548431,
"step": 1630,
"valid_targets_mean": 3076.5,
"valid_targets_min": 708
},
{
"epoch": 2.2184531886024423,
"grad_norm": 0.6382946984463229,
"learning_rate": 3.454523696773152e-05,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28292831778526306,
"step": 1635,
"valid_targets_mean": 3444.9,
"valid_targets_min": 661
},
{
"epoch": 2.225237449118046,
"grad_norm": 0.7180530567460727,
"learning_rate": 3.4498712638354646e-05,
"loss": 0.2605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2660506069660187,
"step": 1640,
"valid_targets_mean": 2654.6,
"valid_targets_min": 1015
},
{
"epoch": 2.23202170963365,
"grad_norm": 0.6477313971324171,
"learning_rate": 3.445202236121006e-05,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23461966216564178,
"step": 1645,
"valid_targets_mean": 2946.6,
"valid_targets_min": 876
},
{
"epoch": 2.2388059701492535,
"grad_norm": 0.758634223425707,
"learning_rate": 3.440516667070017e-05,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2572581470012665,
"step": 1650,
"valid_targets_mean": 2419.9,
"valid_targets_min": 799
},
{
"epoch": 2.2455902306648574,
"grad_norm": 0.7525020456973835,
"learning_rate": 3.435814610312068e-05,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2762409448623657,
"step": 1655,
"valid_targets_mean": 2593.2,
"valid_targets_min": 930
},
{
"epoch": 2.2523744911804613,
"grad_norm": 0.6900366742315267,
"learning_rate": 3.431096119665443e-05,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2573353052139282,
"step": 1660,
"valid_targets_mean": 2404.2,
"valid_targets_min": 832
},
{
"epoch": 2.259158751696065,
"grad_norm": 0.7966484389836349,
"learning_rate": 3.426361249136522e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2512604892253876,
"step": 1665,
"valid_targets_mean": 2740.3,
"valid_targets_min": 933
},
{
"epoch": 2.265943012211669,
"grad_norm": 0.6267399197635503,
"learning_rate": 3.421610052919163e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2536308467388153,
"step": 1670,
"valid_targets_mean": 2806.4,
"valid_targets_min": 666
},
{
"epoch": 2.2727272727272725,
"grad_norm": 0.710274498225842,
"learning_rate": 3.4168425853940865e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23908887803554535,
"step": 1675,
"valid_targets_mean": 2732.9,
"valid_targets_min": 803
},
{
"epoch": 2.2795115332428764,
"grad_norm": 0.6223626538847287,
"learning_rate": 3.412058901128245e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23127231001853943,
"step": 1680,
"valid_targets_mean": 2821.8,
"valid_targets_min": 1270
},
{
"epoch": 2.2862957937584802,
"grad_norm": 0.6294319468393673,
"learning_rate": 3.407259054874206e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2410857379436493,
"step": 1685,
"valid_targets_mean": 2965.4,
"valid_targets_min": 734
},
{
"epoch": 2.293080054274084,
"grad_norm": 0.8008654337703052,
"learning_rate": 3.402443101569521e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26027989387512207,
"step": 1690,
"valid_targets_mean": 2395.8,
"valid_targets_min": 881
},
{
"epoch": 2.299864314789688,
"grad_norm": 0.7218010335927416,
"learning_rate": 3.397611096336097e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3087459206581116,
"step": 1695,
"valid_targets_mean": 2789.3,
"valid_targets_min": 820
},
{
"epoch": 2.306648575305292,
"grad_norm": 0.7847076898478889,
"learning_rate": 3.392763094479568e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26217982172966003,
"step": 1700,
"valid_targets_mean": 2132.0,
"valid_targets_min": 722
},
{
"epoch": 2.3134328358208958,
"grad_norm": 0.7515258396714922,
"learning_rate": 3.387899151488659e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2646181583404541,
"step": 1705,
"valid_targets_mean": 2402.3,
"valid_targets_min": 627
},
{
"epoch": 2.320217096336499,
"grad_norm": 0.6310084529124328,
"learning_rate": 3.383019323034552e-05,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26773834228515625,
"step": 1710,
"valid_targets_mean": 3745.5,
"valid_targets_min": 1312
},
{
"epoch": 2.327001356852103,
"grad_norm": 0.6476866135246807,
"learning_rate": 3.378123664970252e-05,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23596899211406708,
"step": 1715,
"valid_targets_mean": 2782.4,
"valid_targets_min": 1037
},
{
"epoch": 2.333785617367707,
"grad_norm": 0.6635878932623026,
"learning_rate": 3.373212233329941e-05,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2669086158275604,
"step": 1720,
"valid_targets_mean": 2656.4,
"valid_targets_min": 656
},
{
"epoch": 2.340569877883311,
"grad_norm": 0.8372787858249849,
"learning_rate": 3.368285084328343e-05,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27093416452407837,
"step": 1725,
"valid_targets_mean": 2007.2,
"valid_targets_min": 788
},
{
"epoch": 2.3473541383989147,
"grad_norm": 0.7084081316996159,
"learning_rate": 3.363342274360076e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27293896675109863,
"step": 1730,
"valid_targets_mean": 2628.9,
"valid_targets_min": 670
},
{
"epoch": 2.354138398914518,
"grad_norm": 0.7361649736055962,
"learning_rate": 3.358383859999011e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24949458241462708,
"step": 1735,
"valid_targets_mean": 2166.1,
"valid_targets_min": 682
},
{
"epoch": 2.360922659430122,
"grad_norm": 0.6601077278545686,
"learning_rate": 3.353409897997621e-05,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252005398273468,
"step": 1740,
"valid_targets_mean": 2885.6,
"valid_targets_min": 953
},
{
"epoch": 2.367706919945726,
"grad_norm": 0.7833459948759297,
"learning_rate": 3.348420445286331e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25346460938453674,
"step": 1745,
"valid_targets_mean": 2880.2,
"valid_targets_min": 635
},
{
"epoch": 2.37449118046133,
"grad_norm": 0.6917728614350838,
"learning_rate": 3.3434155589728695e-05,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21869820356369019,
"step": 1750,
"valid_targets_mean": 2367.4,
"valid_targets_min": 859
},
{
"epoch": 2.3812754409769337,
"grad_norm": 0.6338539881836546,
"learning_rate": 3.338395296341614e-05,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2602981925010681,
"step": 1755,
"valid_targets_mean": 3345.6,
"valid_targets_min": 1233
},
{
"epoch": 2.388059701492537,
"grad_norm": 0.6645949196725213,
"learning_rate": 3.333359714852932e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2770848870277405,
"step": 1760,
"valid_targets_mean": 2870.8,
"valid_targets_min": 699
},
{
"epoch": 2.394843962008141,
"grad_norm": 0.6971754384837836,
"learning_rate": 3.328308872142528e-05,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24311913549900055,
"step": 1765,
"valid_targets_mean": 2503.1,
"valid_targets_min": 1021
},
{
"epoch": 2.401628222523745,
"grad_norm": 0.6356007444165893,
"learning_rate": 3.3232428260207804e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26365482807159424,
"step": 1770,
"valid_targets_mean": 3150.6,
"valid_targets_min": 1107
},
{
"epoch": 2.4084124830393487,
"grad_norm": 0.7060984927170915,
"learning_rate": 3.318161634472083e-05,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27592113614082336,
"step": 1775,
"valid_targets_mean": 2829.7,
"valid_targets_min": 992
},
{
"epoch": 2.4151967435549526,
"grad_norm": 0.6510612732829962,
"learning_rate": 3.3130653556541774e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24161876738071442,
"step": 1780,
"valid_targets_mean": 3045.9,
"valid_targets_min": 746
},
{
"epoch": 2.4219810040705565,
"grad_norm": 0.6847258251540859,
"learning_rate": 3.30795404789749e-05,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27078160643577576,
"step": 1785,
"valid_targets_mean": 3208.2,
"valid_targets_min": 759
},
{
"epoch": 2.42876526458616,
"grad_norm": 0.7808291039965765,
"learning_rate": 3.302827769704464e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25728699564933777,
"step": 1790,
"valid_targets_mean": 2815.0,
"valid_targets_min": 1277
},
{
"epoch": 2.435549525101764,
"grad_norm": 0.7272148707674393,
"learning_rate": 3.29768657974889e-05,
"loss": 0.25,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.258420467376709,
"step": 1795,
"valid_targets_mean": 2726.6,
"valid_targets_min": 720
},
{
"epoch": 2.4423337856173677,
"grad_norm": 0.7459339825138199,
"learning_rate": 3.2925305368752346e-05,
"loss": 0.2616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28670960664749146,
"step": 1800,
"valid_targets_mean": 2654.2,
"valid_targets_min": 807
},
{
"epoch": 2.4491180461329716,
"grad_norm": 0.7287330807026949,
"learning_rate": 3.2873597000979626e-05,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25203102827072144,
"step": 1805,
"valid_targets_mean": 3238.3,
"valid_targets_min": 1310
},
{
"epoch": 2.4559023066485755,
"grad_norm": 0.7104083422326701,
"learning_rate": 3.28217412860087e-05,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21682174503803253,
"step": 1810,
"valid_targets_mean": 3128.4,
"valid_targets_min": 640
},
{
"epoch": 2.4626865671641793,
"grad_norm": 0.6057916542411326,
"learning_rate": 3.276973881736399e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25353389978408813,
"step": 1815,
"valid_targets_mean": 3672.1,
"valid_targets_min": 1024
},
{
"epoch": 2.4694708276797828,
"grad_norm": 0.7923986851890575,
"learning_rate": 3.2717590190249617e-05,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22225558757781982,
"step": 1820,
"valid_targets_mean": 2796.2,
"valid_targets_min": 750
},
{
"epoch": 2.4762550881953866,
"grad_norm": 0.6652659164621177,
"learning_rate": 3.2665296001542606e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28310340642929077,
"step": 1825,
"valid_targets_mean": 3224.8,
"valid_targets_min": 916
},
{
"epoch": 2.4830393487109905,
"grad_norm": 0.7654192310941611,
"learning_rate": 3.261285684978601e-05,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2906759977340698,
"step": 1830,
"valid_targets_mean": 2817.2,
"valid_targets_min": 867
},
{
"epoch": 2.4898236092265944,
"grad_norm": 0.7118429223959195,
"learning_rate": 3.256027333518209e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2705893814563751,
"step": 1835,
"valid_targets_mean": 2739.5,
"valid_targets_min": 785
},
{
"epoch": 2.4966078697421983,
"grad_norm": 0.7194235047620599,
"learning_rate": 3.250754605958546e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2895210385322571,
"step": 1840,
"valid_targets_mean": 2776.8,
"valid_targets_min": 875
},
{
"epoch": 2.5033921302578017,
"grad_norm": 0.7159119323725041,
"learning_rate": 3.245467562649615e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22497795522212982,
"step": 1845,
"valid_targets_mean": 2419.1,
"valid_targets_min": 685
},
{
"epoch": 2.5101763907734056,
"grad_norm": 0.6776377638938433,
"learning_rate": 3.240166264105274e-05,
"loss": 0.257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2763141989707947,
"step": 1850,
"valid_targets_mean": 2846.4,
"valid_targets_min": 713
},
{
"epoch": 2.5169606512890095,
"grad_norm": 0.6865655138064035,
"learning_rate": 3.234850771002542e-05,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24978536367416382,
"step": 1855,
"valid_targets_mean": 2978.5,
"valid_targets_min": 968
},
{
"epoch": 2.5237449118046134,
"grad_norm": 0.6699601179099225,
"learning_rate": 3.2295211441809043e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25676673650741577,
"step": 1860,
"valid_targets_mean": 2917.8,
"valid_targets_min": 1075
},
{
"epoch": 2.5305291723202172,
"grad_norm": 0.6889764980124685,
"learning_rate": 3.224177444641616e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3100902736186981,
"step": 1865,
"valid_targets_mean": 2546.6,
"valid_targets_min": 912
},
{
"epoch": 2.5373134328358207,
"grad_norm": 0.6793757318097332,
"learning_rate": 3.218819733547006e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2357414960861206,
"step": 1870,
"valid_targets_mean": 2497.8,
"valid_targets_min": 772
},
{
"epoch": 2.5440976933514245,
"grad_norm": 0.8152453145431383,
"learning_rate": 3.2134480722197707e-05,
"loss": 0.262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29958784580230713,
"step": 1875,
"valid_targets_mean": 2523.8,
"valid_targets_min": 584
},
{
"epoch": 2.5508819538670284,
"grad_norm": 0.7495650389529989,
"learning_rate": 3.208062522142282e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2574930191040039,
"step": 1880,
"valid_targets_mean": 2723.4,
"valid_targets_min": 951
},
{
"epoch": 2.5576662143826323,
"grad_norm": 0.7714988898913233,
"learning_rate": 3.202663144955875e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2438960075378418,
"step": 1885,
"valid_targets_mean": 2427.2,
"valid_targets_min": 1263
},
{
"epoch": 2.564450474898236,
"grad_norm": 0.8149406397413984,
"learning_rate": 3.1972500024601475e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2427600771188736,
"step": 1890,
"valid_targets_mean": 2379.7,
"valid_targets_min": 648
},
{
"epoch": 2.5712347354138396,
"grad_norm": 0.835575869140074,
"learning_rate": 3.1918231566122467e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2951461672782898,
"step": 1895,
"valid_targets_mean": 2883.2,
"valid_targets_min": 691
},
{
"epoch": 2.578018995929444,
"grad_norm": 0.6480761129447208,
"learning_rate": 3.186382669526169e-05,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25713399052619934,
"step": 1900,
"valid_targets_mean": 3203.1,
"valid_targets_min": 1042
},
{
"epoch": 2.5848032564450474,
"grad_norm": 0.6296775116161838,
"learning_rate": 3.180928603472041e-05,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24473142623901367,
"step": 1905,
"valid_targets_mean": 3100.0,
"valid_targets_min": 683
},
{
"epoch": 2.5915875169606513,
"grad_norm": 0.6495398797854156,
"learning_rate": 3.175461020875412e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23860132694244385,
"step": 1910,
"valid_targets_mean": 3028.4,
"valid_targets_min": 1066
},
{
"epoch": 2.598371777476255,
"grad_norm": 0.6700738944682313,
"learning_rate": 3.1699799843165356e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2498638927936554,
"step": 1915,
"valid_targets_mean": 2918.0,
"valid_targets_min": 530
},
{
"epoch": 2.605156037991859,
"grad_norm": 0.6577566326274685,
"learning_rate": 3.164485556529657e-05,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25191181898117065,
"step": 1920,
"valid_targets_mean": 2755.8,
"valid_targets_min": 693
},
{
"epoch": 2.611940298507463,
"grad_norm": 0.6054859630469727,
"learning_rate": 3.158977800402292e-05,
"loss": 0.2537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2440011352300644,
"step": 1925,
"valid_targets_mean": 3179.1,
"valid_targets_min": 1141
},
{
"epoch": 2.6187245590230663,
"grad_norm": 0.6786451801971204,
"learning_rate": 3.1534567789745084e-05,
"loss": 0.2631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2818109095096588,
"step": 1930,
"valid_targets_mean": 2949.1,
"valid_targets_min": 999
},
{
"epoch": 2.62550881953867,
"grad_norm": 0.6942883497416937,
"learning_rate": 3.147922555438206e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24890519678592682,
"step": 1935,
"valid_targets_mean": 2585.8,
"valid_targets_min": 837
},
{
"epoch": 2.632293080054274,
"grad_norm": 0.7058789473959215,
"learning_rate": 3.14237519313639e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2726551294326782,
"step": 1940,
"valid_targets_mean": 2646.4,
"valid_targets_min": 764
},
{
"epoch": 2.639077340569878,
"grad_norm": 0.6700353317554494,
"learning_rate": 3.1368147555624486e-05,
"loss": 0.2599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2708538770675659,
"step": 1945,
"valid_targets_mean": 3069.9,
"valid_targets_min": 1199
},
{
"epoch": 2.645861601085482,
"grad_norm": 0.7323325511038016,
"learning_rate": 3.131241306359426e-05,
"loss": 0.2517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605024576187134,
"step": 1950,
"valid_targets_mean": 2873.1,
"valid_targets_min": 680
},
{
"epoch": 2.6526458616010853,
"grad_norm": 0.6879553895964564,
"learning_rate": 3.125654909319294e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2747609615325928,
"step": 1955,
"valid_targets_mean": 3061.4,
"valid_targets_min": 865
},
{
"epoch": 2.659430122116689,
"grad_norm": 0.6920353888734679,
"learning_rate": 3.120055628382218e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23946809768676758,
"step": 1960,
"valid_targets_mean": 2961.5,
"valid_targets_min": 1092
},
{
"epoch": 2.666214382632293,
"grad_norm": 0.6453205678625881,
"learning_rate": 3.1144435276358325e-05,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27227306365966797,
"step": 1965,
"valid_targets_mean": 3088.8,
"valid_targets_min": 1145
},
{
"epoch": 2.672998643147897,
"grad_norm": 0.6921138419734034,
"learning_rate": 3.1088186713145024e-05,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25944316387176514,
"step": 1970,
"valid_targets_mean": 2601.7,
"valid_targets_min": 762
},
{
"epoch": 2.679782903663501,
"grad_norm": 0.6778135167815581,
"learning_rate": 3.103181123798587e-05,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24725311994552612,
"step": 1975,
"valid_targets_mean": 2674.5,
"valid_targets_min": 869
},
{
"epoch": 2.6865671641791042,
"grad_norm": 0.7351183532910395,
"learning_rate": 3.0975309496137066e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25560200214385986,
"step": 1980,
"valid_targets_mean": 2353.3,
"valid_targets_min": 538
},
{
"epoch": 2.693351424694708,
"grad_norm": 0.6182324179687427,
"learning_rate": 3.091868213430004e-05,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22743821144104004,
"step": 1985,
"valid_targets_mean": 2698.8,
"valid_targets_min": 701
},
{
"epoch": 2.700135685210312,
"grad_norm": 0.7363935013486361,
"learning_rate": 3.086192980061399e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27139535546302795,
"step": 1990,
"valid_targets_mean": 2369.6,
"valid_targets_min": 1089
},
{
"epoch": 2.706919945725916,
"grad_norm": 0.6440601737571228,
"learning_rate": 3.080505314464854e-05,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23245973885059357,
"step": 1995,
"valid_targets_mean": 2775.4,
"valid_targets_min": 810
},
{
"epoch": 2.7137042062415198,
"grad_norm": 0.6702282934429393,
"learning_rate": 3.0748052817396254e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2478809952735901,
"step": 2000,
"valid_targets_mean": 2646.8,
"valid_targets_min": 1399
},
{
"epoch": 2.7204884667571236,
"grad_norm": 0.6800473944399235,
"learning_rate": 3.0690929471265185e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24637192487716675,
"step": 2005,
"valid_targets_mean": 2696.4,
"valid_targets_min": 793
},
{
"epoch": 2.7272727272727275,
"grad_norm": 0.6303354724046744,
"learning_rate": 3.063368376007145e-05,
"loss": 0.2606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26109838485717773,
"step": 2010,
"valid_targets_mean": 3292.2,
"valid_targets_min": 1629
},
{
"epoch": 2.734056987788331,
"grad_norm": 0.6765904914853859,
"learning_rate": 3.057631633903167e-05,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24430710077285767,
"step": 2015,
"valid_targets_mean": 2731.6,
"valid_targets_min": 746
},
{
"epoch": 2.740841248303935,
"grad_norm": 0.6432972439515613,
"learning_rate": 3.05188278647556e-05,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23854488134384155,
"step": 2020,
"valid_targets_mean": 2842.9,
"valid_targets_min": 1268
},
{
"epoch": 2.7476255088195387,
"grad_norm": 0.6577825459454796,
"learning_rate": 3.0461218995238453e-05,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.254770427942276,
"step": 2025,
"valid_targets_mean": 2721.9,
"valid_targets_min": 1257
},
{
"epoch": 2.7544097693351426,
"grad_norm": 0.6949351773395782,
"learning_rate": 3.0403490389853484e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23568594455718994,
"step": 2030,
"valid_targets_mean": 2796.5,
"valid_targets_min": 1147
},
{
"epoch": 2.7611940298507465,
"grad_norm": 0.7323091372332017,
"learning_rate": 3.034564270934442e-05,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26838138699531555,
"step": 2035,
"valid_targets_mean": 2450.1,
"valid_targets_min": 627
},
{
"epoch": 2.76797829036635,
"grad_norm": 0.7072050298374907,
"learning_rate": 3.0287676615817854e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2603970468044281,
"step": 2040,
"valid_targets_mean": 2724.6,
"valid_targets_min": 662
},
{
"epoch": 2.774762550881954,
"grad_norm": 0.7013954312412192,
"learning_rate": 3.0229592772735717e-05,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2462655007839203,
"step": 2045,
"valid_targets_mean": 2669.0,
"valid_targets_min": 796
},
{
"epoch": 2.7815468113975577,
"grad_norm": 0.7194087010991239,
"learning_rate": 3.0171391844907663e-05,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22803866863250732,
"step": 2050,
"valid_targets_mean": 2516.1,
"valid_targets_min": 1199
},
{
"epoch": 2.7883310719131615,
"grad_norm": 0.6532424708668592,
"learning_rate": 3.011307449848345e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25693702697753906,
"step": 2055,
"valid_targets_mean": 2905.6,
"valid_targets_min": 981
},
{
"epoch": 2.7951153324287654,
"grad_norm": 0.6019841138198014,
"learning_rate": 3.0054641400945354e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2629098892211914,
"step": 2060,
"valid_targets_mean": 3336.9,
"valid_targets_min": 1009
},
{
"epoch": 2.801899592944369,
"grad_norm": 0.590938009064258,
"learning_rate": 2.9996093221100468e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24467141926288605,
"step": 2065,
"valid_targets_mean": 3226.9,
"valid_targets_min": 597
},
{
"epoch": 2.8086838534599727,
"grad_norm": 0.6853913375855859,
"learning_rate": 2.993743062907311e-05,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3042706549167633,
"step": 2070,
"valid_targets_mean": 3042.9,
"valid_targets_min": 1170
},
{
"epoch": 2.8154681139755766,
"grad_norm": 0.6566966730503214,
"learning_rate": 2.9878654296297112e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26403605937957764,
"step": 2075,
"valid_targets_mean": 3035.4,
"valid_targets_min": 1044
},
{
"epoch": 2.8222523744911805,
"grad_norm": 0.7543020252020352,
"learning_rate": 2.981976489550814e-05,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24550700187683105,
"step": 2080,
"valid_targets_mean": 2845.9,
"valid_targets_min": 1216
},
{
"epoch": 2.8290366350067844,
"grad_norm": 0.7093980696165589,
"learning_rate": 2.9760763100736016e-05,
"loss": 0.2486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2348649501800537,
"step": 2085,
"valid_targets_mean": 2346.6,
"valid_targets_min": 692
},
{
"epoch": 2.835820895522388,
"grad_norm": 0.6549172444022449,
"learning_rate": 2.970164958729698e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21750161051750183,
"step": 2090,
"valid_targets_mean": 2408.1,
"valid_targets_min": 799
},
{
"epoch": 2.842605156037992,
"grad_norm": 0.8065514310435659,
"learning_rate": 2.964242503178597e-05,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26003286242485046,
"step": 2095,
"valid_targets_mean": 1907.9,
"valid_targets_min": 793
},
{
"epoch": 2.8493894165535956,
"grad_norm": 0.578124344699749,
"learning_rate": 2.958309011206888e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605810761451721,
"step": 2100,
"valid_targets_mean": 3794.0,
"valid_targets_min": 1360
},
{
"epoch": 2.8561736770691994,
"grad_norm": 0.6706934642907637,
"learning_rate": 2.9523645507274798e-05,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2569592297077179,
"step": 2105,
"valid_targets_mean": 2656.1,
"valid_targets_min": 1266
},
{
"epoch": 2.8629579375848033,
"grad_norm": 0.7102884408604969,
"learning_rate": 2.9464091897788232e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27441930770874023,
"step": 2110,
"valid_targets_mean": 2542.4,
"valid_targets_min": 821
},
{
"epoch": 2.869742198100407,
"grad_norm": 0.6396640888363082,
"learning_rate": 2.940442996524132e-05,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28722479939460754,
"step": 2115,
"valid_targets_mean": 3116.9,
"valid_targets_min": 1036
},
{
"epoch": 2.876526458616011,
"grad_norm": 0.8432323434605307,
"learning_rate": 2.9344660392506043e-05,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28614795207977295,
"step": 2120,
"valid_targets_mean": 3104.6,
"valid_targets_min": 818
},
{
"epoch": 2.8833107191316145,
"grad_norm": 0.6395419218584879,
"learning_rate": 2.9284783863686382e-05,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2634587287902832,
"step": 2125,
"valid_targets_mean": 3117.6,
"valid_targets_min": 760
},
{
"epoch": 2.8900949796472184,
"grad_norm": 0.5718851345375481,
"learning_rate": 2.922480106411053e-05,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2612381875514984,
"step": 2130,
"valid_targets_mean": 3635.0,
"valid_targets_min": 761
},
{
"epoch": 2.8968792401628223,
"grad_norm": 0.6528582956501181,
"learning_rate": 2.9164712680322984e-05,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2157207727432251,
"step": 2135,
"valid_targets_mean": 2491.8,
"valid_targets_min": 765
},
{
"epoch": 2.903663500678426,
"grad_norm": 0.8098720111841451,
"learning_rate": 2.9104519400076766e-05,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25750282406806946,
"step": 2140,
"valid_targets_mean": 2004.3,
"valid_targets_min": 743
},
{
"epoch": 2.91044776119403,
"grad_norm": 0.6201356506537019,
"learning_rate": 2.9044221912325486e-05,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2485671043395996,
"step": 2145,
"valid_targets_mean": 3226.1,
"valid_targets_min": 697
},
{
"epoch": 2.9172320217096335,
"grad_norm": 0.6786949165909485,
"learning_rate": 2.8983820907215475e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21794003248214722,
"step": 2150,
"valid_targets_mean": 2685.1,
"valid_targets_min": 803
},
{
"epoch": 2.9240162822252374,
"grad_norm": 0.6196782492846893,
"learning_rate": 2.8923317076077915e-05,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.259111225605011,
"step": 2155,
"valid_targets_mean": 3168.1,
"valid_targets_min": 1185
},
{
"epoch": 2.9308005427408412,
"grad_norm": 0.6506882542165565,
"learning_rate": 2.8862711111420893e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25076574087142944,
"step": 2160,
"valid_targets_mean": 3034.2,
"valid_targets_min": 1049
},
{
"epoch": 2.937584803256445,
"grad_norm": 0.6853337250211714,
"learning_rate": 2.8802003706921468e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2712341547012329,
"step": 2165,
"valid_targets_mean": 2867.3,
"valid_targets_min": 786
},
{
"epoch": 2.944369063772049,
"grad_norm": 0.7641884011034288,
"learning_rate": 2.8741195557417775e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769216001033783,
"step": 2170,
"valid_targets_mean": 2302.2,
"valid_targets_min": 705
},
{
"epoch": 2.9511533242876524,
"grad_norm": 0.6826360549379976,
"learning_rate": 2.8680287358901028e-05,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24993981420993805,
"step": 2175,
"valid_targets_mean": 2850.9,
"valid_targets_min": 761
},
{
"epoch": 2.9579375848032563,
"grad_norm": 0.7221044998473106,
"learning_rate": 2.861927980850757e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25909918546676636,
"step": 2180,
"valid_targets_mean": 2386.6,
"valid_targets_min": 671
},
{
"epoch": 2.96472184531886,
"grad_norm": 0.7377714080476292,
"learning_rate": 2.8558173604510907e-05,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22513189911842346,
"step": 2185,
"valid_targets_mean": 2357.4,
"valid_targets_min": 634
},
{
"epoch": 2.971506105834464,
"grad_norm": 0.5623921608095559,
"learning_rate": 2.849696944631369e-05,
"loss": 0.2559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26851212978363037,
"step": 2190,
"valid_targets_mean": 4109.2,
"valid_targets_min": 1134
},
{
"epoch": 2.978290366350068,
"grad_norm": 0.6103524586471685,
"learning_rate": 2.8435668034439738e-05,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2774103879928589,
"step": 2195,
"valid_targets_mean": 3372.1,
"valid_targets_min": 1052
},
{
"epoch": 2.9850746268656714,
"grad_norm": 0.6165970882379855,
"learning_rate": 2.8374270070525988e-05,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23035350441932678,
"step": 2200,
"valid_targets_mean": 3327.9,
"valid_targets_min": 857
},
{
"epoch": 2.9918588873812757,
"grad_norm": 0.7660874337227206,
"learning_rate": 2.8312776257314497e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2771637737751007,
"step": 2205,
"valid_targets_mean": 2188.8,
"valid_targets_min": 712
},
{
"epoch": 2.998643147896879,
"grad_norm": 0.678819967572549,
"learning_rate": 2.8251187298644372e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25125089287757874,
"step": 2210,
"valid_targets_mean": 2593.7,
"valid_targets_min": 826
},
{
"epoch": 3.005427408412483,
"grad_norm": 0.6195799648166698,
"learning_rate": 2.818950389944374e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21490924060344696,
"step": 2215,
"valid_targets_mean": 3076.2,
"valid_targets_min": 1375
},
{
"epoch": 3.012211668928087,
"grad_norm": 0.741799685467653,
"learning_rate": 2.812772676572165e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2147355079650879,
"step": 2220,
"valid_targets_mean": 2800.7,
"valid_targets_min": 842
},
{
"epoch": 3.0189959294436908,
"grad_norm": 0.6481778989984706,
"learning_rate": 2.806585660456001e-05,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21204230189323425,
"step": 2225,
"valid_targets_mean": 3253.1,
"valid_targets_min": 1058
},
{
"epoch": 3.0257801899592947,
"grad_norm": 0.7528798552940739,
"learning_rate": 2.8003894124105494e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24220474064350128,
"step": 2230,
"valid_targets_mean": 2921.9,
"valid_targets_min": 1386
},
{
"epoch": 3.032564450474898,
"grad_norm": 0.7539503673228278,
"learning_rate": 2.794184003356144e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2737279236316681,
"step": 2235,
"valid_targets_mean": 2459.6,
"valid_targets_min": 938
},
{
"epoch": 3.039348710990502,
"grad_norm": 0.6860093065024846,
"learning_rate": 2.787969504317972e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23056598007678986,
"step": 2240,
"valid_targets_mean": 3120.1,
"valid_targets_min": 700
},
{
"epoch": 3.046132971506106,
"grad_norm": 0.6742437476536095,
"learning_rate": 2.7817459864252606e-05,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2076399177312851,
"step": 2245,
"valid_targets_mean": 2751.0,
"valid_targets_min": 716
},
{
"epoch": 3.0529172320217097,
"grad_norm": 0.6601870684447021,
"learning_rate": 2.7755135209104673e-05,
"loss": 0.2115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21040399372577667,
"step": 2250,
"valid_targets_mean": 2970.5,
"valid_targets_min": 1266
},
{
"epoch": 3.0597014925373136,
"grad_norm": 0.7655435099255181,
"learning_rate": 2.769272179108458e-05,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24985858798027039,
"step": 2255,
"valid_targets_mean": 3437.8,
"valid_targets_min": 1114
},
{
"epoch": 3.066485753052917,
"grad_norm": 0.7149714320640186,
"learning_rate": 2.7630220324556947e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21348509192466736,
"step": 2260,
"valid_targets_mean": 2941.0,
"valid_targets_min": 1039
},
{
"epoch": 3.073270013568521,
"grad_norm": 0.7792687892843089,
"learning_rate": 2.756763152489418e-05,
"loss": 0.2094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20965218544006348,
"step": 2265,
"valid_targets_mean": 1918.6,
"valid_targets_min": 822
},
{
"epoch": 3.080054274084125,
"grad_norm": 0.6597990538607253,
"learning_rate": 2.7504956108468262e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24037772417068481,
"step": 2270,
"valid_targets_mean": 3295.2,
"valid_targets_min": 1204
},
{
"epoch": 3.0868385345997287,
"grad_norm": 0.7852404129824124,
"learning_rate": 2.7442194792642576e-05,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26370474696159363,
"step": 2275,
"valid_targets_mean": 2461.3,
"valid_targets_min": 1207
},
{
"epoch": 3.0936227951153326,
"grad_norm": 0.6324909016089244,
"learning_rate": 2.737934829576367e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19589462876319885,
"step": 2280,
"valid_targets_mean": 2882.0,
"valid_targets_min": 1016
},
{
"epoch": 3.1004070556309364,
"grad_norm": 0.7132616114200901,
"learning_rate": 2.7316417337153053e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21955709159374237,
"step": 2285,
"valid_targets_mean": 2424.4,
"valid_targets_min": 744
},
{
"epoch": 3.10719131614654,
"grad_norm": 0.6627034885187564,
"learning_rate": 2.7253402637098963e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2161223590373993,
"step": 2290,
"valid_targets_mean": 2994.9,
"valid_targets_min": 1254
},
{
"epoch": 3.1139755766621438,
"grad_norm": 0.7133154934701709,
"learning_rate": 2.7190304916848114e-05,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22376814484596252,
"step": 2295,
"valid_targets_mean": 2787.6,
"valid_targets_min": 952
},
{
"epoch": 3.1207598371777476,
"grad_norm": 0.7291074383267475,
"learning_rate": 2.712712489859743e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23834912478923798,
"step": 2300,
"valid_targets_mean": 2901.0,
"valid_targets_min": 615
},
{
"epoch": 3.1275440976933515,
"grad_norm": 0.7568349432173351,
"learning_rate": 2.706386330548581e-05,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19825339317321777,
"step": 2305,
"valid_targets_mean": 2677.8,
"valid_targets_min": 967
},
{
"epoch": 3.1343283582089554,
"grad_norm": 0.7241979030877912,
"learning_rate": 2.7000520861585825e-05,
"loss": 0.2177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22395247220993042,
"step": 2310,
"valid_targets_mean": 2555.9,
"valid_targets_min": 890
},
{
"epoch": 3.141112618724559,
"grad_norm": 0.7176875343032588,
"learning_rate": 2.693709829189544e-05,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21689847111701965,
"step": 2315,
"valid_targets_mean": 2447.6,
"valid_targets_min": 865
},
{
"epoch": 3.1478968792401627,
"grad_norm": 0.8624810704747251,
"learning_rate": 2.6873596322329717e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2509344816207886,
"step": 2320,
"valid_targets_mean": 1913.9,
"valid_targets_min": 676
},
{
"epoch": 3.1546811397557666,
"grad_norm": 0.6434418388849583,
"learning_rate": 2.6810015679712505e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22354134917259216,
"step": 2325,
"valid_targets_mean": 3262.2,
"valid_targets_min": 1113
},
{
"epoch": 3.1614654002713705,
"grad_norm": 0.7907645012767848,
"learning_rate": 2.6746357091768116e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22720026969909668,
"step": 2330,
"valid_targets_mean": 2312.9,
"valid_targets_min": 774
},
{
"epoch": 3.1682496607869743,
"grad_norm": 0.7095701119398697,
"learning_rate": 2.6682621287113e-05,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23232200741767883,
"step": 2335,
"valid_targets_mean": 2940.6,
"valid_targets_min": 1009
},
{
"epoch": 3.175033921302578,
"grad_norm": 0.6882795435130347,
"learning_rate": 2.6618808995247408e-05,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22832772135734558,
"step": 2340,
"valid_targets_mean": 2938.8,
"valid_targets_min": 888
},
{
"epoch": 3.1818181818181817,
"grad_norm": 0.6135099997369059,
"learning_rate": 2.6554920946547044e-05,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23073089122772217,
"step": 2345,
"valid_targets_mean": 3286.8,
"valid_targets_min": 768
},
{
"epoch": 3.1886024423337855,
"grad_norm": 0.9423077941270365,
"learning_rate": 2.649095787225469e-05,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2254088819026947,
"step": 2350,
"valid_targets_mean": 2568.0,
"valid_targets_min": 1236
},
{
"epoch": 3.1953867028493894,
"grad_norm": 0.810975408154495,
"learning_rate": 2.6426920504471865e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21835219860076904,
"step": 2355,
"valid_targets_mean": 2296.8,
"valid_targets_min": 692
},
{
"epoch": 3.2021709633649933,
"grad_norm": 0.672655439805317,
"learning_rate": 2.636280957615041e-05,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22122296690940857,
"step": 2360,
"valid_targets_mean": 2792.6,
"valid_targets_min": 802
},
{
"epoch": 3.208955223880597,
"grad_norm": 0.7434847650835706,
"learning_rate": 2.6298625821084128e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21797284483909607,
"step": 2365,
"valid_targets_mean": 2498.4,
"valid_targets_min": 1153
},
{
"epoch": 3.2157394843962006,
"grad_norm": 0.6570222965023365,
"learning_rate": 2.6234369973900372e-05,
"loss": 0.2208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2033863663673401,
"step": 2370,
"valid_targets_mean": 2630.6,
"valid_targets_min": 770
},
{
"epoch": 3.2225237449118045,
"grad_norm": 0.8657617678949259,
"learning_rate": 2.6170042770051635e-05,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.225327730178833,
"step": 2375,
"valid_targets_mean": 1854.9,
"valid_targets_min": 732
},
{
"epoch": 3.2293080054274084,
"grad_norm": 0.7046910890483484,
"learning_rate": 2.610564494580714e-05,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22602598369121552,
"step": 2380,
"valid_targets_mean": 2542.6,
"valid_targets_min": 742
},
{
"epoch": 3.2360922659430122,
"grad_norm": 0.6740596140779037,
"learning_rate": 2.604117723824441e-05,
"loss": 0.2288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23400309681892395,
"step": 2385,
"valid_targets_mean": 3017.3,
"valid_targets_min": 760
},
{
"epoch": 3.242876526458616,
"grad_norm": 0.7404070619144895,
"learning_rate": 2.597664038524083e-05,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2237531542778015,
"step": 2390,
"valid_targets_mean": 2550.8,
"valid_targets_min": 1095
},
{
"epoch": 3.24966078697422,
"grad_norm": 0.6731318456534926,
"learning_rate": 2.5912035125465208e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2236143946647644,
"step": 2395,
"valid_targets_mean": 2946.1,
"valid_targets_min": 800
},
{
"epoch": 3.2564450474898234,
"grad_norm": 0.7464562402100164,
"learning_rate": 2.5847362198369297e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542741298675537,
"step": 2400,
"valid_targets_mean": 2603.9,
"valid_targets_min": 746
},
{
"epoch": 3.2632293080054273,
"grad_norm": 0.7388159380991954,
"learning_rate": 2.578262234417937e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21536928415298462,
"step": 2405,
"valid_targets_mean": 2555.2,
"valid_targets_min": 974
},
{
"epoch": 3.270013568521031,
"grad_norm": 0.7355746785542672,
"learning_rate": 2.5717816303887703e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21950095891952515,
"step": 2410,
"valid_targets_mean": 2990.9,
"valid_targets_min": 996
},
{
"epoch": 3.276797829036635,
"grad_norm": 0.7517171398028017,
"learning_rate": 2.565294481924415e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20042955875396729,
"step": 2415,
"valid_targets_mean": 2606.8,
"valid_targets_min": 799
},
{
"epoch": 3.283582089552239,
"grad_norm": 0.7068185853149664,
"learning_rate": 2.5588008632747593e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22197219729423523,
"step": 2420,
"valid_targets_mean": 3084.1,
"valid_targets_min": 825
},
{
"epoch": 3.290366350067843,
"grad_norm": 0.7279583182044714,
"learning_rate": 2.5523008487637482e-05,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2149057388305664,
"step": 2425,
"valid_targets_mean": 2391.9,
"valid_targets_min": 734
},
{
"epoch": 3.2971506105834463,
"grad_norm": 0.6422722168754591,
"learning_rate": 2.5457945127885318e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24687312543392181,
"step": 2430,
"valid_targets_mean": 3709.7,
"valid_targets_min": 952
},
{
"epoch": 3.30393487109905,
"grad_norm": 0.6945878436621437,
"learning_rate": 2.539281929818614e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2088148444890976,
"step": 2435,
"valid_targets_mean": 2683.1,
"valid_targets_min": 797
},
{
"epoch": 3.310719131614654,
"grad_norm": 0.8469589878253486,
"learning_rate": 2.5327631743949982e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22623956203460693,
"step": 2440,
"valid_targets_mean": 2050.2,
"valid_targets_min": 625
},
{
"epoch": 3.317503392130258,
"grad_norm": 0.7039682068648079,
"learning_rate": 2.5262383211293386e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22464679181575775,
"step": 2445,
"valid_targets_mean": 3066.5,
"valid_targets_min": 835
},
{
"epoch": 3.324287652645862,
"grad_norm": 0.6549956329113884,
"learning_rate": 2.51970744470308e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25542882084846497,
"step": 2450,
"valid_targets_mean": 3588.2,
"valid_targets_min": 741
},
{
"epoch": 3.3310719131614652,
"grad_norm": 0.6922641541400616,
"learning_rate": 2.5131706198666104e-05,
"loss": 0.2177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21417692303657532,
"step": 2455,
"valid_targets_mean": 2714.5,
"valid_targets_min": 933
},
{
"epoch": 3.337856173677069,
"grad_norm": 0.6313775940838555,
"learning_rate": 2.506627921438397e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20802749693393707,
"step": 2460,
"valid_targets_mean": 3045.8,
"valid_targets_min": 852
},
{
"epoch": 3.344640434192673,
"grad_norm": 0.6419716617358177,
"learning_rate": 2.5000794243041386e-05,
"loss": 0.2146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20835299789905548,
"step": 2465,
"valid_targets_mean": 2813.1,
"valid_targets_min": 734
},
{
"epoch": 3.351424694708277,
"grad_norm": 0.6155938516766296,
"learning_rate": 2.4935252034159016e-05,
"loss": 0.2169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23357100784778595,
"step": 2470,
"valid_targets_mean": 3461.4,
"valid_targets_min": 1589
},
{
"epoch": 3.3582089552238807,
"grad_norm": 0.6931971140884506,
"learning_rate": 2.4869653337912652e-05,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23858122527599335,
"step": 2475,
"valid_targets_mean": 3166.2,
"valid_targets_min": 1026
},
{
"epoch": 3.364993215739484,
"grad_norm": 0.7398849431239813,
"learning_rate": 2.480399890512462e-05,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24428343772888184,
"step": 2480,
"valid_targets_mean": 2540.5,
"valid_targets_min": 1101
},
{
"epoch": 3.371777476255088,
"grad_norm": 0.7128166603516436,
"learning_rate": 2.4738289487255198e-05,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22879432141780853,
"step": 2485,
"valid_targets_mean": 2861.1,
"valid_targets_min": 1266
},
{
"epoch": 3.378561736770692,
"grad_norm": 0.7552252749221059,
"learning_rate": 2.4672525836394003e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22698278725147247,
"step": 2490,
"valid_targets_mean": 2579.4,
"valid_targets_min": 889
},
{
"epoch": 3.385345997286296,
"grad_norm": 0.8012197815964346,
"learning_rate": 2.4606708705251383e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23777778446674347,
"step": 2495,
"valid_targets_mean": 2214.4,
"valid_targets_min": 873
},
{
"epoch": 3.3921302578018997,
"grad_norm": 0.7100109651223878,
"learning_rate": 2.4540838847149805e-05,
"loss": 0.2169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2334587723016739,
"step": 2500,
"valid_targets_mean": 2754.7,
"valid_targets_min": 1320
},
{
"epoch": 3.3989145183175036,
"grad_norm": 0.7594298936519028,
"learning_rate": 2.4474917016015233e-05,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21707573533058167,
"step": 2505,
"valid_targets_mean": 2143.0,
"valid_targets_min": 538
},
{
"epoch": 3.405698778833107,
"grad_norm": 0.6554539535978531,
"learning_rate": 2.4408943966368502e-05,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22429423034191132,
"step": 2510,
"valid_targets_mean": 3002.5,
"valid_targets_min": 698
},
{
"epoch": 3.412483039348711,
"grad_norm": 0.5678144037578754,
"learning_rate": 2.4342920453316677e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21168120205402374,
"step": 2515,
"valid_targets_mean": 4258.6,
"valid_targets_min": 839
},
{
"epoch": 3.4192672998643148,
"grad_norm": 1.1608859512029313,
"learning_rate": 2.42768472325444e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2512350082397461,
"step": 2520,
"valid_targets_mean": 2730.8,
"valid_targets_min": 1116
},
{
"epoch": 3.4260515603799186,
"grad_norm": 0.6794646407442558,
"learning_rate": 2.4210725060305277e-05,
"loss": 0.2264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23531343042850494,
"step": 2525,
"valid_targets_mean": 3514.7,
"valid_targets_min": 1334
},
{
"epoch": 3.4328358208955225,
"grad_norm": 0.6399640137952785,
"learning_rate": 2.4144554693413165e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22536537051200867,
"step": 2530,
"valid_targets_mean": 3192.2,
"valid_targets_min": 960
},
{
"epoch": 3.4396200814111264,
"grad_norm": 0.6662119295193443,
"learning_rate": 2.407833688923357e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22147254645824432,
"step": 2535,
"valid_targets_mean": 2992.2,
"valid_targets_min": 1501
},
{
"epoch": 3.44640434192673,
"grad_norm": 0.6891237720043712,
"learning_rate": 2.401207240567493e-05,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20989638566970825,
"step": 2540,
"valid_targets_mean": 2869.4,
"valid_targets_min": 810
},
{
"epoch": 3.4531886024423337,
"grad_norm": 0.5733593611937268,
"learning_rate": 2.3945762001179988e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20587453246116638,
"step": 2545,
"valid_targets_mean": 3843.9,
"valid_targets_min": 1250
},
{
"epoch": 3.4599728629579376,
"grad_norm": 0.7227077896335035,
"learning_rate": 2.3879406434717048e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2688782811164856,
"step": 2550,
"valid_targets_mean": 3092.1,
"valid_targets_min": 800
},
{
"epoch": 3.4667571234735415,
"grad_norm": 0.729804276811994,
"learning_rate": 2.381300646577135e-05,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2293173372745514,
"step": 2555,
"valid_targets_mean": 2722.3,
"valid_targets_min": 725
},
{
"epoch": 3.4735413839891454,
"grad_norm": 0.7089336749170233,
"learning_rate": 2.3746562854336347e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24235443770885468,
"step": 2560,
"valid_targets_mean": 2771.2,
"valid_targets_min": 795
},
{
"epoch": 3.480325644504749,
"grad_norm": 0.7144987230267648,
"learning_rate": 2.3680076360904996e-05,
"loss": 0.2172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22750988602638245,
"step": 2565,
"valid_targets_mean": 2600.1,
"valid_targets_min": 686
},
{
"epoch": 3.4871099050203527,
"grad_norm": 0.6752212573282049,
"learning_rate": 2.3613547746461082e-05,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24150076508522034,
"step": 2570,
"valid_targets_mean": 3270.1,
"valid_targets_min": 874
},
{
"epoch": 3.4938941655359566,
"grad_norm": 0.7590308205931211,
"learning_rate": 2.3546977772470494e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22371584177017212,
"step": 2575,
"valid_targets_mean": 2490.2,
"valid_targets_min": 810
},
{
"epoch": 3.5006784260515604,
"grad_norm": 0.7870240421440323,
"learning_rate": 2.3480367200872504e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23015907406806946,
"step": 2580,
"valid_targets_mean": 2033.2,
"valid_targets_min": 1066
},
{
"epoch": 3.5074626865671643,
"grad_norm": 0.923419749026049,
"learning_rate": 2.341371679407106e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.207190603017807,
"step": 2585,
"valid_targets_mean": 2550.9,
"valid_targets_min": 822
},
{
"epoch": 3.5142469470827677,
"grad_norm": 0.7046771506431182,
"learning_rate": 2.3347027314926032e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22681497037410736,
"step": 2590,
"valid_targets_mean": 2633.1,
"valid_targets_min": 719
},
{
"epoch": 3.5210312075983716,
"grad_norm": 0.6097178720133104,
"learning_rate": 2.328029952674452e-05,
"loss": 0.2303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21856877207756042,
"step": 2595,
"valid_targets_mean": 4060.4,
"valid_targets_min": 1722
},
{
"epoch": 3.5278154681139755,
"grad_norm": 0.7646075625057801,
"learning_rate": 2.321353419327209e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2248585820198059,
"step": 2600,
"valid_targets_mean": 2429.2,
"valid_targets_min": 810
},
{
"epoch": 3.5345997286295794,
"grad_norm": 0.6929279550589781,
"learning_rate": 2.314673207868404e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24431878328323364,
"step": 2605,
"valid_targets_mean": 2962.9,
"valid_targets_min": 655
},
{
"epoch": 3.5413839891451833,
"grad_norm": 0.6480909726367313,
"learning_rate": 2.307989394757665e-05,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22717615962028503,
"step": 2610,
"valid_targets_mean": 3731.4,
"valid_targets_min": 1001
},
{
"epoch": 3.5481682496607867,
"grad_norm": 0.7186879086898086,
"learning_rate": 2.301302056495845e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2136261910200119,
"step": 2615,
"valid_targets_mean": 2418.2,
"valid_targets_min": 705
},
{
"epoch": 3.554952510176391,
"grad_norm": 0.806809670872252,
"learning_rate": 2.2946112696241414e-05,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22997555136680603,
"step": 2620,
"valid_targets_mean": 2120.0,
"valid_targets_min": 680
},
{
"epoch": 3.5617367706919945,
"grad_norm": 0.6741591468113703,
"learning_rate": 2.2879171107232274e-05,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2275179922580719,
"step": 2625,
"valid_targets_mean": 3001.9,
"valid_targets_min": 1175
},
{
"epoch": 3.5685210312075983,
"grad_norm": 0.7318902025413816,
"learning_rate": 2.2812196564123683e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21598154306411743,
"step": 2630,
"valid_targets_mean": 2405.4,
"valid_targets_min": 986
},
{
"epoch": 3.575305291723202,
"grad_norm": 0.7506970585357591,
"learning_rate": 2.274518983348549e-05,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24321120977401733,
"step": 2635,
"valid_targets_mean": 2461.9,
"valid_targets_min": 907
},
{
"epoch": 3.582089552238806,
"grad_norm": 0.6629205823156629,
"learning_rate": 2.267815168225596e-05,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2191721647977829,
"step": 2640,
"valid_targets_mean": 2622.9,
"valid_targets_min": 882
},
{
"epoch": 3.58887381275441,
"grad_norm": 0.7533189468195941,
"learning_rate": 2.2611082877732954e-05,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24864350259304047,
"step": 2645,
"valid_targets_mean": 2555.6,
"valid_targets_min": 684
},
{
"epoch": 3.5956580732700134,
"grad_norm": 0.6177690316825468,
"learning_rate": 2.2543984187565227e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23729315400123596,
"step": 2650,
"valid_targets_mean": 3457.9,
"valid_targets_min": 1279
},
{
"epoch": 3.6024423337856173,
"grad_norm": 0.7158165102846912,
"learning_rate": 2.2476856379743567e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23067063093185425,
"step": 2655,
"valid_targets_mean": 2960.2,
"valid_targets_min": 722
},
{
"epoch": 3.609226594301221,
"grad_norm": 0.7707372511866211,
"learning_rate": 2.2409700222592042e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22069093585014343,
"step": 2660,
"valid_targets_mean": 2546.6,
"valid_targets_min": 668
},
{
"epoch": 3.616010854816825,
"grad_norm": 0.6052180371912904,
"learning_rate": 2.23425164847592e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21380861103534698,
"step": 2665,
"valid_targets_mean": 3455.1,
"valid_targets_min": 742
},
{
"epoch": 3.622795115332429,
"grad_norm": 0.7047656744984836,
"learning_rate": 2.227530593520926e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24715712666511536,
"step": 2670,
"valid_targets_mean": 3540.6,
"valid_targets_min": 1327
},
{
"epoch": 3.6295793758480324,
"grad_norm": 0.6745230951755198,
"learning_rate": 2.2208069343213326e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23651158809661865,
"step": 2675,
"valid_targets_mean": 3037.1,
"valid_targets_min": 972
},
{
"epoch": 3.6363636363636362,
"grad_norm": 0.623368182400207,
"learning_rate": 2.2140807478340582e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22128023207187653,
"step": 2680,
"valid_targets_mean": 3301.1,
"valid_targets_min": 724
},
{
"epoch": 3.64314789687924,
"grad_norm": 0.6649128121001402,
"learning_rate": 2.2073521110449456e-05,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2295609414577484,
"step": 2685,
"valid_targets_mean": 3177.9,
"valid_targets_min": 1144
},
{
"epoch": 3.649932157394844,
"grad_norm": 0.6882954051754054,
"learning_rate": 2.200621100967886e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2442229986190796,
"step": 2690,
"valid_targets_mean": 3074.8,
"valid_targets_min": 856
},
{
"epoch": 3.656716417910448,
"grad_norm": 0.6820903463422161,
"learning_rate": 2.193887794643932e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23110562562942505,
"step": 2695,
"valid_targets_mean": 3172.8,
"valid_targets_min": 1124
},
{
"epoch": 3.6635006784260513,
"grad_norm": 0.6997238880911637,
"learning_rate": 2.187152269140419e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21552921831607819,
"step": 2700,
"valid_targets_mean": 2677.4,
"valid_targets_min": 814
},
{
"epoch": 3.670284938941655,
"grad_norm": 0.7131884522201282,
"learning_rate": 2.180414601550084e-05,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2269384115934372,
"step": 2705,
"valid_targets_mean": 2801.8,
"valid_targets_min": 1388
},
{
"epoch": 3.677069199457259,
"grad_norm": 0.7172347353831631,
"learning_rate": 2.1736748689901792e-05,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22936025261878967,
"step": 2710,
"valid_targets_mean": 2702.1,
"valid_targets_min": 1312
},
{
"epoch": 3.683853459972863,
"grad_norm": 0.6583901504326424,
"learning_rate": 2.1669331486015942e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.221341073513031,
"step": 2715,
"valid_targets_mean": 2726.4,
"valid_targets_min": 1008
},
{
"epoch": 3.690637720488467,
"grad_norm": 0.6670649918476067,
"learning_rate": 2.1601895175479677e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18742845952510834,
"step": 2720,
"valid_targets_mean": 2824.9,
"valid_targets_min": 741
},
{
"epoch": 3.6974219810040707,
"grad_norm": 0.7043411361057197,
"learning_rate": 2.1534440530148104e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.224558025598526,
"step": 2725,
"valid_targets_mean": 2730.9,
"valid_targets_min": 901
},
{
"epoch": 3.7042062415196746,
"grad_norm": 0.8290546440140429,
"learning_rate": 2.1466968322086168e-05,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24871769547462463,
"step": 2730,
"valid_targets_mean": 2595.6,
"valid_targets_min": 629
},
{
"epoch": 3.710990502035278,
"grad_norm": 0.6684634109147515,
"learning_rate": 2.1399479323559837e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22964484989643097,
"step": 2735,
"valid_targets_mean": 3235.6,
"valid_targets_min": 657
},
{
"epoch": 3.717774762550882,
"grad_norm": 0.6468283601913088,
"learning_rate": 2.133197430702725e-05,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22138440608978271,
"step": 2740,
"valid_targets_mean": 2955.9,
"valid_targets_min": 742
},
{
"epoch": 3.724559023066486,
"grad_norm": 0.6848302786495842,
"learning_rate": 2.1264454045129885e-05,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23357048630714417,
"step": 2745,
"valid_targets_mean": 2971.2,
"valid_targets_min": 876
},
{
"epoch": 3.7313432835820897,
"grad_norm": 0.8076399629104075,
"learning_rate": 2.1196919310683722e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24134433269500732,
"step": 2750,
"valid_targets_mean": 2742.0,
"valid_targets_min": 1227
},
{
"epoch": 3.7381275440976935,
"grad_norm": 0.7937429467781824,
"learning_rate": 2.112937087667039e-05,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23753595352172852,
"step": 2755,
"valid_targets_mean": 2422.7,
"valid_targets_min": 1122
},
{
"epoch": 3.744911804613297,
"grad_norm": 0.6806559152552468,
"learning_rate": 2.106180951622829e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.241061270236969,
"step": 2760,
"valid_targets_mean": 2973.4,
"valid_targets_min": 1078
},
{
"epoch": 3.751696065128901,
"grad_norm": 0.695950276005158,
"learning_rate": 2.0994236002643822e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20735937356948853,
"step": 2765,
"valid_targets_mean": 2495.0,
"valid_targets_min": 728
},
{
"epoch": 3.7584803256445047,
"grad_norm": 0.8597190728087525,
"learning_rate": 2.0926651109342457e-05,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2300506830215454,
"step": 2770,
"valid_targets_mean": 2055.6,
"valid_targets_min": 730
},
{
"epoch": 3.7652645861601086,
"grad_norm": 0.7385601024810353,
"learning_rate": 2.0859055609879916e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23074880242347717,
"step": 2775,
"valid_targets_mean": 2834.2,
"valid_targets_min": 611
},
{
"epoch": 3.7720488466757125,
"grad_norm": 0.7000695708428455,
"learning_rate": 2.0791450277933322e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21346724033355713,
"step": 2780,
"valid_targets_mean": 2711.2,
"valid_targets_min": 763
},
{
"epoch": 3.778833107191316,
"grad_norm": 0.6921395024706539,
"learning_rate": 2.0723835887292334e-05,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2142827957868576,
"step": 2785,
"valid_targets_mean": 2578.4,
"valid_targets_min": 1125
},
{
"epoch": 3.78561736770692,
"grad_norm": 0.7682439574392755,
"learning_rate": 2.0656213211850295e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21348156034946442,
"step": 2790,
"valid_targets_mean": 2177.8,
"valid_targets_min": 635
},
{
"epoch": 3.7924016282225237,
"grad_norm": 0.7600371041182261,
"learning_rate": 2.058858302559537e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23701968789100647,
"step": 2795,
"valid_targets_mean": 2633.8,
"valid_targets_min": 868
},
{
"epoch": 3.7991858887381276,
"grad_norm": 0.7139158160982614,
"learning_rate": 2.05209461026017e-05,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.233786478638649,
"step": 2800,
"valid_targets_mean": 2587.3,
"valid_targets_min": 943
},
{
"epoch": 3.8059701492537314,
"grad_norm": 0.7176024981852444,
"learning_rate": 2.045330321702053e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22029541432857513,
"step": 2805,
"valid_targets_mean": 2586.6,
"valid_targets_min": 770
},
{
"epoch": 3.812754409769335,
"grad_norm": 0.6149619152466096,
"learning_rate": 2.0385655143071336e-05,
"loss": 0.2159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19177527725696564,
"step": 2810,
"valid_targets_mean": 3115.8,
"valid_targets_min": 634
},
{
"epoch": 3.819538670284939,
"grad_norm": 0.6945022382481121,
"learning_rate": 2.031800265503299e-05,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2345021814107895,
"step": 2815,
"valid_targets_mean": 3089.4,
"valid_targets_min": 484
},
{
"epoch": 3.8263229308005426,
"grad_norm": 0.718365382422882,
"learning_rate": 2.02503465272349e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21639087796211243,
"step": 2820,
"valid_targets_mean": 2522.1,
"valid_targets_min": 675
},
{
"epoch": 3.8331071913161465,
"grad_norm": 0.7049711808427084,
"learning_rate": 2.0182687534048107e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24925465881824493,
"step": 2825,
"valid_targets_mean": 2881.4,
"valid_targets_min": 875
},
{
"epoch": 3.8398914518317504,
"grad_norm": 0.7569193242813216,
"learning_rate": 2.011502644987646e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2595372796058655,
"step": 2830,
"valid_targets_mean": 2309.4,
"valid_targets_min": 801
},
{
"epoch": 3.8466757123473543,
"grad_norm": 0.6067978450699282,
"learning_rate": 2.0047364049147747e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21039123833179474,
"step": 2835,
"valid_targets_mean": 3391.3,
"valid_targets_min": 805
},
{
"epoch": 3.853459972862958,
"grad_norm": 0.6539018194253448,
"learning_rate": 1.9979701106304824e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.241075336933136,
"step": 2840,
"valid_targets_mean": 2985.6,
"valid_targets_min": 1362
},
{
"epoch": 3.8602442333785616,
"grad_norm": 0.672599881101891,
"learning_rate": 1.991203839579674e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2360815405845642,
"step": 2845,
"valid_targets_mean": 2885.5,
"valid_targets_min": 663
},
{
"epoch": 3.8670284938941655,
"grad_norm": 0.7800657928131475,
"learning_rate": 1.984437669206989e-05,
"loss": 0.2148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20892655849456787,
"step": 2850,
"valid_targets_mean": 2320.9,
"valid_targets_min": 917
},
{
"epoch": 3.8738127544097694,
"grad_norm": 0.6676687527814975,
"learning_rate": 1.9776716769559157e-05,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22498619556427002,
"step": 2855,
"valid_targets_mean": 3164.1,
"valid_targets_min": 1241
},
{
"epoch": 3.8805970149253732,
"grad_norm": 0.5995122983093996,
"learning_rate": 1.970905940267902e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21802213788032532,
"step": 2860,
"valid_targets_mean": 3898.9,
"valid_targets_min": 914
},
{
"epoch": 3.887381275440977,
"grad_norm": 0.647688327782899,
"learning_rate": 1.9641405365814717e-05,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21417051553726196,
"step": 2865,
"valid_targets_mean": 3167.7,
"valid_targets_min": 758
},
{
"epoch": 3.8941655359565805,
"grad_norm": 0.6546310967035971,
"learning_rate": 1.9573755433313378e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2323242872953415,
"step": 2870,
"valid_targets_mean": 3041.1,
"valid_targets_min": 1319
},
{
"epoch": 3.9009497964721844,
"grad_norm": 0.7383143695334415,
"learning_rate": 1.9506110379475128e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2311961054801941,
"step": 2875,
"valid_targets_mean": 2362.9,
"valid_targets_min": 750
},
{
"epoch": 3.9077340569877883,
"grad_norm": 0.8430450237904688,
"learning_rate": 1.9438470978544287e-05,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21592223644256592,
"step": 2880,
"valid_targets_mean": 3625.7,
"valid_targets_min": 1167
},
{
"epoch": 3.914518317503392,
"grad_norm": 0.7707831179099163,
"learning_rate": 1.9370838004700455e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24675382673740387,
"step": 2885,
"valid_targets_mean": 2393.0,
"valid_targets_min": 1011
},
{
"epoch": 3.921302578018996,
"grad_norm": 0.7280249588483818,
"learning_rate": 1.930321223204967e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24415768682956696,
"step": 2890,
"valid_targets_mean": 2570.4,
"valid_targets_min": 1242
},
{
"epoch": 3.9280868385345995,
"grad_norm": 0.7871720247148984,
"learning_rate": 1.9235594434615552e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21705761551856995,
"step": 2895,
"valid_targets_mean": 2329.9,
"valid_targets_min": 934
},
{
"epoch": 3.9348710990502034,
"grad_norm": 0.6824607839533505,
"learning_rate": 1.9167985386330435e-05,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2021501511335373,
"step": 2900,
"valid_targets_mean": 3006.3,
"valid_targets_min": 1460
},
{
"epoch": 3.9416553595658073,
"grad_norm": 0.580360164037747,
"learning_rate": 1.910038586102652e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18379102647304535,
"step": 2905,
"valid_targets_mean": 2916.4,
"valid_targets_min": 927
},
{
"epoch": 3.948439620081411,
"grad_norm": 0.7244276692797579,
"learning_rate": 1.9032796632427e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22763890027999878,
"step": 2910,
"valid_targets_mean": 2483.5,
"valid_targets_min": 831
},
{
"epoch": 3.955223880597015,
"grad_norm": 0.7606015895849964,
"learning_rate": 1.896521847413722e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2129872590303421,
"step": 2915,
"valid_targets_mean": 2604.8,
"valid_targets_min": 1424
},
{
"epoch": 3.9620081411126185,
"grad_norm": 0.7996005811272329,
"learning_rate": 1.8897652159635826e-05,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2276165634393692,
"step": 2920,
"valid_targets_mean": 2545.5,
"valid_targets_min": 1333
},
{
"epoch": 3.9687924016282228,
"grad_norm": 0.6306491453103433,
"learning_rate": 1.8830098462265892e-05,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2229669839143753,
"step": 2925,
"valid_targets_mean": 3271.3,
"valid_targets_min": 1296
},
{
"epoch": 3.975576662143826,
"grad_norm": 0.7155034374723849,
"learning_rate": 1.8762558155226086e-05,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23799753189086914,
"step": 2930,
"valid_targets_mean": 2748.9,
"valid_targets_min": 632
},
{
"epoch": 3.98236092265943,
"grad_norm": 0.8976533438979097,
"learning_rate": 1.869503201156181e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20464091002941132,
"step": 2935,
"valid_targets_mean": 1909.6,
"valid_targets_min": 883
},
{
"epoch": 3.989145183175034,
"grad_norm": 0.6624349548194711,
"learning_rate": 1.8627520804156365e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22667071223258972,
"step": 2940,
"valid_targets_mean": 3271.6,
"valid_targets_min": 623
},
{
"epoch": 3.995929443690638,
"grad_norm": 0.6151495628097419,
"learning_rate": 1.856002530572209e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21382832527160645,
"step": 2945,
"valid_targets_mean": 3332.6,
"valid_targets_min": 1190
},
{
"epoch": 4.002713704206242,
"grad_norm": 0.615787649304689,
"learning_rate": 1.8492546288791518e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19524888694286346,
"step": 2950,
"valid_targets_mean": 3521.4,
"valid_targets_min": 1057
},
{
"epoch": 4.009497964721845,
"grad_norm": 0.7774165923273912,
"learning_rate": 1.842508452570855e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20001152157783508,
"step": 2955,
"valid_targets_mean": 2349.4,
"valid_targets_min": 662
},
{
"epoch": 4.0162822252374495,
"grad_norm": 0.664596861061304,
"learning_rate": 1.8357640788619605e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21963298320770264,
"step": 2960,
"valid_targets_mean": 3053.3,
"valid_targets_min": 789
},
{
"epoch": 4.023066485753053,
"grad_norm": 0.7193062756351686,
"learning_rate": 1.8290215849464773e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2050497829914093,
"step": 2965,
"valid_targets_mean": 2874.3,
"valid_targets_min": 1465
},
{
"epoch": 4.029850746268656,
"grad_norm": 0.7682247189848644,
"learning_rate": 1.8222810479969e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20245233178138733,
"step": 2970,
"valid_targets_mean": 2529.4,
"valid_targets_min": 706
},
{
"epoch": 4.036635006784261,
"grad_norm": 0.7099650203393719,
"learning_rate": 1.815542545163323e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18782241642475128,
"step": 2975,
"valid_targets_mean": 2867.7,
"valid_targets_min": 856
},
{
"epoch": 4.043419267299864,
"grad_norm": 0.6679826007373775,
"learning_rate": 1.808806153572561e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18531766533851624,
"step": 2980,
"valid_targets_mean": 3430.7,
"valid_targets_min": 733
},
{
"epoch": 4.050203527815468,
"grad_norm": 0.6971278596727647,
"learning_rate": 1.802071950327261e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1951214224100113,
"step": 2985,
"valid_targets_mean": 2909.7,
"valid_targets_min": 728
},
{
"epoch": 4.056987788331072,
"grad_norm": 0.6975225843392714,
"learning_rate": 1.7953400125050252e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19596266746520996,
"step": 2990,
"valid_targets_mean": 3136.7,
"valid_targets_min": 591
},
{
"epoch": 4.063772048846675,
"grad_norm": 0.616610532499199,
"learning_rate": 1.7886104171575264e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17603719234466553,
"step": 2995,
"valid_targets_mean": 3788.1,
"valid_targets_min": 700
},
{
"epoch": 4.07055630936228,
"grad_norm": 0.8204028517819303,
"learning_rate": 1.7818832413096248e-05,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1822405755519867,
"step": 3000,
"valid_targets_mean": 2084.1,
"valid_targets_min": 950
},
{
"epoch": 4.077340569877883,
"grad_norm": 0.8644454831039673,
"learning_rate": 1.775158561958489e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21637216210365295,
"step": 3005,
"valid_targets_mean": 2142.1,
"valid_targets_min": 1117
},
{
"epoch": 4.084124830393487,
"grad_norm": 0.6868713845692973,
"learning_rate": 1.768436456072713e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17520518600940704,
"step": 3010,
"valid_targets_mean": 3152.6,
"valid_targets_min": 1144
},
{
"epoch": 4.090909090909091,
"grad_norm": 0.646335349816201,
"learning_rate": 1.7617170005914363e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18921396136283875,
"step": 3015,
"valid_targets_mean": 3166.6,
"valid_targets_min": 1255
},
{
"epoch": 4.097693351424695,
"grad_norm": 0.7095934220573488,
"learning_rate": 1.755000272423461e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18535733222961426,
"step": 3020,
"valid_targets_mean": 2847.2,
"valid_targets_min": 1211
},
{
"epoch": 4.104477611940299,
"grad_norm": 0.7722733457306606,
"learning_rate": 1.7482863484463747e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1878623217344284,
"step": 3025,
"valid_targets_mean": 2357.7,
"valid_targets_min": 796
},
{
"epoch": 4.111261872455902,
"grad_norm": 0.7558210158635994,
"learning_rate": 1.7415753055056693e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20962506532669067,
"step": 3030,
"valid_targets_mean": 2774.4,
"valid_targets_min": 689
},
{
"epoch": 4.118046132971506,
"grad_norm": 0.7019234157644559,
"learning_rate": 1.73486722041386e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17214052379131317,
"step": 3035,
"valid_targets_mean": 2344.8,
"valid_targets_min": 720
},
{
"epoch": 4.12483039348711,
"grad_norm": 0.7056358240413717,
"learning_rate": 1.7281621699496086e-05,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18809084594249725,
"step": 3040,
"valid_targets_mean": 2753.2,
"valid_targets_min": 985
},
{
"epoch": 4.131614654002714,
"grad_norm": 0.7928593105079518,
"learning_rate": 1.7214602308568426e-05,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16787604987621307,
"step": 3045,
"valid_targets_mean": 2298.5,
"valid_targets_min": 883
},
{
"epoch": 4.1383989145183175,
"grad_norm": 0.7453927190983547,
"learning_rate": 1.714761479843879e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2303515374660492,
"step": 3050,
"valid_targets_mean": 3051.8,
"valid_targets_min": 1135
},
{
"epoch": 4.145183175033921,
"grad_norm": 0.7004503623184913,
"learning_rate": 1.708065993582543e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1861414909362793,
"step": 3055,
"valid_targets_mean": 2926.8,
"valid_targets_min": 704
},
{
"epoch": 4.151967435549525,
"grad_norm": 0.5969912948853561,
"learning_rate": 1.701373848707294e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16732157766819,
"step": 3060,
"valid_targets_mean": 3249.8,
"valid_targets_min": 759
},
{
"epoch": 4.158751696065129,
"grad_norm": 0.7889354028527934,
"learning_rate": 1.6946851218143464e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2116738259792328,
"step": 3065,
"valid_targets_mean": 2610.2,
"valid_targets_min": 1017
},
{
"epoch": 4.165535956580733,
"grad_norm": 0.6969382167538735,
"learning_rate": 1.6879998894607937e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.184125155210495,
"step": 3070,
"valid_targets_mean": 2778.3,
"valid_targets_min": 761
},
{
"epoch": 4.1723202170963365,
"grad_norm": 0.7661282970421094,
"learning_rate": 1.6813182281637318e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18725869059562683,
"step": 3075,
"valid_targets_mean": 2373.2,
"valid_targets_min": 785
},
{
"epoch": 4.17910447761194,
"grad_norm": 0.7127514162035592,
"learning_rate": 1.674640214399383e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20451834797859192,
"step": 3080,
"valid_targets_mean": 3058.9,
"valid_targets_min": 804
},
{
"epoch": 4.185888738127544,
"grad_norm": 0.7261600863010719,
"learning_rate": 1.6679659246022224e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19646155834197998,
"step": 3085,
"valid_targets_mean": 2840.0,
"valid_targets_min": 742
},
{
"epoch": 4.192672998643148,
"grad_norm": 0.7318920710785716,
"learning_rate": 1.6612954351641004e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1673353910446167,
"step": 3090,
"valid_targets_mean": 2456.0,
"valid_targets_min": 774
},
{
"epoch": 4.199457259158752,
"grad_norm": 0.7618896273234488,
"learning_rate": 1.65462882243337e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2328355312347412,
"step": 3095,
"valid_targets_mean": 2732.4,
"valid_targets_min": 662
},
{
"epoch": 4.2062415196743554,
"grad_norm": 0.6950613889947367,
"learning_rate": 1.6479661627140125e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21082782745361328,
"step": 3100,
"valid_targets_mean": 3076.4,
"valid_targets_min": 993
},
{
"epoch": 4.213025780189959,
"grad_norm": 0.7422212651396944,
"learning_rate": 1.6413075322647645e-05,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17804861068725586,
"step": 3105,
"valid_targets_mean": 2741.3,
"valid_targets_min": 1230
},
{
"epoch": 4.219810040705563,
"grad_norm": 0.8313162708546203,
"learning_rate": 1.634653007298245e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21381892263889313,
"step": 3110,
"valid_targets_mean": 2521.1,
"valid_targets_min": 918
},
{
"epoch": 4.226594301221167,
"grad_norm": 0.7343807869521366,
"learning_rate": 1.628002663980083e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18454739451408386,
"step": 3115,
"valid_targets_mean": 3389.7,
"valid_targets_min": 944
},
{
"epoch": 4.233378561736771,
"grad_norm": 0.7180737684834317,
"learning_rate": 1.6213565784280448e-05,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20628373324871063,
"step": 3120,
"valid_targets_mean": 2695.5,
"valid_targets_min": 1330
},
{
"epoch": 4.240162822252374,
"grad_norm": 0.7446535802715553,
"learning_rate": 1.6147148267111648e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20070384442806244,
"step": 3125,
"valid_targets_mean": 2581.9,
"valid_targets_min": 1108
},
{
"epoch": 4.246947082767978,
"grad_norm": 0.7867961809991622,
"learning_rate": 1.608077484848872e-05,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21188589930534363,
"step": 3130,
"valid_targets_mean": 2598.0,
"valid_targets_min": 754
},
{
"epoch": 4.253731343283582,
"grad_norm": 0.7452760690333677,
"learning_rate": 1.601444628810124e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19212831556797028,
"step": 3135,
"valid_targets_mean": 2548.9,
"valid_targets_min": 801
},
{
"epoch": 4.260515603799186,
"grad_norm": 0.640609370408385,
"learning_rate": 1.5948163345125322e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1867392212152481,
"step": 3140,
"valid_targets_mean": 2978.2,
"valid_targets_min": 893
},
{
"epoch": 4.26729986431479,
"grad_norm": 0.7904463927412828,
"learning_rate": 1.5881926778214985e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18848653137683868,
"step": 3145,
"valid_targets_mean": 2162.2,
"valid_targets_min": 657
},
{
"epoch": 4.274084124830393,
"grad_norm": 0.6862590326254344,
"learning_rate": 1.581573734549342e-05,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19391348958015442,
"step": 3150,
"valid_targets_mean": 2840.2,
"valid_targets_min": 796
},
{
"epoch": 4.280868385345998,
"grad_norm": 0.753930226852254,
"learning_rate": 1.574959580454435e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2218829095363617,
"step": 3155,
"valid_targets_mean": 2770.5,
"valid_targets_min": 791
},
{
"epoch": 4.287652645861601,
"grad_norm": 0.7173848707428967,
"learning_rate": 1.5683502912403334e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18789169192314148,
"step": 3160,
"valid_targets_mean": 2473.1,
"valid_targets_min": 1324
},
{
"epoch": 4.2944369063772045,
"grad_norm": 0.6756808344570617,
"learning_rate": 1.5617459425549118e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17631642520427704,
"step": 3165,
"valid_targets_mean": 2783.0,
"valid_targets_min": 898
},
{
"epoch": 4.301221166892809,
"grad_norm": 0.7596274040196479,
"learning_rate": 1.555146609989496e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19371306896209717,
"step": 3170,
"valid_targets_mean": 2678.5,
"valid_targets_min": 999
},
{
"epoch": 4.308005427408412,
"grad_norm": 0.7950503499609197,
"learning_rate": 1.5485523690780003e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20015594363212585,
"step": 3175,
"valid_targets_mean": 2270.9,
"valid_targets_min": 1330
},
{
"epoch": 4.314789687924017,
"grad_norm": 0.6284596925256105,
"learning_rate": 1.5419632952960605e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16846656799316406,
"step": 3180,
"valid_targets_mean": 3001.5,
"valid_targets_min": 584
},
{
"epoch": 4.32157394843962,
"grad_norm": 0.6201630615003697,
"learning_rate": 1.5353794640601716e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18524964153766632,
"step": 3185,
"valid_targets_mean": 3645.7,
"valid_targets_min": 1501
},
{
"epoch": 4.3283582089552235,
"grad_norm": 0.711809826493421,
"learning_rate": 1.5288009507268237e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21540531516075134,
"step": 3190,
"valid_targets_mean": 3402.2,
"valid_targets_min": 1522
},
{
"epoch": 4.335142469470828,
"grad_norm": 0.6972934803265656,
"learning_rate": 1.5222278305916398e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18640825152397156,
"step": 3195,
"valid_targets_mean": 3293.5,
"valid_targets_min": 1126
},
{
"epoch": 4.341926729986431,
"grad_norm": 0.6481026199784268,
"learning_rate": 1.5156601788885148e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1833941638469696,
"step": 3200,
"valid_targets_mean": 3167.9,
"valid_targets_min": 1106
},
{
"epoch": 4.348710990502036,
"grad_norm": 0.8208339691617204,
"learning_rate": 1.5090980707887516e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2145204246044159,
"step": 3205,
"valid_targets_mean": 2193.7,
"valid_targets_min": 739
},
{
"epoch": 4.355495251017639,
"grad_norm": 0.6739050449873922,
"learning_rate": 1.5025415814002053e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19558805227279663,
"step": 3210,
"valid_targets_mean": 3247.9,
"valid_targets_min": 930
},
{
"epoch": 4.362279511533243,
"grad_norm": 0.7330699785639507,
"learning_rate": 1.4959907857664193e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20514100790023804,
"step": 3215,
"valid_targets_mean": 2830.6,
"valid_targets_min": 947
},
{
"epoch": 4.369063772048847,
"grad_norm": 0.7397083988883265,
"learning_rate": 1.4894457588657685e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20222502946853638,
"step": 3220,
"valid_targets_mean": 2764.8,
"valid_targets_min": 815
},
{
"epoch": 4.37584803256445,
"grad_norm": 0.8585950766535199,
"learning_rate": 1.4829065756106011e-05,
"loss": 0.1869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2083539068698883,
"step": 3225,
"valid_targets_mean": 3063.8,
"valid_targets_min": 704
},
{
"epoch": 4.3826322930800545,
"grad_norm": 0.6992154976029811,
"learning_rate": 1.47637331084638e-05,
"loss": 0.1968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18280436098575592,
"step": 3230,
"valid_targets_mean": 2991.1,
"valid_targets_min": 922
},
{
"epoch": 4.389416553595658,
"grad_norm": 0.7220348383997678,
"learning_rate": 1.4698460393508279e-05,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17603710293769836,
"step": 3235,
"valid_targets_mean": 2676.9,
"valid_targets_min": 683
},
{
"epoch": 4.396200814111262,
"grad_norm": 0.6815437556740436,
"learning_rate": 1.4633248358330685e-05,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17538878321647644,
"step": 3240,
"valid_targets_mean": 2802.6,
"valid_targets_min": 923
},
{
"epoch": 4.402985074626866,
"grad_norm": 0.7423631904328546,
"learning_rate": 1.4568097749327755e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2101781815290451,
"step": 3245,
"valid_targets_mean": 2564.9,
"valid_targets_min": 933
},
{
"epoch": 4.409769335142469,
"grad_norm": 0.6279743544457285,
"learning_rate": 1.4503009312193145e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18776188790798187,
"step": 3250,
"valid_targets_mean": 3485.3,
"valid_targets_min": 1216
},
{
"epoch": 4.4165535956580735,
"grad_norm": 0.72461497188728,
"learning_rate": 1.4437983791908927e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19717328250408173,
"step": 3255,
"valid_targets_mean": 2907.9,
"valid_targets_min": 875
},
{
"epoch": 4.423337856173677,
"grad_norm": 0.8394035988938123,
"learning_rate": 1.4373021932737029e-05,
"loss": 0.198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2060231864452362,
"step": 3260,
"valid_targets_mean": 2521.2,
"valid_targets_min": 861
},
{
"epoch": 4.430122116689281,
"grad_norm": 0.7846496377698511,
"learning_rate": 1.4308124478210743e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18877476453781128,
"step": 3265,
"valid_targets_mean": 2120.6,
"valid_targets_min": 908
},
{
"epoch": 4.436906377204885,
"grad_norm": 0.7718040186575822,
"learning_rate": 1.4243292171126206e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1813274621963501,
"step": 3270,
"valid_targets_mean": 2067.4,
"valid_targets_min": 744
},
{
"epoch": 4.443690637720488,
"grad_norm": 0.8763562192740045,
"learning_rate": 1.4178525753533898e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1990664005279541,
"step": 3275,
"valid_targets_mean": 1895.3,
"valid_targets_min": 675
},
{
"epoch": 4.450474898236092,
"grad_norm": 0.7818367524680697,
"learning_rate": 1.4113825966730141e-05,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2248629331588745,
"step": 3280,
"valid_targets_mean": 2445.3,
"valid_targets_min": 686
},
{
"epoch": 4.457259158751696,
"grad_norm": 0.7080706103494964,
"learning_rate": 1.4049193551248625e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19344773888587952,
"step": 3285,
"valid_targets_mean": 2806.9,
"valid_targets_min": 1092
},
{
"epoch": 4.4640434192673,
"grad_norm": 0.6352432822796971,
"learning_rate": 1.3984629246851938e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18108458817005157,
"step": 3290,
"valid_targets_mean": 3230.6,
"valid_targets_min": 703
},
{
"epoch": 4.470827679782904,
"grad_norm": 0.7766733822813426,
"learning_rate": 1.3920133792523075e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20187707245349884,
"step": 3295,
"valid_targets_mean": 2388.1,
"valid_targets_min": 898
},
{
"epoch": 4.477611940298507,
"grad_norm": 0.6809158943751472,
"learning_rate": 1.3855707926457003e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1838938295841217,
"step": 3300,
"valid_targets_mean": 2920.3,
"valid_targets_min": 837
},
{
"epoch": 4.484396200814111,
"grad_norm": 0.7081716006567864,
"learning_rate": 1.3791352386052201e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18974432349205017,
"step": 3305,
"valid_targets_mean": 2833.9,
"valid_targets_min": 818
},
{
"epoch": 4.491180461329715,
"grad_norm": 0.767864152806456,
"learning_rate": 1.3727067907902232e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18521273136138916,
"step": 3310,
"valid_targets_mean": 2255.4,
"valid_targets_min": 420
},
{
"epoch": 4.497964721845319,
"grad_norm": 0.688596857727443,
"learning_rate": 1.366285522778728e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1874987781047821,
"step": 3315,
"valid_targets_mean": 2975.4,
"valid_targets_min": 1163
},
{
"epoch": 4.504748982360923,
"grad_norm": 0.7386731368747045,
"learning_rate": 1.359871508066577e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20306339859962463,
"step": 3320,
"valid_targets_mean": 2857.8,
"valid_targets_min": 757
},
{
"epoch": 4.511533242876526,
"grad_norm": 0.8257894045478894,
"learning_rate": 1.3534648200665933e-05,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18575474619865417,
"step": 3325,
"valid_targets_mean": 2783.4,
"valid_targets_min": 980
},
{
"epoch": 4.51831750339213,
"grad_norm": 0.6867092598234874,
"learning_rate": 1.3470655321077403e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18126091361045837,
"step": 3330,
"valid_targets_mean": 2647.6,
"valid_targets_min": 848
},
{
"epoch": 4.525101763907734,
"grad_norm": 0.7798112286441644,
"learning_rate": 1.3406737174342834e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23899130523204803,
"step": 3335,
"valid_targets_mean": 2828.8,
"valid_targets_min": 738
},
{
"epoch": 4.531886024423338,
"grad_norm": 0.7069921488313058,
"learning_rate": 1.3342894492049504e-05,
"loss": 0.2048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20431819558143616,
"step": 3340,
"valid_targets_mean": 3127.2,
"valid_targets_min": 1317
},
{
"epoch": 4.5386702849389415,
"grad_norm": 0.7506355898759934,
"learning_rate": 1.3279128004920958e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1895807385444641,
"step": 3345,
"valid_targets_mean": 2666.6,
"valid_targets_min": 1005
},
{
"epoch": 4.545454545454545,
"grad_norm": 0.6725468343286256,
"learning_rate": 1.3215438442808624e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2019132673740387,
"step": 3350,
"valid_targets_mean": 3209.2,
"valid_targets_min": 1059
},
{
"epoch": 4.552238805970149,
"grad_norm": 0.6889050275687484,
"learning_rate": 1.3151826534683474e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1907675564289093,
"step": 3355,
"valid_targets_mean": 3152.4,
"valid_targets_min": 785
},
{
"epoch": 4.559023066485753,
"grad_norm": 0.7190846116998305,
"learning_rate": 1.308829300862768e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18840348720550537,
"step": 3360,
"valid_targets_mean": 2810.2,
"valid_targets_min": 803
},
{
"epoch": 4.565807327001357,
"grad_norm": 0.6702795320500231,
"learning_rate": 1.3024838591826274e-05,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18903514742851257,
"step": 3365,
"valid_targets_mean": 3127.1,
"valid_targets_min": 1283
},
{
"epoch": 4.5725915875169605,
"grad_norm": 0.7488732753982411,
"learning_rate": 1.296146401055883e-05,
"loss": 0.2061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22193178534507751,
"step": 3370,
"valid_targets_mean": 3123.5,
"valid_targets_min": 700
},
{
"epoch": 4.579375848032565,
"grad_norm": 0.7263613305452004,
"learning_rate": 1.2898169990191148e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1917208731174469,
"step": 3375,
"valid_targets_mean": 2815.2,
"valid_targets_min": 734
},
{
"epoch": 4.586160108548168,
"grad_norm": 0.7868953900274589,
"learning_rate": 1.2834957255166948e-05,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17863771319389343,
"step": 3380,
"valid_targets_mean": 2261.1,
"valid_targets_min": 537
},
{
"epoch": 4.592944369063772,
"grad_norm": 0.7888410061782655,
"learning_rate": 1.2771826528999602e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20688292384147644,
"step": 3385,
"valid_targets_mean": 2547.2,
"valid_targets_min": 1028
},
{
"epoch": 4.599728629579376,
"grad_norm": 0.690580382285912,
"learning_rate": 1.2708778534263803e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17476820945739746,
"step": 3390,
"valid_targets_mean": 2701.8,
"valid_targets_min": 832
},
{
"epoch": 4.606512890094979,
"grad_norm": 0.7470662126944148,
"learning_rate": 1.2645813992587352e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.187617227435112,
"step": 3395,
"valid_targets_mean": 2586.8,
"valid_targets_min": 682
},
{
"epoch": 4.613297150610584,
"grad_norm": 1.2159270387590686,
"learning_rate": 1.258293362464286e-05,
"loss": 0.1988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1858140230178833,
"step": 3400,
"valid_targets_mean": 2249.7,
"valid_targets_min": 1083
},
{
"epoch": 4.620081411126187,
"grad_norm": 0.7718829974398066,
"learning_rate": 1.2520138150139515e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.183822900056839,
"step": 3405,
"valid_targets_mean": 2386.8,
"valid_targets_min": 821
},
{
"epoch": 4.6268656716417915,
"grad_norm": 0.7237060148317359,
"learning_rate": 1.2457428287814843e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2160126268863678,
"step": 3410,
"valid_targets_mean": 3024.9,
"valid_targets_min": 1350
},
{
"epoch": 4.633649932157395,
"grad_norm": 0.6970676682341086,
"learning_rate": 1.2394804755426478e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19945994019508362,
"step": 3415,
"valid_targets_mean": 2918.2,
"valid_targets_min": 474
},
{
"epoch": 4.640434192672998,
"grad_norm": 0.7002590495581039,
"learning_rate": 1.233226826974395e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1719842553138733,
"step": 3420,
"valid_targets_mean": 2718.7,
"valid_targets_min": 691
},
{
"epoch": 4.647218453188603,
"grad_norm": 0.6667044269630936,
"learning_rate": 1.2269819546540463e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17064428329467773,
"step": 3425,
"valid_targets_mean": 2865.0,
"valid_targets_min": 760
},
{
"epoch": 4.654002713704206,
"grad_norm": 0.6723526548267423,
"learning_rate": 1.2207459300584743e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17956231534481049,
"step": 3430,
"valid_targets_mean": 2932.9,
"valid_targets_min": 777
},
{
"epoch": 4.6607869742198105,
"grad_norm": 0.7597739606585969,
"learning_rate": 1.2145188245632825e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2012956440448761,
"step": 3435,
"valid_targets_mean": 2589.2,
"valid_targets_min": 847
},
{
"epoch": 4.667571234735414,
"grad_norm": 0.7411616368636825,
"learning_rate": 1.2083007094419883e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20920173823833466,
"step": 3440,
"valid_targets_mean": 2706.8,
"valid_targets_min": 802
},
{
"epoch": 4.674355495251017,
"grad_norm": 0.7282082144235389,
"learning_rate": 1.2020916558652089e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19379201531410217,
"step": 3445,
"valid_targets_mean": 2854.1,
"valid_targets_min": 1386
},
{
"epoch": 4.681139755766622,
"grad_norm": 0.7634331226060735,
"learning_rate": 1.195891734899846e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17866259813308716,
"step": 3450,
"valid_targets_mean": 2573.5,
"valid_targets_min": 655
},
{
"epoch": 4.687924016282225,
"grad_norm": 0.7399644965932646,
"learning_rate": 1.1897010175082722e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17755639553070068,
"step": 3455,
"valid_targets_mean": 2317.8,
"valid_targets_min": 727
},
{
"epoch": 4.694708276797829,
"grad_norm": 0.6760992330649304,
"learning_rate": 1.1835195745475167e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2119104415178299,
"step": 3460,
"valid_targets_mean": 3410.1,
"valid_targets_min": 1576
},
{
"epoch": 4.701492537313433,
"grad_norm": 0.804513682015714,
"learning_rate": 1.17734747676846e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19752076268196106,
"step": 3465,
"valid_targets_mean": 2760.2,
"valid_targets_min": 1040
},
{
"epoch": 4.708276797829036,
"grad_norm": 0.707949135936285,
"learning_rate": 1.1711847948150186e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20585331320762634,
"step": 3470,
"valid_targets_mean": 3060.6,
"valid_targets_min": 822
},
{
"epoch": 4.715061058344641,
"grad_norm": 0.7166396129531338,
"learning_rate": 1.1650315992233385e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20005938410758972,
"step": 3475,
"valid_targets_mean": 2918.9,
"valid_targets_min": 1040
},
{
"epoch": 4.721845318860244,
"grad_norm": 0.7074627055555082,
"learning_rate": 1.1588879604209881e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19769035279750824,
"step": 3480,
"valid_targets_mean": 2911.6,
"valid_targets_min": 897
},
{
"epoch": 4.728629579375848,
"grad_norm": 0.6735143020870807,
"learning_rate": 1.1527539487261506e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22932162880897522,
"step": 3485,
"valid_targets_mean": 3123.0,
"valid_targets_min": 992
},
{
"epoch": 4.735413839891452,
"grad_norm": 0.869273594031702,
"learning_rate": 1.1466296343468226e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19944173097610474,
"step": 3490,
"valid_targets_mean": 3747.2,
"valid_targets_min": 1122
},
{
"epoch": 4.742198100407055,
"grad_norm": 0.6999556266338184,
"learning_rate": 1.1405150873800061e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19584204256534576,
"step": 3495,
"valid_targets_mean": 2844.7,
"valid_targets_min": 659
},
{
"epoch": 4.74898236092266,
"grad_norm": 0.8746934337613864,
"learning_rate": 1.1344103778109087e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20564094185829163,
"step": 3500,
"valid_targets_mean": 2151.8,
"valid_targets_min": 854
},
{
"epoch": 4.755766621438263,
"grad_norm": 0.7003484221778359,
"learning_rate": 1.1283155755121435e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18846553564071655,
"step": 3505,
"valid_targets_mean": 3061.2,
"valid_targets_min": 734
},
{
"epoch": 4.762550881953867,
"grad_norm": 0.6735835369736797,
"learning_rate": 1.1222307502429263e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19506067037582397,
"step": 3510,
"valid_targets_mean": 3378.4,
"valid_targets_min": 1042
},
{
"epoch": 4.769335142469471,
"grad_norm": 0.6771476818137822,
"learning_rate": 1.116155971648281e-05,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2082287073135376,
"step": 3515,
"valid_targets_mean": 3448.1,
"valid_targets_min": 1111
},
{
"epoch": 4.776119402985074,
"grad_norm": 0.6422854879412622,
"learning_rate": 1.1100913092582374e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17519763112068176,
"step": 3520,
"valid_targets_mean": 3188.4,
"valid_targets_min": 627
},
{
"epoch": 4.7829036635006785,
"grad_norm": 0.6470472236301349,
"learning_rate": 1.1040368324870423e-05,
"loss": 0.1965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18372002243995667,
"step": 3525,
"valid_targets_mean": 3492.9,
"valid_targets_min": 1281
},
{
"epoch": 4.789687924016282,
"grad_norm": 0.6869308415003494,
"learning_rate": 1.0979926106323573e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19661110639572144,
"step": 3530,
"valid_targets_mean": 2938.6,
"valid_targets_min": 1216
},
{
"epoch": 4.796472184531886,
"grad_norm": 0.7662043660493066,
"learning_rate": 1.0919587128744706e-05,
"loss": 0.1965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22166971862316132,
"step": 3535,
"valid_targets_mean": 2690.3,
"valid_targets_min": 870
},
{
"epoch": 4.80325644504749,
"grad_norm": 0.7199094564088079,
"learning_rate": 1.0859352082755063e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20869404077529907,
"step": 3540,
"valid_targets_mean": 2830.1,
"valid_targets_min": 974
},
{
"epoch": 4.810040705563093,
"grad_norm": 0.7328326298477729,
"learning_rate": 1.0799221657786277e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19416038691997528,
"step": 3545,
"valid_targets_mean": 2855.2,
"valid_targets_min": 930
},
{
"epoch": 4.8168249660786975,
"grad_norm": 0.7338773028161634,
"learning_rate": 1.0739196542072554e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18774661421775818,
"step": 3550,
"valid_targets_mean": 2434.1,
"valid_targets_min": 548
},
{
"epoch": 4.823609226594301,
"grad_norm": 0.7453504801028396,
"learning_rate": 1.067927742264274e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19881319999694824,
"step": 3555,
"valid_targets_mean": 2629.6,
"valid_targets_min": 898
},
{
"epoch": 4.830393487109905,
"grad_norm": 0.7369431692578411,
"learning_rate": 1.0619464985312504e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17585620284080505,
"step": 3560,
"valid_targets_mean": 2719.1,
"valid_targets_min": 788
},
{
"epoch": 4.837177747625509,
"grad_norm": 0.9297708502664351,
"learning_rate": 1.0559759914676446e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22836661338806152,
"step": 3565,
"valid_targets_mean": 2168.1,
"valid_targets_min": 1005
},
{
"epoch": 4.843962008141113,
"grad_norm": 0.6894574277930866,
"learning_rate": 1.0500162894100274e-05,
"loss": 0.2012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19786593317985535,
"step": 3570,
"valid_targets_mean": 3260.4,
"valid_targets_min": 927
},
{
"epoch": 4.850746268656716,
"grad_norm": 0.8540680237621792,
"learning_rate": 1.0440674605713017e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18931138515472412,
"step": 3575,
"valid_targets_mean": 2123.2,
"valid_targets_min": 835
},
{
"epoch": 4.85753052917232,
"grad_norm": 0.7445669474855375,
"learning_rate": 1.0381295730399156e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.191728413105011,
"step": 3580,
"valid_targets_mean": 2410.1,
"valid_targets_min": 926
},
{
"epoch": 4.864314789687924,
"grad_norm": 0.7329229972435735,
"learning_rate": 1.03220269477909e-05,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22075408697128296,
"step": 3585,
"valid_targets_mean": 2925.0,
"valid_targets_min": 1200
},
{
"epoch": 4.871099050203528,
"grad_norm": 0.6758139766478201,
"learning_rate": 1.026286893626033e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19056375324726105,
"step": 3590,
"valid_targets_mean": 3506.6,
"valid_targets_min": 906
},
{
"epoch": 4.877883310719132,
"grad_norm": 0.7551370606263685,
"learning_rate": 1.0203822372911714e-05,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2027992308139801,
"step": 3595,
"valid_targets_mean": 2676.6,
"valid_targets_min": 1214
},
{
"epoch": 4.884667571234735,
"grad_norm": 0.7381200265506531,
"learning_rate": 1.0144887933573686e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18408526480197906,
"step": 3600,
"valid_targets_mean": 2631.5,
"valid_targets_min": 930
},
{
"epoch": 4.89145183175034,
"grad_norm": 0.7270532833777729,
"learning_rate": 1.0086066292791573e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17591014504432678,
"step": 3605,
"valid_targets_mean": 2436.2,
"valid_targets_min": 817
},
{
"epoch": 4.898236092265943,
"grad_norm": 0.7296787884141677,
"learning_rate": 1.0027358123819625e-05,
"loss": 0.1968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1968274563550949,
"step": 3610,
"valid_targets_mean": 2829.1,
"valid_targets_min": 733
},
{
"epoch": 4.905020352781547,
"grad_norm": 0.6735262562716569,
"learning_rate": 9.968764098613329e-06,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.178671196103096,
"step": 3615,
"valid_targets_mean": 2898.8,
"valid_targets_min": 727
},
{
"epoch": 4.911804613297151,
"grad_norm": 0.7274784816663047,
"learning_rate": 9.910284887821733e-06,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20386825501918793,
"step": 3620,
"valid_targets_mean": 2990.9,
"valid_targets_min": 1363
},
{
"epoch": 4.918588873812754,
"grad_norm": 0.8018638530971335,
"learning_rate": 9.851921160779729e-06,
"loss": 0.192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19886431097984314,
"step": 3625,
"valid_targets_mean": 2382.4,
"valid_targets_min": 614
},
{
"epoch": 4.925373134328359,
"grad_norm": 0.8315431805467934,
"learning_rate": 9.793673585500454e-06,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18963271379470825,
"step": 3630,
"valid_targets_mean": 2400.6,
"valid_targets_min": 770
},
{
"epoch": 4.932157394843962,
"grad_norm": 0.7403065285740312,
"learning_rate": 9.73554282866757e-06,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1916884034872055,
"step": 3635,
"valid_targets_mean": 2484.9,
"valid_targets_min": 801
},
{
"epoch": 4.9389416553595655,
"grad_norm": 0.8056592037843991,
"learning_rate": 9.677529555627705e-06,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1968856304883957,
"step": 3640,
"valid_targets_mean": 2373.9,
"valid_targets_min": 1222
},
{
"epoch": 4.94572591587517,
"grad_norm": 0.6847276217753911,
"learning_rate": 9.61963443038278e-06,
"loss": 0.1993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19165253639221191,
"step": 3645,
"valid_targets_mean": 3296.9,
"valid_targets_min": 642
},
{
"epoch": 4.952510176390773,
"grad_norm": 0.7481331426159193,
"learning_rate": 9.561858115582432e-06,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1881834864616394,
"step": 3650,
"valid_targets_mean": 2459.1,
"valid_targets_min": 737
},
{
"epoch": 4.959294436906378,
"grad_norm": 0.7380750762114332,
"learning_rate": 9.504201272516456e-06,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18983861804008484,
"step": 3655,
"valid_targets_mean": 2577.3,
"valid_targets_min": 896
},
{
"epoch": 4.966078697421981,
"grad_norm": 0.7036147611876263,
"learning_rate": 9.44666456110718e-06,
"loss": 0.1896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19570358097553253,
"step": 3660,
"valid_targets_mean": 3040.5,
"valid_targets_min": 724
},
{
"epoch": 4.9728629579375845,
"grad_norm": 0.7932038159884709,
"learning_rate": 9.38924863990197e-06,
"loss": 0.198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1836714744567871,
"step": 3665,
"valid_targets_mean": 2151.7,
"valid_targets_min": 923
},
{
"epoch": 4.979647218453189,
"grad_norm": 0.6964386837916756,
"learning_rate": 9.331954166065635e-06,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18505831062793732,
"step": 3670,
"valid_targets_mean": 2731.6,
"valid_targets_min": 1165
},
{
"epoch": 4.986431478968792,
"grad_norm": 0.7601196537242972,
"learning_rate": 9.27478179537297e-06,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19253486394882202,
"step": 3675,
"valid_targets_mean": 2509.4,
"valid_targets_min": 548
},
{
"epoch": 4.993215739484397,
"grad_norm": 0.8155086323774635,
"learning_rate": 9.217732182201184e-06,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19509343802928925,
"step": 3680,
"valid_targets_mean": 2026.9,
"valid_targets_min": 644
},
{
"epoch": 5.0,
"grad_norm": 0.7646808703457486,
"learning_rate": 9.160805979522452e-06,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18792404234409332,
"step": 3685,
"valid_targets_mean": 2684.2,
"valid_targets_min": 685
},
{
"epoch": 5.006784260515603,
"grad_norm": 0.6860326719249955,
"learning_rate": 9.104003838896445e-06,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1950758993625641,
"step": 3690,
"valid_targets_mean": 3155.7,
"valid_targets_min": 1030
},
{
"epoch": 5.013568521031208,
"grad_norm": 0.8441160581115864,
"learning_rate": 9.047326410462829e-06,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.161452516913414,
"step": 3695,
"valid_targets_mean": 1863.4,
"valid_targets_min": 839
},
{
"epoch": 5.020352781546811,
"grad_norm": 0.7067203784439574,
"learning_rate": 8.990774342933888e-06,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1699763685464859,
"step": 3700,
"valid_targets_mean": 3295.1,
"valid_targets_min": 923
},
{
"epoch": 5.0271370420624155,
"grad_norm": 0.7615352549068712,
"learning_rate": 8.934348283587029e-06,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1905319094657898,
"step": 3705,
"valid_targets_mean": 2832.2,
"valid_targets_min": 886
},
{
"epoch": 5.033921302578019,
"grad_norm": 0.7103293756116349,
"learning_rate": 8.878048878257443e-06,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1622033417224884,
"step": 3710,
"valid_targets_mean": 2561.1,
"valid_targets_min": 1241
},
{
"epoch": 5.040705563093622,
"grad_norm": 0.6718184525017369,
"learning_rate": 8.82187677133065e-06,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16609933972358704,
"step": 3715,
"valid_targets_mean": 3126.9,
"valid_targets_min": 881
},
{
"epoch": 5.047489823609227,
"grad_norm": 0.7837080600442082,
"learning_rate": 8.765832605735159e-06,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19446608424186707,
"step": 3720,
"valid_targets_mean": 2856.1,
"valid_targets_min": 880
},
{
"epoch": 5.05427408412483,
"grad_norm": 0.6563421792158702,
"learning_rate": 8.709917022935117e-06,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14738069474697113,
"step": 3725,
"valid_targets_mean": 2943.3,
"valid_targets_min": 901
},
{
"epoch": 5.0610583446404345,
"grad_norm": 0.8034887747351711,
"learning_rate": 8.654130662922927e-06,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18572455644607544,
"step": 3730,
"valid_targets_mean": 3047.0,
"valid_targets_min": 772
},
{
"epoch": 5.067842605156038,
"grad_norm": 0.7592407786525501,
"learning_rate": 8.59847416421198e-06,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18500494956970215,
"step": 3735,
"valid_targets_mean": 2576.2,
"valid_targets_min": 1356
},
{
"epoch": 5.074626865671641,
"grad_norm": 0.7045855658185989,
"learning_rate": 8.542948163829281e-06,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16853509843349457,
"step": 3740,
"valid_targets_mean": 3002.3,
"valid_targets_min": 765
},
{
"epoch": 5.081411126187246,
"grad_norm": 0.7766566314367146,
"learning_rate": 8.48755329730822e-06,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1695399284362793,
"step": 3745,
"valid_targets_mean": 3074.8,
"valid_targets_min": 705
},
{
"epoch": 5.088195386702849,
"grad_norm": 0.7988370685668423,
"learning_rate": 8.432290198681252e-06,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2006351202726364,
"step": 3750,
"valid_targets_mean": 2525.8,
"valid_targets_min": 1122
},
{
"epoch": 5.094979647218453,
"grad_norm": 0.7054424649548406,
"learning_rate": 8.377159500472655e-06,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17677809298038483,
"step": 3755,
"valid_targets_mean": 3203.8,
"valid_targets_min": 1011
},
{
"epoch": 5.101763907734057,
"grad_norm": 0.713725738511338,
"learning_rate": 8.322161833691314e-06,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16771814227104187,
"step": 3760,
"valid_targets_mean": 2823.8,
"valid_targets_min": 822
},
{
"epoch": 5.108548168249661,
"grad_norm": 0.8555144387463031,
"learning_rate": 8.267297827823451e-06,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18097899854183197,
"step": 3765,
"valid_targets_mean": 2239.5,
"valid_targets_min": 873
},
{
"epoch": 5.115332428765265,
"grad_norm": 0.6934604273299277,
"learning_rate": 8.212568110825475e-06,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15618851780891418,
"step": 3770,
"valid_targets_mean": 2868.4,
"valid_targets_min": 914
},
{
"epoch": 5.122116689280868,
"grad_norm": 0.7648492466356746,
"learning_rate": 8.157973309116734e-06,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17531245946884155,
"step": 3775,
"valid_targets_mean": 2618.1,
"valid_targets_min": 722
},
{
"epoch": 5.128900949796472,
"grad_norm": 0.7285693028786157,
"learning_rate": 8.103514047572409e-06,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17099301517009735,
"step": 3780,
"valid_targets_mean": 3425.1,
"valid_targets_min": 675
},
{
"epoch": 5.135685210312076,
"grad_norm": 0.8202795361017104,
"learning_rate": 8.049190949516312e-06,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1414903700351715,
"step": 3785,
"valid_targets_mean": 1912.8,
"valid_targets_min": 727
},
{
"epoch": 5.14246947082768,
"grad_norm": 0.8263248998725861,
"learning_rate": 7.995004636713763e-06,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19762666523456573,
"step": 3790,
"valid_targets_mean": 2408.8,
"valid_targets_min": 952
},
{
"epoch": 5.149253731343284,
"grad_norm": 0.7393185445325677,
"learning_rate": 7.940955729364508e-06,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1720680445432663,
"step": 3795,
"valid_targets_mean": 2906.4,
"valid_targets_min": 1179
},
{
"epoch": 5.156037991858887,
"grad_norm": 0.803370399333462,
"learning_rate": 7.88704484609556e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17175140976905823,
"step": 3800,
"valid_targets_mean": 2323.2,
"valid_targets_min": 754
},
{
"epoch": 5.162822252374491,
"grad_norm": 0.6536820438575788,
"learning_rate": 7.83327260395418e-06,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15294823050498962,
"step": 3805,
"valid_targets_mean": 3594.9,
"valid_targets_min": 692
},
{
"epoch": 5.169606512890095,
"grad_norm": 1.122135081296357,
"learning_rate": 7.779639618400761e-06,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16186411678791046,
"step": 3810,
"valid_targets_mean": 2047.9,
"valid_targets_min": 617
},
{
"epoch": 5.176390773405699,
"grad_norm": 0.8371034996880778,
"learning_rate": 7.726146503301835e-06,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18086284399032593,
"step": 3815,
"valid_targets_mean": 2635.9,
"valid_targets_min": 946
},
{
"epoch": 5.1831750339213025,
"grad_norm": 0.8310613229880927,
"learning_rate": 7.672793870922988e-06,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1729108989238739,
"step": 3820,
"valid_targets_mean": 2154.4,
"valid_targets_min": 714
},
{
"epoch": 5.189959294436906,
"grad_norm": 0.7736398422191684,
"learning_rate": 7.619582331921918e-06,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19843143224716187,
"step": 3825,
"valid_targets_mean": 3357.2,
"valid_targets_min": 648
},
{
"epoch": 5.19674355495251,
"grad_norm": 0.7257509154939583,
"learning_rate": 7.566512495341387e-06,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17544004321098328,
"step": 3830,
"valid_targets_mean": 2957.9,
"valid_targets_min": 1043
},
{
"epoch": 5.203527815468114,
"grad_norm": 0.7915636689184143,
"learning_rate": 7.513584968602279e-06,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17739593982696533,
"step": 3835,
"valid_targets_mean": 3008.4,
"valid_targets_min": 991
},
{
"epoch": 5.210312075983718,
"grad_norm": 0.7239442896123227,
"learning_rate": 7.4608003574966604e-06,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15659013390541077,
"step": 3840,
"valid_targets_mean": 2958.6,
"valid_targets_min": 1152
},
{
"epoch": 5.2170963364993215,
"grad_norm": 0.8396562792144856,
"learning_rate": 7.408159266180803e-06,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17542997002601624,
"step": 3845,
"valid_targets_mean": 2428.6,
"valid_targets_min": 772
},
{
"epoch": 5.223880597014926,
"grad_norm": 0.7134303390915493,
"learning_rate": 7.3556622971683246e-06,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1654246747493744,
"step": 3850,
"valid_targets_mean": 3071.6,
"valid_targets_min": 671
},
{
"epoch": 5.230664857530529,
"grad_norm": 0.8451388168730941,
"learning_rate": 7.3033100513232356e-06,
"loss": 0.1836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1715916395187378,
"step": 3855,
"valid_targets_mean": 2175.2,
"valid_targets_min": 1131
},
{
"epoch": 5.237449118046133,
"grad_norm": 0.717910328678344,
"learning_rate": 7.251103127853119e-06,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17889514565467834,
"step": 3860,
"valid_targets_mean": 2811.1,
"valid_targets_min": 917
},
{
"epoch": 5.244233378561737,
"grad_norm": 0.6701275306479537,
"learning_rate": 7.199042124302218e-06,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15984272956848145,
"step": 3865,
"valid_targets_mean": 3448.8,
"valid_targets_min": 1410
},
{
"epoch": 5.25101763907734,
"grad_norm": 0.7396236758430029,
"learning_rate": 7.1471276365446265e-06,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16578418016433716,
"step": 3870,
"valid_targets_mean": 2790.6,
"valid_targets_min": 788
},
{
"epoch": 5.257801899592945,
"grad_norm": 0.7761448636163958,
"learning_rate": 7.095360258777479e-06,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16495108604431152,
"step": 3875,
"valid_targets_mean": 2547.1,
"valid_targets_min": 649
},
{
"epoch": 5.264586160108548,
"grad_norm": 0.7169834901617055,
"learning_rate": 7.043740583514116e-06,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16059651970863342,
"step": 3880,
"valid_targets_mean": 2682.7,
"valid_targets_min": 1125
},
{
"epoch": 5.271370420624152,
"grad_norm": 0.937784973378471,
"learning_rate": 6.99226920157734e-06,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15862375497817993,
"step": 3885,
"valid_targets_mean": 2327.4,
"valid_targets_min": 819
},
{
"epoch": 5.278154681139756,
"grad_norm": 0.7636077182810278,
"learning_rate": 6.9409467020926105e-06,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15665987133979797,
"step": 3890,
"valid_targets_mean": 2581.5,
"valid_targets_min": 770
},
{
"epoch": 5.284938941655359,
"grad_norm": 0.8082211996097235,
"learning_rate": 6.88977367248135e-06,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17556774616241455,
"step": 3895,
"valid_targets_mean": 2410.4,
"valid_targets_min": 714
},
{
"epoch": 5.291723202170964,
"grad_norm": 0.7855611135912653,
"learning_rate": 6.838750698454179e-06,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19265274703502655,
"step": 3900,
"valid_targets_mean": 2630.9,
"valid_targets_min": 640
},
{
"epoch": 5.298507462686567,
"grad_norm": 0.773979909790802,
"learning_rate": 6.787878364004223e-06,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1742939054965973,
"step": 3905,
"valid_targets_mean": 2754.6,
"valid_targets_min": 911
},
{
"epoch": 5.305291723202171,
"grad_norm": 0.7045798341954811,
"learning_rate": 6.7371572514004565e-06,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1639530062675476,
"step": 3910,
"valid_targets_mean": 3152.7,
"valid_targets_min": 642
},
{
"epoch": 5.312075983717775,
"grad_norm": 0.7118839049525844,
"learning_rate": 6.6865879411809905e-06,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1681211143732071,
"step": 3915,
"valid_targets_mean": 3016.1,
"valid_targets_min": 548
},
{
"epoch": 5.318860244233378,
"grad_norm": 0.7619077612605996,
"learning_rate": 6.636171012146475e-06,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1695559173822403,
"step": 3920,
"valid_targets_mean": 2828.6,
"valid_targets_min": 734
},
{
"epoch": 5.325644504748983,
"grad_norm": 0.704742231689896,
"learning_rate": 6.58590704135343e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15426993370056152,
"step": 3925,
"valid_targets_mean": 2844.4,
"valid_targets_min": 662
},
{
"epoch": 5.332428765264586,
"grad_norm": 1.083531396358083,
"learning_rate": 6.535796604107689e-06,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15194523334503174,
"step": 3930,
"valid_targets_mean": 2859.6,
"valid_targets_min": 1012
},
{
"epoch": 5.3392130257801895,
"grad_norm": 0.7267810541836737,
"learning_rate": 6.485840273957764e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18725672364234924,
"step": 3935,
"valid_targets_mean": 3104.9,
"valid_targets_min": 910
},
{
"epoch": 5.345997286295794,
"grad_norm": 0.7803241832429276,
"learning_rate": 6.4360386226883096e-06,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18757139146327972,
"step": 3940,
"valid_targets_mean": 2826.7,
"valid_targets_min": 803
},
{
"epoch": 5.352781546811397,
"grad_norm": 0.7469635091923277,
"learning_rate": 6.386392220313595e-06,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1943964660167694,
"step": 3945,
"valid_targets_mean": 2944.8,
"valid_targets_min": 1105
},
{
"epoch": 5.359565807327002,
"grad_norm": 0.7710548111024483,
"learning_rate": 6.336901635070924e-06,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18395206332206726,
"step": 3950,
"valid_targets_mean": 2640.2,
"valid_targets_min": 744
},
{
"epoch": 5.366350067842605,
"grad_norm": 0.7839171636791334,
"learning_rate": 6.287567433414203e-06,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18562139570713043,
"step": 3955,
"valid_targets_mean": 2582.2,
"valid_targets_min": 788
},
{
"epoch": 5.373134328358209,
"grad_norm": 0.7856837884639124,
"learning_rate": 6.238390180007388e-06,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1797139048576355,
"step": 3960,
"valid_targets_mean": 2337.2,
"valid_targets_min": 890
},
{
"epoch": 5.379918588873813,
"grad_norm": 0.7809120404347694,
"learning_rate": 6.189370437718076e-06,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17183539271354675,
"step": 3965,
"valid_targets_mean": 2353.1,
"valid_targets_min": 894
},
{
"epoch": 5.386702849389416,
"grad_norm": 0.7115407389633623,
"learning_rate": 6.140508767611031e-06,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17769712209701538,
"step": 3970,
"valid_targets_mean": 3229.7,
"valid_targets_min": 682
},
{
"epoch": 5.393487109905021,
"grad_norm": 0.9077544313783328,
"learning_rate": 6.091805728941766e-06,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19499380886554718,
"step": 3975,
"valid_targets_mean": 3067.6,
"valid_targets_min": 1205
},
{
"epoch": 5.400271370420624,
"grad_norm": 0.8077064097851708,
"learning_rate": 6.0432618791501685e-06,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1870405375957489,
"step": 3980,
"valid_targets_mean": 2559.1,
"valid_targets_min": 824
},
{
"epoch": 5.407055630936228,
"grad_norm": 0.6398380496001846,
"learning_rate": 5.994877773854073e-06,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15979993343353271,
"step": 3985,
"valid_targets_mean": 3374.1,
"valid_targets_min": 765
},
{
"epoch": 5.413839891451832,
"grad_norm": 0.7502361275025041,
"learning_rate": 5.946653966842952e-06,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17689886689186096,
"step": 3990,
"valid_targets_mean": 2697.2,
"valid_targets_min": 985
},
{
"epoch": 5.420624151967435,
"grad_norm": 0.7109443485696391,
"learning_rate": 5.89859101007153e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19721101224422455,
"step": 3995,
"valid_targets_mean": 3432.0,
"valid_targets_min": 1392
},
{
"epoch": 5.4274084124830395,
"grad_norm": 0.7778834659042302,
"learning_rate": 5.850689453653519e-06,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.176166370511055,
"step": 4000,
"valid_targets_mean": 2819.3,
"valid_targets_min": 648
},
{
"epoch": 5.434192672998643,
"grad_norm": 0.7986804713666946,
"learning_rate": 5.802949845855268e-06,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17381024360656738,
"step": 4005,
"valid_targets_mean": 2511.1,
"valid_targets_min": 682
},
{
"epoch": 5.440976933514247,
"grad_norm": 0.74764269275807,
"learning_rate": 5.75537273308951e-06,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1764945685863495,
"step": 4010,
"valid_targets_mean": 3111.7,
"valid_targets_min": 1171
},
{
"epoch": 5.447761194029851,
"grad_norm": 0.7387352711479095,
"learning_rate": 5.7079586599091386e-06,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1689624935388565,
"step": 4015,
"valid_targets_mean": 2689.8,
"valid_targets_min": 746
},
{
"epoch": 5.454545454545454,
"grad_norm": 0.6334842178503496,
"learning_rate": 5.660708169000915e-06,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1706801950931549,
"step": 4020,
"valid_targets_mean": 4078.6,
"valid_targets_min": 1344
},
{
"epoch": 5.4613297150610585,
"grad_norm": 0.7687849593222028,
"learning_rate": 5.61362180117931e-06,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.180070698261261,
"step": 4025,
"valid_targets_mean": 2676.0,
"valid_targets_min": 1013
},
{
"epoch": 5.468113975576662,
"grad_norm": 0.730085829715646,
"learning_rate": 5.566700095380278e-06,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17584823071956635,
"step": 4030,
"valid_targets_mean": 3169.8,
"valid_targets_min": 1001
},
{
"epoch": 5.474898236092266,
"grad_norm": 0.7919939571403866,
"learning_rate": 5.519943588655119e-06,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16983819007873535,
"step": 4035,
"valid_targets_mean": 2544.8,
"valid_targets_min": 711
},
{
"epoch": 5.48168249660787,
"grad_norm": 0.7573834464121695,
"learning_rate": 5.473352816164297e-06,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18410179018974304,
"step": 4040,
"valid_targets_mean": 2772.2,
"valid_targets_min": 1090
},
{
"epoch": 5.488466757123474,
"grad_norm": 0.8466367207178821,
"learning_rate": 5.426928311171349e-06,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1880597323179245,
"step": 4045,
"valid_targets_mean": 2396.6,
"valid_targets_min": 830
},
{
"epoch": 5.495251017639077,
"grad_norm": 0.7284020341330157,
"learning_rate": 5.3806706050367595e-06,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1683264523744583,
"step": 4050,
"valid_targets_mean": 2992.8,
"valid_targets_min": 837
},
{
"epoch": 5.502035278154681,
"grad_norm": 0.7784161722246488,
"learning_rate": 5.334580227211876e-06,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1845816969871521,
"step": 4055,
"valid_targets_mean": 2580.1,
"valid_targets_min": 742
},
{
"epoch": 5.508819538670285,
"grad_norm": 0.8548009473097017,
"learning_rate": 5.28865770523288e-06,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17506195604801178,
"step": 4060,
"valid_targets_mean": 2178.6,
"valid_targets_min": 642
},
{
"epoch": 5.515603799185889,
"grad_norm": 0.7774055293795816,
"learning_rate": 5.242903564714703e-06,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16525691747665405,
"step": 4065,
"valid_targets_mean": 2520.9,
"valid_targets_min": 720
},
{
"epoch": 5.522388059701493,
"grad_norm": 0.796456602697807,
"learning_rate": 5.197318329345053e-06,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1665637195110321,
"step": 4070,
"valid_targets_mean": 2367.8,
"valid_targets_min": 721
},
{
"epoch": 5.529172320217096,
"grad_norm": 0.646421264270265,
"learning_rate": 5.151902520878389e-06,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15533316135406494,
"step": 4075,
"valid_targets_mean": 2986.1,
"valid_targets_min": 692
},
{
"epoch": 5.5359565807327,
"grad_norm": 0.7819970698101568,
"learning_rate": 5.106656659129976e-06,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20608392357826233,
"step": 4080,
"valid_targets_mean": 2478.6,
"valid_targets_min": 615
},
{
"epoch": 5.542740841248304,
"grad_norm": 0.7853975289145698,
"learning_rate": 5.061581261969908e-06,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17922022938728333,
"step": 4085,
"valid_targets_mean": 2634.1,
"valid_targets_min": 632
},
{
"epoch": 5.549525101763908,
"grad_norm": 0.7225473013309462,
"learning_rate": 5.016676845317195e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1765461564064026,
"step": 4090,
"valid_targets_mean": 3014.4,
"valid_targets_min": 911
},
{
"epoch": 5.556309362279512,
"grad_norm": 0.7295640966157877,
"learning_rate": 4.971943923133871e-06,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17156416177749634,
"step": 4095,
"valid_targets_mean": 3041.5,
"valid_targets_min": 912
},
{
"epoch": 5.563093622795115,
"grad_norm": 0.9219762006603129,
"learning_rate": 4.9273830074190775e-06,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18373648822307587,
"step": 4100,
"valid_targets_mean": 2428.7,
"valid_targets_min": 722
},
{
"epoch": 5.569877883310719,
"grad_norm": 0.702767206840844,
"learning_rate": 4.8829946082032485e-06,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13803914189338684,
"step": 4105,
"valid_targets_mean": 2718.2,
"valid_targets_min": 761
},
{
"epoch": 5.576662143826323,
"grad_norm": 0.7199250201736765,
"learning_rate": 4.838779233542219e-06,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18196873366832733,
"step": 4110,
"valid_targets_mean": 3093.8,
"valid_targets_min": 1395
},
{
"epoch": 5.5834464043419265,
"grad_norm": 0.702683524158407,
"learning_rate": 4.794737389511466e-06,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15686261653900146,
"step": 4115,
"valid_targets_mean": 2956.6,
"valid_targets_min": 1365
},
{
"epoch": 5.590230664857531,
"grad_norm": 0.8226186328669812,
"learning_rate": 4.750869580200268e-06,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18233484029769897,
"step": 4120,
"valid_targets_mean": 2818.7,
"valid_targets_min": 848
},
{
"epoch": 5.597014925373134,
"grad_norm": 0.757006026009914,
"learning_rate": 4.707176307705958e-06,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17816491425037384,
"step": 4125,
"valid_targets_mean": 2692.9,
"valid_targets_min": 578
},
{
"epoch": 5.603799185888738,
"grad_norm": 0.7711809358808944,
"learning_rate": 4.6636580721281945e-06,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1927419900894165,
"step": 4130,
"valid_targets_mean": 2813.9,
"valid_targets_min": 1322
},
{
"epoch": 5.610583446404342,
"grad_norm": 0.8362493387614779,
"learning_rate": 4.620315371563188e-06,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16866496205329895,
"step": 4135,
"valid_targets_mean": 2549.8,
"valid_targets_min": 728
},
{
"epoch": 5.6173677069199455,
"grad_norm": 0.7202504972034123,
"learning_rate": 4.577148702098064e-06,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18742281198501587,
"step": 4140,
"valid_targets_mean": 3108.2,
"valid_targets_min": 727
},
{
"epoch": 5.62415196743555,
"grad_norm": 0.7230613052656376,
"learning_rate": 4.5341585578051125e-06,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1717241406440735,
"step": 4145,
"valid_targets_mean": 2795.6,
"valid_targets_min": 955
},
{
"epoch": 5.630936227951153,
"grad_norm": 0.7394571746760491,
"learning_rate": 4.491345430736207e-06,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17502638697624207,
"step": 4150,
"valid_targets_mean": 2911.4,
"valid_targets_min": 1097
},
{
"epoch": 5.637720488466757,
"grad_norm": 1.1380143885731062,
"learning_rate": 4.4487098109171115e-06,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16936932504177094,
"step": 4155,
"valid_targets_mean": 2618.9,
"valid_targets_min": 892
},
{
"epoch": 5.644504748982361,
"grad_norm": 0.880683030604768,
"learning_rate": 4.406252186341904e-06,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1713424026966095,
"step": 4160,
"valid_targets_mean": 2082.8,
"valid_targets_min": 654
},
{
"epoch": 5.651289009497964,
"grad_norm": 0.8944130226850632,
"learning_rate": 4.363973042967393e-06,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2198825478553772,
"step": 4165,
"valid_targets_mean": 2161.4,
"valid_targets_min": 793
},
{
"epoch": 5.658073270013569,
"grad_norm": 0.7666908944066096,
"learning_rate": 4.3218728647075324e-06,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16684460639953613,
"step": 4170,
"valid_targets_mean": 2747.1,
"valid_targets_min": 1033
},
{
"epoch": 5.664857530529172,
"grad_norm": 1.1331036484064003,
"learning_rate": 4.2799521334279155e-06,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16542381048202515,
"step": 4175,
"valid_targets_mean": 2846.9,
"valid_targets_min": 822
},
{
"epoch": 5.6716417910447765,
"grad_norm": 0.7113624200207286,
"learning_rate": 4.238211328940214e-06,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15958712995052338,
"step": 4180,
"valid_targets_mean": 2826.9,
"valid_targets_min": 904
},
{
"epoch": 5.67842605156038,
"grad_norm": 0.7443765505636735,
"learning_rate": 4.196650928996744e-06,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17205163836479187,
"step": 4185,
"valid_targets_mean": 2878.1,
"valid_targets_min": 1151
},
{
"epoch": 5.685210312075983,
"grad_norm": 0.765002712688627,
"learning_rate": 4.155271409284947e-06,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17750981450080872,
"step": 4190,
"valid_targets_mean": 2678.2,
"valid_targets_min": 1337
},
{
"epoch": 5.691994572591588,
"grad_norm": 0.7973473759974611,
"learning_rate": 4.114073243421964e-06,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18639904260635376,
"step": 4195,
"valid_targets_mean": 2673.8,
"valid_targets_min": 1544
},
{
"epoch": 5.698778833107191,
"grad_norm": 0.8006125558694456,
"learning_rate": 4.073056902949233e-06,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.181000754237175,
"step": 4200,
"valid_targets_mean": 2716.2,
"valid_targets_min": 893
},
{
"epoch": 5.7055630936227955,
"grad_norm": 0.7771322898882181,
"learning_rate": 4.032222857327055e-06,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1973440945148468,
"step": 4205,
"valid_targets_mean": 3029.1,
"valid_targets_min": 1149
},
{
"epoch": 5.712347354138399,
"grad_norm": 0.7542045578109661,
"learning_rate": 3.991571573929263e-06,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16543592512607574,
"step": 4210,
"valid_targets_mean": 2804.5,
"valid_targets_min": 1133
},
{
"epoch": 5.719131614654002,
"grad_norm": 0.6746826061759319,
"learning_rate": 3.951103518037822e-06,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17549774050712585,
"step": 4215,
"valid_targets_mean": 3377.5,
"valid_targets_min": 675
},
{
"epoch": 5.725915875169607,
"grad_norm": 0.7884807830662328,
"learning_rate": 3.910819152837564e-06,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19728972017765045,
"step": 4220,
"valid_targets_mean": 2609.3,
"valid_targets_min": 924
},
{
"epoch": 5.73270013568521,
"grad_norm": 0.6844292385894344,
"learning_rate": 3.870718939410829e-06,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2012067437171936,
"step": 4225,
"valid_targets_mean": 3169.2,
"valid_targets_min": 1216
},
{
"epoch": 5.739484396200814,
"grad_norm": 0.6779140929423958,
"learning_rate": 3.8308033367322185e-06,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16013997793197632,
"step": 4230,
"valid_targets_mean": 3190.8,
"valid_targets_min": 741
},
{
"epoch": 5.746268656716418,
"grad_norm": 0.7186843297493842,
"learning_rate": 3.791072801663349e-06,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17085684835910797,
"step": 4235,
"valid_targets_mean": 3101.9,
"valid_targets_min": 964
},
{
"epoch": 5.753052917232022,
"grad_norm": 0.773844588416225,
"learning_rate": 3.751527788947593e-06,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18918392062187195,
"step": 4240,
"valid_targets_mean": 2950.2,
"valid_targets_min": 1426
},
{
"epoch": 5.759837177747626,
"grad_norm": 0.8943301985541035,
"learning_rate": 3.7121687512049075e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1794520914554596,
"step": 4245,
"valid_targets_mean": 3305.4,
"valid_targets_min": 1077
},
{
"epoch": 5.766621438263229,
"grad_norm": 0.71555932932248,
"learning_rate": 3.672996138926623e-06,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1853591352701187,
"step": 4250,
"valid_targets_mean": 3303.0,
"valid_targets_min": 1317
},
{
"epoch": 5.773405698778833,
"grad_norm": 0.7600028735931071,
"learning_rate": 3.634010400470318e-06,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15217794477939606,
"step": 4255,
"valid_targets_mean": 2485.2,
"valid_targets_min": 765
},
{
"epoch": 5.780189959294437,
"grad_norm": 0.6651550656338701,
"learning_rate": 3.595211982054652e-06,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15896007418632507,
"step": 4260,
"valid_targets_mean": 3312.4,
"valid_targets_min": 739
},
{
"epoch": 5.786974219810041,
"grad_norm": 0.793423124225591,
"learning_rate": 3.5566013277542987e-06,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1872842162847519,
"step": 4265,
"valid_targets_mean": 2579.4,
"valid_targets_min": 1098
},
{
"epoch": 5.7937584803256446,
"grad_norm": 0.7190178787946112,
"learning_rate": 3.5181788794948267e-06,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1685473471879959,
"step": 4270,
"valid_targets_mean": 2938.9,
"valid_targets_min": 795
},
{
"epoch": 5.800542740841248,
"grad_norm": 0.7427543324860382,
"learning_rate": 3.479945077047655e-06,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18788832426071167,
"step": 4275,
"valid_targets_mean": 3514.1,
"valid_targets_min": 655
},
{
"epoch": 5.807327001356852,
"grad_norm": 0.7301184905700668,
"learning_rate": 3.4419003580250386e-06,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724769026041031,
"step": 4280,
"valid_targets_mean": 2761.8,
"valid_targets_min": 782
},
{
"epoch": 5.814111261872456,
"grad_norm": 0.6996558660986915,
"learning_rate": 3.40404515787502e-06,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17133083939552307,
"step": 4285,
"valid_targets_mean": 3322.6,
"valid_targets_min": 1164
},
{
"epoch": 5.82089552238806,
"grad_norm": 0.7470138239152765,
"learning_rate": 3.366379909876487e-06,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1647733896970749,
"step": 4290,
"valid_targets_mean": 2699.9,
"valid_targets_min": 856
},
{
"epoch": 5.8276797829036635,
"grad_norm": 0.8027648641349744,
"learning_rate": 3.3289050451341785e-06,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17798423767089844,
"step": 4295,
"valid_targets_mean": 2830.8,
"valid_targets_min": 1027
},
{
"epoch": 5.834464043419267,
"grad_norm": 0.6833745641979659,
"learning_rate": 3.291620992573781e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1725693941116333,
"step": 4300,
"valid_targets_mean": 3136.2,
"valid_targets_min": 1115
},
{
"epoch": 5.841248303934871,
"grad_norm": 0.7632930036843467,
"learning_rate": 3.254528178936991e-06,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1607835590839386,
"step": 4305,
"valid_targets_mean": 2220.1,
"valid_targets_min": 1083
},
{
"epoch": 5.848032564450475,
"grad_norm": 0.7766685814823788,
"learning_rate": 3.217627028776642e-06,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17807729542255402,
"step": 4310,
"valid_targets_mean": 3144.8,
"valid_targets_min": 1348
},
{
"epoch": 5.854816824966079,
"grad_norm": 0.7615851643722991,
"learning_rate": 3.180917964451864e-06,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18378789722919464,
"step": 4315,
"valid_targets_mean": 2792.7,
"valid_targets_min": 722
},
{
"epoch": 5.8616010854816825,
"grad_norm": 0.7720381142011892,
"learning_rate": 3.1444014061232096e-06,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19216835498809814,
"step": 4320,
"valid_targets_mean": 2816.5,
"valid_targets_min": 681
},
{
"epoch": 5.868385345997286,
"grad_norm": 0.7413182551927285,
"learning_rate": 3.1080777717478906e-06,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17600227892398834,
"step": 4325,
"valid_targets_mean": 2807.1,
"valid_targets_min": 1049
},
{
"epoch": 5.87516960651289,
"grad_norm": 0.830639238497367,
"learning_rate": 3.071947477074948e-06,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20260506868362427,
"step": 4330,
"valid_targets_mean": 3276.9,
"valid_targets_min": 802
},
{
"epoch": 5.881953867028494,
"grad_norm": 0.7247615457982057,
"learning_rate": 3.036010935640541e-06,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1745220124721527,
"step": 4335,
"valid_targets_mean": 3025.8,
"valid_targets_min": 1149
},
{
"epoch": 5.888738127544098,
"grad_norm": 0.7666810644080457,
"learning_rate": 3.0002685587631665e-06,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19823196530342102,
"step": 4340,
"valid_targets_mean": 2815.8,
"valid_targets_min": 933
},
{
"epoch": 5.895522388059701,
"grad_norm": 0.6891577535572125,
"learning_rate": 2.9647207555389833e-06,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1756839156150818,
"step": 4345,
"valid_targets_mean": 3165.6,
"valid_targets_min": 796
},
{
"epoch": 5.902306648575305,
"grad_norm": 0.6280441768186072,
"learning_rate": 2.929367932837128e-06,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16393789649009705,
"step": 4350,
"valid_targets_mean": 3511.4,
"valid_targets_min": 1349
},
{
"epoch": 5.909090909090909,
"grad_norm": 0.7212401001251478,
"learning_rate": 2.8942104952950358e-06,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1590360701084137,
"step": 4355,
"valid_targets_mean": 2814.4,
"valid_targets_min": 781
},
{
"epoch": 5.915875169606513,
"grad_norm": 0.7587496985425881,
"learning_rate": 2.8592488453138402e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18076002597808838,
"step": 4360,
"valid_targets_mean": 2772.0,
"valid_targets_min": 1406
},
{
"epoch": 5.922659430122117,
"grad_norm": 0.7026766056453736,
"learning_rate": 2.8244833830537334e-06,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16852641105651855,
"step": 4365,
"valid_targets_mean": 3198.9,
"valid_targets_min": 1248
},
{
"epoch": 5.92944369063772,
"grad_norm": 0.7591755791375419,
"learning_rate": 2.789914506429423e-06,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18854087591171265,
"step": 4370,
"valid_targets_mean": 3410.3,
"valid_targets_min": 960
},
{
"epoch": 5.936227951153324,
"grad_norm": 0.7317196861574712,
"learning_rate": 2.755542611105544e-06,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17983709275722504,
"step": 4375,
"valid_targets_mean": 2910.4,
"valid_targets_min": 777
},
{
"epoch": 5.943012211668928,
"grad_norm": 0.7873291444565179,
"learning_rate": 2.7213680904921426e-06,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15739159286022186,
"step": 4380,
"valid_targets_mean": 2447.4,
"valid_targets_min": 1274
},
{
"epoch": 5.949796472184532,
"grad_norm": 0.783627540382998,
"learning_rate": 2.687391335740195e-06,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18448659777641296,
"step": 4385,
"valid_targets_mean": 2981.9,
"valid_targets_min": 940
},
{
"epoch": 5.956580732700136,
"grad_norm": 0.8163415230485238,
"learning_rate": 2.6536127357370834e-06,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17967082560062408,
"step": 4390,
"valid_targets_mean": 2268.2,
"valid_targets_min": 1087
},
{
"epoch": 5.963364993215739,
"grad_norm": 0.6972529066512584,
"learning_rate": 2.6200326771021977e-06,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17101269960403442,
"step": 4395,
"valid_targets_mean": 3305.3,
"valid_targets_min": 1304
},
{
"epoch": 5.970149253731344,
"grad_norm": 0.7444293238213098,
"learning_rate": 2.5866515441824637e-06,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16424033045768738,
"step": 4400,
"valid_targets_mean": 2531.2,
"valid_targets_min": 761
},
{
"epoch": 5.976933514246947,
"grad_norm": 0.7787083692853177,
"learning_rate": 2.553469719047983e-06,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18210354447364807,
"step": 4405,
"valid_targets_mean": 3141.8,
"valid_targets_min": 810
},
{
"epoch": 5.9837177747625505,
"grad_norm": 0.7791998751111936,
"learning_rate": 2.5204875814876318e-06,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19235186278820038,
"step": 4410,
"valid_targets_mean": 2803.9,
"valid_targets_min": 708
},
{
"epoch": 5.990502035278155,
"grad_norm": 0.7009703971990965,
"learning_rate": 2.487705509004721e-06,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18249055743217468,
"step": 4415,
"valid_targets_mean": 3232.0,
"valid_targets_min": 484
},
{
"epoch": 5.997286295793758,
"grad_norm": 0.7781270453801223,
"learning_rate": 2.4551238768126906e-06,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16195908188819885,
"step": 4420,
"valid_targets_mean": 2633.4,
"valid_targets_min": 814
},
{
"epoch": 6.004070556309363,
"grad_norm": 0.7415388448727406,
"learning_rate": 2.422743057830792e-06,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19907845556735992,
"step": 4425,
"valid_targets_mean": 2871.6,
"valid_targets_min": 690
},
{
"epoch": 6.010854816824966,
"grad_norm": 0.742053212238427,
"learning_rate": 2.3905634226798415e-06,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18320277333259583,
"step": 4430,
"valid_targets_mean": 3028.6,
"valid_targets_min": 750
},
{
"epoch": 6.0176390773405695,
"grad_norm": 0.8079591238507426,
"learning_rate": 2.3585853396779546e-06,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17492371797561646,
"step": 4435,
"valid_targets_mean": 2414.6,
"valid_targets_min": 610
},
{
"epoch": 6.024423337856174,
"grad_norm": 0.7245282326645127,
"learning_rate": 2.326809174836355e-06,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16501660645008087,
"step": 4440,
"valid_targets_mean": 2658.6,
"valid_targets_min": 805
},
{
"epoch": 6.031207598371777,
"grad_norm": 0.7529821726671959,
"learning_rate": 2.295235291855171e-06,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16563096642494202,
"step": 4445,
"valid_targets_mean": 2985.2,
"valid_targets_min": 1155
},
{
"epoch": 6.0379918588873815,
"grad_norm": 0.7218429838629064,
"learning_rate": 2.2638640521192666e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16327796876430511,
"step": 4450,
"valid_targets_mean": 2918.9,
"valid_targets_min": 820
},
{
"epoch": 6.044776119402985,
"grad_norm": 0.7670474706596653,
"learning_rate": 2.23269581469413e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17224714159965515,
"step": 4455,
"valid_targets_mean": 2854.1,
"valid_targets_min": 711
},
{
"epoch": 6.051560379918589,
"grad_norm": 0.85371010583432,
"learning_rate": 2.201730936321731e-06,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18799713253974915,
"step": 4460,
"valid_targets_mean": 2257.5,
"valid_targets_min": 809
},
{
"epoch": 6.058344640434193,
"grad_norm": 0.8581102151455461,
"learning_rate": 2.170969771416471e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19284003973007202,
"step": 4465,
"valid_targets_mean": 2541.4,
"valid_targets_min": 903
},
{
"epoch": 6.065128900949796,
"grad_norm": 0.7082075259100371,
"learning_rate": 2.140412672061094e-06,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14846593141555786,
"step": 4470,
"valid_targets_mean": 2874.5,
"valid_targets_min": 900
},
{
"epoch": 6.0719131614654005,
"grad_norm": 0.6593303484533789,
"learning_rate": 2.1100599880026885e-06,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17295196652412415,
"step": 4475,
"valid_targets_mean": 3751.6,
"valid_targets_min": 1730
},
{
"epoch": 6.078697421981004,
"grad_norm": 0.7194386838659942,
"learning_rate": 2.079912066648655e-06,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14499616622924805,
"step": 4480,
"valid_targets_mean": 2578.9,
"valid_targets_min": 1121
},
{
"epoch": 6.085481682496608,
"grad_norm": 0.7703414212546942,
"learning_rate": 2.049969253062758e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17155641317367554,
"step": 4485,
"valid_targets_mean": 2867.4,
"valid_targets_min": 727
},
{
"epoch": 6.092265943012212,
"grad_norm": 0.7581834478927615,
"learning_rate": 2.0202318899611483e-06,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14970597624778748,
"step": 4490,
"valid_targets_mean": 2776.1,
"valid_targets_min": 810
},
{
"epoch": 6.099050203527815,
"grad_norm": 0.8858694998395675,
"learning_rate": 1.9907003177084605e-06,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19518548250198364,
"step": 4495,
"valid_targets_mean": 2301.6,
"valid_targets_min": 858
},
{
"epoch": 6.1058344640434195,
"grad_norm": 0.7698959242156672,
"learning_rate": 1.9613748743139126e-06,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18513622879981995,
"step": 4500,
"valid_targets_mean": 3196.8,
"valid_targets_min": 1009
},
{
"epoch": 6.112618724559023,
"grad_norm": 0.9050028409977037,
"learning_rate": 1.9322558954274305e-06,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17871133983135223,
"step": 4505,
"valid_targets_mean": 2160.6,
"valid_targets_min": 748
},
{
"epoch": 6.119402985074627,
"grad_norm": 0.7740731558411673,
"learning_rate": 1.9033437143358213e-06,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16579106450080872,
"step": 4510,
"valid_targets_mean": 2948.0,
"valid_targets_min": 1076
},
{
"epoch": 6.126187245590231,
"grad_norm": 0.8348067497419805,
"learning_rate": 1.874638661958934e-06,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16571199893951416,
"step": 4515,
"valid_targets_mean": 2415.9,
"valid_targets_min": 627
},
{
"epoch": 6.132971506105834,
"grad_norm": 0.7256235619648512,
"learning_rate": 1.8461410668459035e-06,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14996132254600525,
"step": 4520,
"valid_targets_mean": 2668.2,
"valid_targets_min": 806
},
{
"epoch": 6.139755766621438,
"grad_norm": 0.7614175427466571,
"learning_rate": 1.8178512551713568e-06,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15067064762115479,
"step": 4525,
"valid_targets_mean": 3234.1,
"valid_targets_min": 656
},
{
"epoch": 6.146540027137042,
"grad_norm": 0.7569505883546243,
"learning_rate": 1.7897695507317036e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17070305347442627,
"step": 4530,
"valid_targets_mean": 2981.2,
"valid_targets_min": 1323
},
{
"epoch": 6.153324287652646,
"grad_norm": 0.715139884326026,
"learning_rate": 1.761896274941426e-06,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1826499104499817,
"step": 4535,
"valid_targets_mean": 3501.9,
"valid_targets_min": 841
},
{
"epoch": 6.16010854816825,
"grad_norm": 0.7854237661191246,
"learning_rate": 1.7342317468293912e-06,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16877636313438416,
"step": 4540,
"valid_targets_mean": 2512.0,
"valid_targets_min": 1055
},
{
"epoch": 6.166892808683853,
"grad_norm": 0.8303757582473726,
"learning_rate": 1.7067762830352096e-06,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17255139350891113,
"step": 4545,
"valid_targets_mean": 2534.2,
"valid_targets_min": 942
},
{
"epoch": 6.173677069199457,
"grad_norm": 0.7385224765472438,
"learning_rate": 1.679530197805599e-06,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15643605589866638,
"step": 4550,
"valid_targets_mean": 2944.8,
"valid_targets_min": 1366
},
{
"epoch": 6.180461329715061,
"grad_norm": 0.7564443718183899,
"learning_rate": 1.652493802990811e-06,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17550310492515564,
"step": 4555,
"valid_targets_mean": 3110.1,
"valid_targets_min": 1058
},
{
"epoch": 6.187245590230665,
"grad_norm": 1.71255016027657,
"learning_rate": 1.6256674080410185e-06,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15688160061836243,
"step": 4560,
"valid_targets_mean": 3095.8,
"valid_targets_min": 1214
},
{
"epoch": 6.1940298507462686,
"grad_norm": 0.8040556589037928,
"learning_rate": 1.5990513200028269e-06,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1727936565876007,
"step": 4565,
"valid_targets_mean": 2527.2,
"valid_targets_min": 991
},
{
"epoch": 6.200814111261873,
"grad_norm": 0.7945263075310672,
"learning_rate": 1.5726458435157255e-06,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18288177251815796,
"step": 4570,
"valid_targets_mean": 3045.4,
"valid_targets_min": 821
},
{
"epoch": 6.207598371777476,
"grad_norm": 0.7545719664187707,
"learning_rate": 1.5464512808086008e-06,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17064568400382996,
"step": 4575,
"valid_targets_mean": 3098.4,
"valid_targets_min": 796
},
{
"epoch": 6.21438263229308,
"grad_norm": 0.747591105064271,
"learning_rate": 1.5204679316963012e-06,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1849783957004547,
"step": 4580,
"valid_targets_mean": 3041.9,
"valid_targets_min": 1643
},
{
"epoch": 6.221166892808684,
"grad_norm": 0.7177247952162282,
"learning_rate": 1.4946960935761734e-06,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17120692133903503,
"step": 4585,
"valid_targets_mean": 3201.8,
"valid_targets_min": 563
},
{
"epoch": 6.2279511533242875,
"grad_norm": 0.8094458246760512,
"learning_rate": 1.4691360614246897e-06,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16246119141578674,
"step": 4590,
"valid_targets_mean": 2322.5,
"valid_targets_min": 692
},
{
"epoch": 6.234735413839892,
"grad_norm": 0.7798473673390547,
"learning_rate": 1.443788127794048e-06,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17415021359920502,
"step": 4595,
"valid_targets_mean": 2854.2,
"valid_targets_min": 1190
},
{
"epoch": 6.241519674355495,
"grad_norm": 0.7946140484277268,
"learning_rate": 1.4186525828088282e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15857259929180145,
"step": 4600,
"valid_targets_mean": 2525.8,
"valid_targets_min": 1018
},
{
"epoch": 6.248303934871099,
"grad_norm": 0.7801428383995377,
"learning_rate": 1.3937297141626904e-06,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1684061586856842,
"step": 4605,
"valid_targets_mean": 2809.8,
"valid_targets_min": 917
},
{
"epoch": 6.255088195386703,
"grad_norm": 0.6643638326526149,
"learning_rate": 1.3690198071150528e-06,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15296955406665802,
"step": 4610,
"valid_targets_mean": 3476.2,
"valid_targets_min": 1305
},
{
"epoch": 6.2618724559023065,
"grad_norm": 0.7686142175477614,
"learning_rate": 1.3445231444878504e-06,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17054758965969086,
"step": 4615,
"valid_targets_mean": 2753.3,
"valid_targets_min": 830
},
{
"epoch": 6.268656716417911,
"grad_norm": 0.8432191119730226,
"learning_rate": 1.3202400066622834e-06,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17865519225597382,
"step": 4620,
"valid_targets_mean": 2344.4,
"valid_targets_min": 765
},
{
"epoch": 6.275440976933514,
"grad_norm": 0.6339497035055569,
"learning_rate": 1.2961706715756184e-06,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1531352996826172,
"step": 4625,
"valid_targets_mean": 3586.7,
"valid_targets_min": 2054
},
{
"epoch": 6.282225237449118,
"grad_norm": 0.8544021195040931,
"learning_rate": 1.2723154147179973e-06,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1579844206571579,
"step": 4630,
"valid_targets_mean": 3154.9,
"valid_targets_min": 869
},
{
"epoch": 6.289009497964722,
"grad_norm": 0.8007481753817313,
"learning_rate": 1.2486745091292862e-06,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1802925169467926,
"step": 4635,
"valid_targets_mean": 2729.8,
"valid_targets_min": 957
},
{
"epoch": 6.295793758480325,
"grad_norm": 0.8142132607230317,
"learning_rate": 1.2252482253959653e-06,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18052034080028534,
"step": 4640,
"valid_targets_mean": 2541.6,
"valid_targets_min": 974
},
{
"epoch": 6.30257801899593,
"grad_norm": 0.6774345228089872,
"learning_rate": 1.202036831648008e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.150282084941864,
"step": 4645,
"valid_targets_mean": 3526.9,
"valid_targets_min": 1051
},
{
"epoch": 6.309362279511533,
"grad_norm": 0.7516698326728172,
"learning_rate": 1.1790405935558292e-06,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16584287583827972,
"step": 4650,
"valid_targets_mean": 2976.7,
"valid_targets_min": 1024
},
{
"epoch": 6.3161465400271375,
"grad_norm": 0.7046916433526038,
"learning_rate": 1.156259774327233e-06,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16168582439422607,
"step": 4655,
"valid_targets_mean": 3335.2,
"valid_targets_min": 872
},
{
"epoch": 6.322930800542741,
"grad_norm": 0.767262026885646,
"learning_rate": 1.1336946347044164e-06,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15575771033763885,
"step": 4660,
"valid_targets_mean": 2716.2,
"valid_targets_min": 1074
},
{
"epoch": 6.329715061058344,
"grad_norm": 0.792890542631687,
"learning_rate": 1.111345432960964e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16956427693367004,
"step": 4665,
"valid_targets_mean": 2624.8,
"valid_targets_min": 593
},
{
"epoch": 6.336499321573949,
"grad_norm": 0.7772682272896229,
"learning_rate": 1.089212424898909e-06,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16567683219909668,
"step": 4670,
"valid_targets_mean": 2692.4,
"valid_targets_min": 420
},
{
"epoch": 6.343283582089552,
"grad_norm": 0.7218817470491743,
"learning_rate": 1.0672958638457963e-06,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1656082570552826,
"step": 4675,
"valid_targets_mean": 3137.2,
"valid_targets_min": 1181
},
{
"epoch": 6.350067842605156,
"grad_norm": 0.7660758671491292,
"learning_rate": 1.0455960006517828e-06,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16689500212669373,
"step": 4680,
"valid_targets_mean": 2776.9,
"valid_targets_min": 1184
},
{
"epoch": 6.35685210312076,
"grad_norm": 0.7614176463332171,
"learning_rate": 1.0241130836867775e-06,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1655552089214325,
"step": 4685,
"valid_targets_mean": 2639.2,
"valid_targets_min": 1340
},
{
"epoch": 6.363636363636363,
"grad_norm": 0.731905552102256,
"learning_rate": 1.0028473588375775e-06,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15648706257343292,
"step": 4690,
"valid_targets_mean": 2678.6,
"valid_targets_min": 1071
},
{
"epoch": 6.370420624151968,
"grad_norm": 0.7374044504633019,
"learning_rate": 9.817990695050804e-07,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17541341483592987,
"step": 4695,
"valid_targets_mean": 3396.6,
"valid_targets_min": 788
},
{
"epoch": 6.377204884667571,
"grad_norm": 0.8070797537585928,
"learning_rate": 9.60968456601472e-07,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17572826147079468,
"step": 4700,
"valid_targets_mean": 2604.2,
"valid_targets_min": 880
},
{
"epoch": 6.383989145183175,
"grad_norm": 0.7275287979567348,
"learning_rate": 9.403557585474954e-07,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15313151478767395,
"step": 4705,
"valid_targets_mean": 2704.1,
"valid_targets_min": 627
},
{
"epoch": 6.390773405698779,
"grad_norm": 0.8970798559467905,
"learning_rate": 9.199612112696843e-07,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1705400049686432,
"step": 4710,
"valid_targets_mean": 2101.6,
"valid_targets_min": 818
},
{
"epoch": 6.397557666214382,
"grad_norm": 0.7536549104416713,
"learning_rate": 8.9978504819771e-07,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1547962725162506,
"step": 4715,
"valid_targets_mean": 2824.7,
"valid_targets_min": 779
},
{
"epoch": 6.404341926729987,
"grad_norm": 0.8045187393820044,
"learning_rate": 8.798275002616785e-07,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17857302725315094,
"step": 4720,
"valid_targets_mean": 2904.6,
"valid_targets_min": 699
},
{
"epoch": 6.41112618724559,
"grad_norm": 0.8644670987087135,
"learning_rate": 8.600887958894866e-07,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18547791242599487,
"step": 4725,
"valid_targets_mean": 2751.9,
"valid_targets_min": 623
},
{
"epoch": 6.417910447761194,
"grad_norm": 0.8231644619228083,
"learning_rate": 8.4056916100423e-07,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16595998406410217,
"step": 4730,
"valid_targets_mean": 2423.4,
"valid_targets_min": 692
},
{
"epoch": 6.424694708276798,
"grad_norm": 0.7911518564082718,
"learning_rate": 8.212688190215879e-07,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17415902018547058,
"step": 4735,
"valid_targets_mean": 2703.4,
"valid_targets_min": 793
},
{
"epoch": 6.431478968792401,
"grad_norm": 0.8160726715736674,
"learning_rate": 8.021879908472962e-07,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18597552180290222,
"step": 4740,
"valid_targets_mean": 2784.6,
"valid_targets_min": 1092
},
{
"epoch": 6.4382632293080055,
"grad_norm": 0.7067244227602366,
"learning_rate": 7.833268948745854e-07,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16125139594078064,
"step": 4745,
"valid_targets_mean": 3260.1,
"valid_targets_min": 896
},
{
"epoch": 6.445047489823609,
"grad_norm": 0.7408785373138851,
"learning_rate": 7.646857469817148e-07,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15260982513427734,
"step": 4750,
"valid_targets_mean": 2774.1,
"valid_targets_min": 797
},
{
"epoch": 6.451831750339213,
"grad_norm": 0.6966270003794208,
"learning_rate": 7.462647605294849e-07,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.148808091878891,
"step": 4755,
"valid_targets_mean": 2975.9,
"valid_targets_min": 681
},
{
"epoch": 6.458616010854817,
"grad_norm": 0.7126074027304123,
"learning_rate": 7.28064146358789e-07,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15134704113006592,
"step": 4760,
"valid_targets_mean": 3576.7,
"valid_targets_min": 689
},
{
"epoch": 6.46540027137042,
"grad_norm": 0.8135549579243775,
"learning_rate": 7.100841127882119e-07,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1627068817615509,
"step": 4765,
"valid_targets_mean": 2379.0,
"valid_targets_min": 890
},
{
"epoch": 6.4721845318860245,
"grad_norm": 0.6946858722656691,
"learning_rate": 6.9232486561164e-07,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15446284413337708,
"step": 4770,
"valid_targets_mean": 3180.2,
"valid_targets_min": 1145
},
{
"epoch": 6.478968792401628,
"grad_norm": 0.8707673966033334,
"learning_rate": 6.74786608095912e-07,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17315858602523804,
"step": 4775,
"valid_targets_mean": 2392.1,
"valid_targets_min": 740
},
{
"epoch": 6.485753052917232,
"grad_norm": 0.7302574945303589,
"learning_rate": 6.574695409784792e-07,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1769123077392578,
"step": 4780,
"valid_targets_mean": 3501.0,
"valid_targets_min": 735
},
{
"epoch": 6.492537313432836,
"grad_norm": 0.8695981905879026,
"learning_rate": 6.403738624651201e-07,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1758110076189041,
"step": 4785,
"valid_targets_mean": 2153.2,
"valid_targets_min": 1133
},
{
"epoch": 6.49932157394844,
"grad_norm": 0.6446530009894795,
"learning_rate": 6.234997682276711e-07,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1484566032886505,
"step": 4790,
"valid_targets_mean": 3468.8,
"valid_targets_min": 1345
},
{
"epoch": 6.5061058344640434,
"grad_norm": 0.7063043963291199,
"learning_rate": 6.068474514017797e-07,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1765894889831543,
"step": 4795,
"valid_targets_mean": 3490.4,
"valid_targets_min": 954
},
{
"epoch": 6.512890094979647,
"grad_norm": 0.8151482914810542,
"learning_rate": 5.904171025847016e-07,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16545557975769043,
"step": 4800,
"valid_targets_mean": 2565.6,
"valid_targets_min": 767
},
{
"epoch": 6.519674355495251,
"grad_norm": 0.7173252334227114,
"learning_rate": 5.742089098331094e-07,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15513482689857483,
"step": 4805,
"valid_targets_mean": 3147.9,
"valid_targets_min": 1185
},
{
"epoch": 6.526458616010855,
"grad_norm": 0.744561572381357,
"learning_rate": 5.582230586609538e-07,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628095507621765,
"step": 4810,
"valid_targets_mean": 2782.1,
"valid_targets_min": 1219
},
{
"epoch": 6.533242876526459,
"grad_norm": 0.9358406796473209,
"learning_rate": 5.424597320373259e-07,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18553614616394043,
"step": 4815,
"valid_targets_mean": 2122.8,
"valid_targets_min": 719
},
{
"epoch": 6.540027137042062,
"grad_norm": 0.7762174577670051,
"learning_rate": 5.269191103843719e-07,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16511686146259308,
"step": 4820,
"valid_targets_mean": 2672.0,
"valid_targets_min": 998
},
{
"epoch": 6.546811397557666,
"grad_norm": 0.683256793284698,
"learning_rate": 5.116013715752299e-07,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17595712840557098,
"step": 4825,
"valid_targets_mean": 3763.1,
"valid_targets_min": 1182
},
{
"epoch": 6.55359565807327,
"grad_norm": 0.7956506160614817,
"learning_rate": 4.965066909319837e-07,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17820480465888977,
"step": 4830,
"valid_targets_mean": 2759.7,
"valid_targets_min": 1292
},
{
"epoch": 6.560379918588874,
"grad_norm": 0.7587179233666759,
"learning_rate": 4.816352412236702e-07,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17972393333911896,
"step": 4835,
"valid_targets_mean": 2840.0,
"valid_targets_min": 718
},
{
"epoch": 6.567164179104478,
"grad_norm": 0.7306219090534811,
"learning_rate": 4.669871926642877e-07,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15142644941806793,
"step": 4840,
"valid_targets_mean": 3011.1,
"valid_targets_min": 686
},
{
"epoch": 6.573948439620081,
"grad_norm": 0.8468764362506153,
"learning_rate": 4.5256271291085785e-07,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16415920853614807,
"step": 4845,
"valid_targets_mean": 2226.1,
"valid_targets_min": 799
},
{
"epoch": 6.580732700135686,
"grad_norm": 0.7218042166118971,
"learning_rate": 4.3836196706150026e-07,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14739587903022766,
"step": 4850,
"valid_targets_mean": 3025.1,
"valid_targets_min": 788
},
{
"epoch": 6.587516960651289,
"grad_norm": 0.7548311142057721,
"learning_rate": 4.243851176535474e-07,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1665259748697281,
"step": 4855,
"valid_targets_mean": 2818.0,
"valid_targets_min": 728
},
{
"epoch": 6.5943012211668925,
"grad_norm": 0.7611024739102207,
"learning_rate": 4.106323246616817e-07,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15098467469215393,
"step": 4860,
"valid_targets_mean": 3311.1,
"valid_targets_min": 806
},
{
"epoch": 6.601085481682497,
"grad_norm": 0.8170024951749895,
"learning_rate": 3.971037454961058e-07,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1671171486377716,
"step": 4865,
"valid_targets_mean": 2565.4,
"valid_targets_min": 798
},
{
"epoch": 6.6078697421981,
"grad_norm": 0.7074879855210716,
"learning_rate": 3.8379953500074617e-07,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1538231521844864,
"step": 4870,
"valid_targets_mean": 3038.6,
"valid_targets_min": 742
},
{
"epoch": 6.614654002713705,
"grad_norm": 0.7784406456308786,
"learning_rate": 3.7071984545146157e-07,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17332404851913452,
"step": 4875,
"valid_targets_mean": 2704.2,
"valid_targets_min": 1374
},
{
"epoch": 6.621438263229308,
"grad_norm": 0.7707976870962088,
"learning_rate": 3.578648265543261e-07,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15194040536880493,
"step": 4880,
"valid_targets_mean": 2598.7,
"valid_targets_min": 770
},
{
"epoch": 6.6282225237449115,
"grad_norm": 0.7794811748817996,
"learning_rate": 3.4523462544389987e-07,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1765557825565338,
"step": 4885,
"valid_targets_mean": 2984.3,
"valid_targets_min": 1174
},
{
"epoch": 6.635006784260516,
"grad_norm": 0.7299801758059727,
"learning_rate": 3.328293866815435e-07,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16560907661914825,
"step": 4890,
"valid_targets_mean": 3176.7,
"valid_targets_min": 1444
},
{
"epoch": 6.641791044776119,
"grad_norm": 0.8430277934827622,
"learning_rate": 3.2064925225377297e-07,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1819601058959961,
"step": 4895,
"valid_targets_mean": 2420.4,
"valid_targets_min": 642
},
{
"epoch": 6.648575305291724,
"grad_norm": 0.8143191944576621,
"learning_rate": 3.086943615706295e-07,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18464431166648865,
"step": 4900,
"valid_targets_mean": 2860.9,
"valid_targets_min": 717
},
{
"epoch": 6.655359565807327,
"grad_norm": 0.7808926512242406,
"learning_rate": 2.969648514640855e-07,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17209918797016144,
"step": 4905,
"valid_targets_mean": 2871.8,
"valid_targets_min": 817
},
{
"epoch": 6.6621438263229305,
"grad_norm": 0.7932529850799425,
"learning_rate": 2.854608561864702e-07,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17645207047462463,
"step": 4910,
"valid_targets_mean": 2660.2,
"valid_targets_min": 927
},
{
"epoch": 6.668928086838535,
"grad_norm": 0.92065568822347,
"learning_rate": 2.7418250740895325e-07,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19371803104877472,
"step": 4915,
"valid_targets_mean": 2207.4,
"valid_targets_min": 856
},
{
"epoch": 6.675712347354138,
"grad_norm": 0.6839393586837104,
"learning_rate": 2.6312993422001e-07,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17107108235359192,
"step": 4920,
"valid_targets_mean": 3477.2,
"valid_targets_min": 930
},
{
"epoch": 6.6824966078697425,
"grad_norm": 0.710980917983464,
"learning_rate": 2.5230326312397193e-07,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1745888739824295,
"step": 4925,
"valid_targets_mean": 3478.5,
"valid_targets_min": 642
},
{
"epoch": 6.689280868385346,
"grad_norm": 0.7823508117950982,
"learning_rate": 2.417026180395476e-07,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15715618431568146,
"step": 4930,
"valid_targets_mean": 2545.1,
"valid_targets_min": 895
},
{
"epoch": 6.696065128900949,
"grad_norm": 0.7659619371709346,
"learning_rate": 2.3132812029844187e-07,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14484542608261108,
"step": 4935,
"valid_targets_mean": 2404.1,
"valid_targets_min": 548
},
{
"epoch": 6.702849389416554,
"grad_norm": 0.7229493539815992,
"learning_rate": 2.2117988864393424e-07,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15829598903656006,
"step": 4940,
"valid_targets_mean": 3077.1,
"valid_targets_min": 714
},
{
"epoch": 6.709633649932157,
"grad_norm": 0.7896285355647491,
"learning_rate": 2.112580392295338e-07,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17784717679023743,
"step": 4945,
"valid_targets_mean": 2630.4,
"valid_targets_min": 1081
},
{
"epoch": 6.7164179104477615,
"grad_norm": 0.9253668056101276,
"learning_rate": 2.015626856176578e-07,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16507627069950104,
"step": 4950,
"valid_targets_mean": 2150.9,
"valid_targets_min": 815
},
{
"epoch": 6.723202170963365,
"grad_norm": 0.8173264202820435,
"learning_rate": 1.9209393877831273e-07,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18161508440971375,
"step": 4955,
"valid_targets_mean": 2604.2,
"valid_targets_min": 840
},
{
"epoch": 6.729986431478968,
"grad_norm": 0.7523430361745242,
"learning_rate": 1.8285190708783984e-07,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1569797694683075,
"step": 4960,
"valid_targets_mean": 2848.9,
"valid_targets_min": 1035
},
{
"epoch": 6.736770691994573,
"grad_norm": 0.7772846302429779,
"learning_rate": 1.7383669632766276e-07,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17585310339927673,
"step": 4965,
"valid_targets_mean": 2752.7,
"valid_targets_min": 792
},
{
"epoch": 6.743554952510176,
"grad_norm": 0.9312669800652025,
"learning_rate": 1.6504840968309288e-07,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16369280219078064,
"step": 4970,
"valid_targets_mean": 2244.8,
"valid_targets_min": 618
},
{
"epoch": 6.75033921302578,
"grad_norm": 0.740973564771969,
"learning_rate": 1.5648714774213037e-07,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16859431564807892,
"step": 4975,
"valid_targets_mean": 3112.4,
"valid_targets_min": 538
},
{
"epoch": 6.757123473541384,
"grad_norm": 0.800910909512139,
"learning_rate": 1.4815300849432278e-07,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1737082302570343,
"step": 4980,
"valid_targets_mean": 2754.4,
"valid_targets_min": 1617
},
{
"epoch": 6.763907734056987,
"grad_norm": 0.725161307786821,
"learning_rate": 1.400460873296461e-07,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16292381286621094,
"step": 4985,
"valid_targets_mean": 3145.3,
"valid_targets_min": 912
},
{
"epoch": 6.770691994572592,
"grad_norm": 0.8381499766215631,
"learning_rate": 1.3216647703740315e-07,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18227586150169373,
"step": 4990,
"valid_targets_mean": 2443.8,
"valid_targets_min": 944
},
{
"epoch": 6.777476255088195,
"grad_norm": 0.8004952099912124,
"learning_rate": 1.2451426780517363e-07,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17602723836898804,
"step": 4995,
"valid_targets_mean": 2544.9,
"valid_targets_min": 814
},
{
"epoch": 6.784260515603799,
"grad_norm": 0.8175798384888614,
"learning_rate": 1.1708954721776355e-07,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15319892764091492,
"step": 5000,
"valid_targets_mean": 3087.2,
"valid_targets_min": 1206
},
{
"epoch": 6.791044776119403,
"grad_norm": 0.8311080394214818,
"learning_rate": 1.0989240025622627e-07,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1745099425315857,
"step": 5005,
"valid_targets_mean": 2356.4,
"valid_targets_min": 754
},
{
"epoch": 6.797829036635007,
"grad_norm": 0.765582281484442,
"learning_rate": 1.0292290929687421e-07,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15547017753124237,
"step": 5010,
"valid_targets_mean": 2607.4,
"valid_targets_min": 656
},
{
"epoch": 6.804613297150611,
"grad_norm": 0.8814252430063856,
"learning_rate": 9.618115411033524e-08,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16623856127262115,
"step": 5015,
"valid_targets_mean": 2101.0,
"valid_targets_min": 732
},
{
"epoch": 6.811397557666214,
"grad_norm": 0.7599170245144763,
"learning_rate": 8.966721186065341e-08,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1648900806903839,
"step": 5020,
"valid_targets_mean": 2629.4,
"valid_targets_min": 1313
},
{
"epoch": 6.818181818181818,
"grad_norm": 0.6566181393738637,
"learning_rate": 8.338115710438744e-08,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1621677428483963,
"step": 5025,
"valid_targets_mean": 3358.0,
"valid_targets_min": 654
},
{
"epoch": 6.824966078697422,
"grad_norm": 0.7442894660376455,
"learning_rate": 7.732306178977134e-08,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1600368767976761,
"step": 5030,
"valid_targets_mean": 3117.9,
"valid_targets_min": 880
},
{
"epoch": 6.831750339213026,
"grad_norm": 0.7314337251400312,
"learning_rate": 7.149299525588405e-08,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1598661243915558,
"step": 5035,
"valid_targets_mean": 2865.1,
"valid_targets_min": 514
},
{
"epoch": 6.8385345997286295,
"grad_norm": 0.712971911902212,
"learning_rate": 6.58910242318611e-08,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1687866449356079,
"step": 5040,
"valid_targets_mean": 3268.2,
"valid_targets_min": 889
},
{
"epoch": 6.845318860244234,
"grad_norm": 0.7170233413590963,
"learning_rate": 6.051721283612422e-08,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16001065075397491,
"step": 5045,
"valid_targets_mean": 3043.4,
"valid_targets_min": 712
},
{
"epoch": 6.852103120759837,
"grad_norm": 0.8748422499637547,
"learning_rate": 5.537162257565065e-08,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17490287125110626,
"step": 5050,
"valid_targets_mean": 2234.8,
"valid_targets_min": 632
},
{
"epoch": 6.858887381275441,
"grad_norm": 0.7527414733725077,
"learning_rate": 5.045431234527165e-08,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17598162591457367,
"step": 5055,
"valid_targets_mean": 3049.6,
"valid_targets_min": 648
},
{
"epoch": 6.865671641791045,
"grad_norm": 0.750418327168722,
"learning_rate": 4.576533842699294e-08,
"loss": 0.1612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1612885594367981,
"step": 5060,
"valid_targets_mean": 2946.2,
"valid_targets_min": 981
},
{
"epoch": 6.8724559023066485,
"grad_norm": 0.8234037034287423,
"learning_rate": 4.1304754489359666e-08,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15995310246944427,
"step": 5065,
"valid_targets_mean": 2353.8,
"valid_targets_min": 803
},
{
"epoch": 6.879240162822253,
"grad_norm": 0.8151052308072695,
"learning_rate": 3.707261158682807e-08,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16730859875679016,
"step": 5070,
"valid_targets_mean": 2366.6,
"valid_targets_min": 706
},
{
"epoch": 6.886024423337856,
"grad_norm": 0.794569340466791,
"learning_rate": 3.306895815919475e-08,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17812877893447876,
"step": 5075,
"valid_targets_mean": 2787.9,
"valid_targets_min": 1092
},
{
"epoch": 6.89280868385346,
"grad_norm": 0.6779205812201277,
"learning_rate": 2.929384003103497e-08,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1553945243358612,
"step": 5080,
"valid_targets_mean": 3201.9,
"valid_targets_min": 858
},
{
"epoch": 6.899592944369064,
"grad_norm": 0.7802177039337713,
"learning_rate": 2.5747300411180787e-08,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16561156511306763,
"step": 5085,
"valid_targets_mean": 2595.4,
"valid_targets_min": 761
},
{
"epoch": 6.906377204884667,
"grad_norm": 0.811535089999137,
"learning_rate": 2.2429379892221493e-08,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1710594892501831,
"step": 5090,
"valid_targets_mean": 2819.6,
"valid_targets_min": 782
},
{
"epoch": 6.913161465400272,
"grad_norm": 0.7976488997817401,
"learning_rate": 1.9340116450050628e-08,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1631883978843689,
"step": 5095,
"valid_targets_mean": 2428.8,
"valid_targets_min": 697
},
{
"epoch": 6.919945725915875,
"grad_norm": 0.8090475833391716,
"learning_rate": 1.6479545443415236e-08,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1432981789112091,
"step": 5100,
"valid_targets_mean": 2219.2,
"valid_targets_min": 764
},
{
"epoch": 6.926729986431479,
"grad_norm": 0.682864252053581,
"learning_rate": 1.3847699613527276e-08,
"loss": 0.1572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1406230330467224,
"step": 5105,
"valid_targets_mean": 2982.7,
"valid_targets_min": 1119
},
{
"epoch": 6.933514246947083,
"grad_norm": 0.6898488676376657,
"learning_rate": 1.1444609083675062e-08,
"loss": 0.1682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1759582757949829,
"step": 5110,
"valid_targets_mean": 3367.1,
"valid_targets_min": 1487
},
{
"epoch": 6.940298507462686,
"grad_norm": 0.7796796211939258,
"learning_rate": 9.270301358890177e-09,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1705056130886078,
"step": 5115,
"valid_targets_mean": 2493.1,
"valid_targets_min": 780
},
{
"epoch": 6.947082767978291,
"grad_norm": 1.019436094106403,
"learning_rate": 7.324801325621078e-09,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1720581352710724,
"step": 5120,
"valid_targets_mean": 2621.9,
"valid_targets_min": 615
},
{
"epoch": 6.953867028493894,
"grad_norm": 0.7032830768741243,
"learning_rate": 5.6081312514599805e-09,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14902475476264954,
"step": 5125,
"valid_targets_mean": 3147.9,
"valid_targets_min": 1474
},
{
"epoch": 6.960651289009498,
"grad_norm": 0.7432217757535253,
"learning_rate": 4.120310784878623e-09,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1647299975156784,
"step": 5130,
"valid_targets_mean": 2841.1,
"valid_targets_min": 578
},
{
"epoch": 6.967435549525102,
"grad_norm": 0.7089666153527104,
"learning_rate": 2.861356955008443e-09,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19622814655303955,
"step": 5135,
"valid_targets_mean": 3448.8,
"valid_targets_min": 1062
},
{
"epoch": 6.974219810040705,
"grad_norm": 0.9344960536682286,
"learning_rate": 1.8312841714474005e-09,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16499242186546326,
"step": 5140,
"valid_targets_mean": 2747.8,
"valid_targets_min": 804
},
{
"epoch": 6.98100407055631,
"grad_norm": 0.7980431188161958,
"learning_rate": 1.030104224086781e-09,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15351396799087524,
"step": 5145,
"valid_targets_mean": 2372.8,
"valid_targets_min": 727
},
{
"epoch": 6.987788331071913,
"grad_norm": 0.6998390532387075,
"learning_rate": 4.578262829846303e-10,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1696673333644867,
"step": 5150,
"valid_targets_mean": 3469.1,
"valid_targets_min": 659
},
{
"epoch": 6.9945725915875165,
"grad_norm": 0.7592131753298821,
"learning_rate": 1.1445689825473339e-10,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16776353120803833,
"step": 5155,
"valid_targets_mean": 2719.2,
"valid_targets_min": 997
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16736872494220734,
"step": 5159,
"total_flos": 1027340714311680.0,
"train_loss": 0.24267188053672734,
"train_runtime": 23911.9379,
"train_samples_per_second": 3.449,
"train_steps_per_second": 0.216,
"valid_targets_mean": 2441.9,
"valid_targets_min": 1168
}
],
"logging_steps": 5,
"max_steps": 5159,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1027340714311680.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}