nl2bash-bugsshuffle / trainer_state.json
hf-reset
Reset repository without checkpoints directories
fb65c2d
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 6657,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.005257623554153523,
"grad_norm": 10.325974059947884,
"learning_rate": 2.4024024024024026e-07,
"loss": 0.5985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5698529481887817,
"step": 5,
"valid_targets_mean": 2187.3,
"valid_targets_min": 652
},
{
"epoch": 0.010515247108307046,
"grad_norm": 10.34611556198037,
"learning_rate": 5.405405405405406e-07,
"loss": 0.5861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6291496753692627,
"step": 10,
"valid_targets_mean": 2250.8,
"valid_targets_min": 825
},
{
"epoch": 0.015772870662460567,
"grad_norm": 8.757269404879597,
"learning_rate": 8.40840840840841e-07,
"loss": 0.6112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5312914848327637,
"step": 15,
"valid_targets_mean": 2316.7,
"valid_targets_min": 518
},
{
"epoch": 0.02103049421661409,
"grad_norm": 8.915168565359615,
"learning_rate": 1.1411411411411411e-06,
"loss": 0.5804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5726572871208191,
"step": 20,
"valid_targets_mean": 2757.2,
"valid_targets_min": 826
},
{
"epoch": 0.026288117770767613,
"grad_norm": 6.930471774373005,
"learning_rate": 1.4414414414414416e-06,
"loss": 0.569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.515241265296936,
"step": 25,
"valid_targets_mean": 2158.8,
"valid_targets_min": 655
},
{
"epoch": 0.031545741324921134,
"grad_norm": 5.464255752065892,
"learning_rate": 1.7417417417417418e-06,
"loss": 0.5258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48765829205513,
"step": 30,
"valid_targets_mean": 2350.6,
"valid_targets_min": 771
},
{
"epoch": 0.03680336487907466,
"grad_norm": 4.895194969300943,
"learning_rate": 2.0420420420420424e-06,
"loss": 0.5394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.549271821975708,
"step": 35,
"valid_targets_mean": 1980.2,
"valid_targets_min": 663
},
{
"epoch": 0.04206098843322818,
"grad_norm": 3.8055975289928003,
"learning_rate": 2.3423423423423424e-06,
"loss": 0.4583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48486676812171936,
"step": 40,
"valid_targets_mean": 2417.9,
"valid_targets_min": 750
},
{
"epoch": 0.0473186119873817,
"grad_norm": 3.126668847976631,
"learning_rate": 2.642642642642643e-06,
"loss": 0.4329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4197412133216858,
"step": 45,
"valid_targets_mean": 2325.9,
"valid_targets_min": 739
},
{
"epoch": 0.052576235541535225,
"grad_norm": 2.9703458920789476,
"learning_rate": 2.942942942942943e-06,
"loss": 0.4284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41909611225128174,
"step": 50,
"valid_targets_mean": 2370.1,
"valid_targets_min": 683
},
{
"epoch": 0.05783385909568875,
"grad_norm": 1.5787527955355334,
"learning_rate": 3.2432432432432437e-06,
"loss": 0.3751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37502822279930115,
"step": 55,
"valid_targets_mean": 2348.0,
"valid_targets_min": 789
},
{
"epoch": 0.06309148264984227,
"grad_norm": 1.2393001408568016,
"learning_rate": 3.5435435435435437e-06,
"loss": 0.3987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35404878854751587,
"step": 60,
"valid_targets_mean": 2349.1,
"valid_targets_min": 612
},
{
"epoch": 0.0683491062039958,
"grad_norm": 0.979857142940989,
"learning_rate": 3.843843843843844e-06,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2996273934841156,
"step": 65,
"valid_targets_mean": 2483.2,
"valid_targets_min": 717
},
{
"epoch": 0.07360672975814932,
"grad_norm": 0.9212476887598485,
"learning_rate": 4.1441441441441446e-06,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2870257496833801,
"step": 70,
"valid_targets_mean": 2394.4,
"valid_targets_min": 652
},
{
"epoch": 0.07886435331230283,
"grad_norm": 0.9469675437264563,
"learning_rate": 4.444444444444444e-06,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3160991668701172,
"step": 75,
"valid_targets_mean": 2335.7,
"valid_targets_min": 699
},
{
"epoch": 0.08412197686645637,
"grad_norm": 0.82749236172384,
"learning_rate": 4.7447447447447454e-06,
"loss": 0.2856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2892245352268219,
"step": 80,
"valid_targets_mean": 2259.5,
"valid_targets_min": 711
},
{
"epoch": 0.08937960042060988,
"grad_norm": 0.7604860837844936,
"learning_rate": 5.045045045045045e-06,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3247096836566925,
"step": 85,
"valid_targets_mean": 2552.5,
"valid_targets_min": 559
},
{
"epoch": 0.0946372239747634,
"grad_norm": 0.924772968564554,
"learning_rate": 5.345345345345346e-06,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3220024108886719,
"step": 90,
"valid_targets_mean": 2037.8,
"valid_targets_min": 618
},
{
"epoch": 0.09989484752891693,
"grad_norm": 0.7776137247177106,
"learning_rate": 5.645645645645647e-06,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2980426251888275,
"step": 95,
"valid_targets_mean": 2283.9,
"valid_targets_min": 488
},
{
"epoch": 0.10515247108307045,
"grad_norm": 0.66064778952609,
"learning_rate": 5.945945945945947e-06,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25451916456222534,
"step": 100,
"valid_targets_mean": 2559.4,
"valid_targets_min": 788
},
{
"epoch": 0.11041009463722397,
"grad_norm": 0.743316071167387,
"learning_rate": 6.246246246246247e-06,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.223159521818161,
"step": 105,
"valid_targets_mean": 2259.7,
"valid_targets_min": 615
},
{
"epoch": 0.1156677181913775,
"grad_norm": 0.660018316048897,
"learning_rate": 6.546546546546547e-06,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24553650617599487,
"step": 110,
"valid_targets_mean": 2373.6,
"valid_targets_min": 646
},
{
"epoch": 0.12092534174553102,
"grad_norm": 0.75313059375532,
"learning_rate": 6.846846846846848e-06,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2655906677246094,
"step": 115,
"valid_targets_mean": 1854.9,
"valid_targets_min": 697
},
{
"epoch": 0.12618296529968454,
"grad_norm": 0.9059966431167111,
"learning_rate": 7.147147147147148e-06,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2551083564758301,
"step": 120,
"valid_targets_mean": 1748.6,
"valid_targets_min": 677
},
{
"epoch": 0.13144058885383805,
"grad_norm": 0.6226560072430135,
"learning_rate": 7.447447447447448e-06,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2199288308620453,
"step": 125,
"valid_targets_mean": 2439.9,
"valid_targets_min": 830
},
{
"epoch": 0.1366982124079916,
"grad_norm": 0.7154734474743384,
"learning_rate": 7.747747747747749e-06,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24942263960838318,
"step": 130,
"valid_targets_mean": 2037.8,
"valid_targets_min": 749
},
{
"epoch": 0.14195583596214512,
"grad_norm": 0.7971901998725666,
"learning_rate": 8.048048048048048e-06,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27062466740608215,
"step": 135,
"valid_targets_mean": 2109.6,
"valid_targets_min": 522
},
{
"epoch": 0.14721345951629863,
"grad_norm": 0.7314031221791617,
"learning_rate": 8.348348348348348e-06,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23720356822013855,
"step": 140,
"valid_targets_mean": 2099.1,
"valid_targets_min": 741
},
{
"epoch": 0.15247108307045215,
"grad_norm": 0.7358610335324305,
"learning_rate": 8.64864864864865e-06,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25373178720474243,
"step": 145,
"valid_targets_mean": 2100.0,
"valid_targets_min": 881
},
{
"epoch": 0.15772870662460567,
"grad_norm": 0.7992179881681551,
"learning_rate": 8.94894894894895e-06,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26445630192756653,
"step": 150,
"valid_targets_mean": 1760.9,
"valid_targets_min": 658
},
{
"epoch": 0.16298633017875921,
"grad_norm": 0.7195681763815677,
"learning_rate": 9.24924924924925e-06,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23244032263755798,
"step": 155,
"valid_targets_mean": 2128.6,
"valid_targets_min": 589
},
{
"epoch": 0.16824395373291273,
"grad_norm": 0.6557286363239768,
"learning_rate": 9.54954954954955e-06,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20433446764945984,
"step": 160,
"valid_targets_mean": 2399.4,
"valid_targets_min": 458
},
{
"epoch": 0.17350157728706625,
"grad_norm": 0.691600778302532,
"learning_rate": 9.849849849849851e-06,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2632032632827759,
"step": 165,
"valid_targets_mean": 2430.4,
"valid_targets_min": 772
},
{
"epoch": 0.17875920084121977,
"grad_norm": 0.6089327617524263,
"learning_rate": 1.015015015015015e-05,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19681835174560547,
"step": 170,
"valid_targets_mean": 2616.8,
"valid_targets_min": 762
},
{
"epoch": 0.18401682439537329,
"grad_norm": 0.6984873873563,
"learning_rate": 1.0450450450450452e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22802557051181793,
"step": 175,
"valid_targets_mean": 2247.9,
"valid_targets_min": 577
},
{
"epoch": 0.1892744479495268,
"grad_norm": 0.764807422264669,
"learning_rate": 1.0750750750750751e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23037518560886383,
"step": 180,
"valid_targets_mean": 1950.9,
"valid_targets_min": 759
},
{
"epoch": 0.19453207150368035,
"grad_norm": 0.6083181160844173,
"learning_rate": 1.1051051051051051e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19824735820293427,
"step": 185,
"valid_targets_mean": 2341.1,
"valid_targets_min": 802
},
{
"epoch": 0.19978969505783387,
"grad_norm": 0.7577641290857153,
"learning_rate": 1.1351351351351352e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2339884638786316,
"step": 190,
"valid_targets_mean": 1832.2,
"valid_targets_min": 516
},
{
"epoch": 0.20504731861198738,
"grad_norm": 0.6227920663722901,
"learning_rate": 1.1651651651651652e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18700635433197021,
"step": 195,
"valid_targets_mean": 2573.8,
"valid_targets_min": 883
},
{
"epoch": 0.2103049421661409,
"grad_norm": 0.6402043732900615,
"learning_rate": 1.1951951951951951e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2238750010728836,
"step": 200,
"valid_targets_mean": 2668.7,
"valid_targets_min": 804
},
{
"epoch": 0.21556256572029442,
"grad_norm": 0.6263134032541054,
"learning_rate": 1.2252252252252253e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.185381680727005,
"step": 205,
"valid_targets_mean": 2980.8,
"valid_targets_min": 919
},
{
"epoch": 0.22082018927444794,
"grad_norm": 0.6523981097403889,
"learning_rate": 1.2552552552552552e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1915464848279953,
"step": 210,
"valid_targets_mean": 2569.8,
"valid_targets_min": 898
},
{
"epoch": 0.22607781282860148,
"grad_norm": 0.6741956953226019,
"learning_rate": 1.2852852852852854e-05,
"loss": 0.211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23643609881401062,
"step": 215,
"valid_targets_mean": 2380.8,
"valid_targets_min": 673
},
{
"epoch": 0.231335436382755,
"grad_norm": 0.6873623890856462,
"learning_rate": 1.3153153153153155e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2156476080417633,
"step": 220,
"valid_targets_mean": 2281.6,
"valid_targets_min": 582
},
{
"epoch": 0.23659305993690852,
"grad_norm": 0.5587768460857466,
"learning_rate": 1.3453453453453456e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1894698590040207,
"step": 225,
"valid_targets_mean": 2919.2,
"valid_targets_min": 740
},
{
"epoch": 0.24185068349106204,
"grad_norm": 0.7145488777949135,
"learning_rate": 1.3753753753753756e-05,
"loss": 0.2281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2471567541360855,
"step": 230,
"valid_targets_mean": 2381.1,
"valid_targets_min": 734
},
{
"epoch": 0.24710830704521555,
"grad_norm": 0.5501524932439846,
"learning_rate": 1.4054054054054055e-05,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18856927752494812,
"step": 235,
"valid_targets_mean": 3058.8,
"valid_targets_min": 855
},
{
"epoch": 0.25236593059936907,
"grad_norm": 0.799471898571431,
"learning_rate": 1.4354354354354357e-05,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25401976704597473,
"step": 240,
"valid_targets_mean": 1978.3,
"valid_targets_min": 782
},
{
"epoch": 0.2576235541535226,
"grad_norm": 0.5932338862383251,
"learning_rate": 1.4654654654654656e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1802828013896942,
"step": 245,
"valid_targets_mean": 2629.1,
"valid_targets_min": 529
},
{
"epoch": 0.2628811777076761,
"grad_norm": 0.6260958613247514,
"learning_rate": 1.4954954954954957e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2139127254486084,
"step": 250,
"valid_targets_mean": 2684.2,
"valid_targets_min": 596
},
{
"epoch": 0.26813880126182965,
"grad_norm": 0.6675664639310421,
"learning_rate": 1.5255255255255257e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1949969083070755,
"step": 255,
"valid_targets_mean": 2610.5,
"valid_targets_min": 699
},
{
"epoch": 0.2733964248159832,
"grad_norm": 0.9494391056576763,
"learning_rate": 1.555555555555556e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19775743782520294,
"step": 260,
"valid_targets_mean": 2579.2,
"valid_targets_min": 765
},
{
"epoch": 0.2786540483701367,
"grad_norm": 0.5683338310977286,
"learning_rate": 1.5855855855855858e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1904410570859909,
"step": 265,
"valid_targets_mean": 2987.2,
"valid_targets_min": 1078
},
{
"epoch": 0.28391167192429023,
"grad_norm": 0.6348899767525547,
"learning_rate": 1.6156156156156157e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17143738269805908,
"step": 270,
"valid_targets_mean": 2192.1,
"valid_targets_min": 871
},
{
"epoch": 0.2891692954784437,
"grad_norm": 0.5893782779917193,
"learning_rate": 1.6456456456456457e-05,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2026655077934265,
"step": 275,
"valid_targets_mean": 2866.9,
"valid_targets_min": 538
},
{
"epoch": 0.29442691903259727,
"grad_norm": 0.7451648590960245,
"learning_rate": 1.6756756756756757e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2093118131160736,
"step": 280,
"valid_targets_mean": 2221.4,
"valid_targets_min": 727
},
{
"epoch": 0.2996845425867508,
"grad_norm": 0.889222720310402,
"learning_rate": 1.705705705705706e-05,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.294559121131897,
"step": 285,
"valid_targets_mean": 1926.3,
"valid_targets_min": 734
},
{
"epoch": 0.3049421661409043,
"grad_norm": 0.665492563040093,
"learning_rate": 1.735735735735736e-05,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23913708329200745,
"step": 290,
"valid_targets_mean": 2329.9,
"valid_targets_min": 716
},
{
"epoch": 0.31019978969505785,
"grad_norm": 0.6853436124014033,
"learning_rate": 1.765765765765766e-05,
"loss": 0.2143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21258655190467834,
"step": 295,
"valid_targets_mean": 2236.8,
"valid_targets_min": 333
},
{
"epoch": 0.31545741324921134,
"grad_norm": 0.7220153580532297,
"learning_rate": 1.795795795795796e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18811582028865814,
"step": 300,
"valid_targets_mean": 2204.8,
"valid_targets_min": 543
},
{
"epoch": 0.3207150368033649,
"grad_norm": 0.6226543888854543,
"learning_rate": 1.8258258258258258e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17797502875328064,
"step": 305,
"valid_targets_mean": 2458.4,
"valid_targets_min": 816
},
{
"epoch": 0.32597266035751843,
"grad_norm": 0.7186866937790976,
"learning_rate": 1.855855855855856e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21228225529193878,
"step": 310,
"valid_targets_mean": 2375.6,
"valid_targets_min": 740
},
{
"epoch": 0.3312302839116719,
"grad_norm": 0.6936918457414369,
"learning_rate": 1.885885885885886e-05,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18250223994255066,
"step": 315,
"valid_targets_mean": 2669.8,
"valid_targets_min": 961
},
{
"epoch": 0.33648790746582546,
"grad_norm": 0.7534635493687819,
"learning_rate": 1.915915915915916e-05,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20414358377456665,
"step": 320,
"valid_targets_mean": 2061.4,
"valid_targets_min": 633
},
{
"epoch": 0.34174553101997895,
"grad_norm": 0.5642674252044817,
"learning_rate": 1.9459459459459463e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18312115967273712,
"step": 325,
"valid_targets_mean": 2918.9,
"valid_targets_min": 727
},
{
"epoch": 0.3470031545741325,
"grad_norm": 1.1061165336019023,
"learning_rate": 1.9759759759759763e-05,
"loss": 0.214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25024163722991943,
"step": 330,
"valid_targets_mean": 2102.5,
"valid_targets_min": 570
},
{
"epoch": 0.352260778128286,
"grad_norm": 0.6910255160002087,
"learning_rate": 2.0060060060060062e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19173447787761688,
"step": 335,
"valid_targets_mean": 2207.9,
"valid_targets_min": 712
},
{
"epoch": 0.35751840168243953,
"grad_norm": 0.7099021627794961,
"learning_rate": 2.0360360360360362e-05,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2061748504638672,
"step": 340,
"valid_targets_mean": 2240.0,
"valid_targets_min": 816
},
{
"epoch": 0.3627760252365931,
"grad_norm": 0.6310405251066221,
"learning_rate": 2.066066066066066e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.176910400390625,
"step": 345,
"valid_targets_mean": 2483.1,
"valid_targets_min": 530
},
{
"epoch": 0.36803364879074657,
"grad_norm": 0.6741541048094768,
"learning_rate": 2.0960960960960964e-05,
"loss": 0.2083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16975396871566772,
"step": 350,
"valid_targets_mean": 2461.9,
"valid_targets_min": 704
},
{
"epoch": 0.3732912723449001,
"grad_norm": 0.6677794123031981,
"learning_rate": 2.1261261261261264e-05,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17146332561969757,
"step": 355,
"valid_targets_mean": 1978.3,
"valid_targets_min": 662
},
{
"epoch": 0.3785488958990536,
"grad_norm": 0.775718171958301,
"learning_rate": 2.1561561561561564e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2536715269088745,
"step": 360,
"valid_targets_mean": 2015.7,
"valid_targets_min": 720
},
{
"epoch": 0.38380651945320715,
"grad_norm": 0.6325528998646359,
"learning_rate": 2.1861861861861863e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20889200270175934,
"step": 365,
"valid_targets_mean": 2631.3,
"valid_targets_min": 818
},
{
"epoch": 0.3890641430073607,
"grad_norm": 0.7213306891722329,
"learning_rate": 2.2162162162162163e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2096201777458191,
"step": 370,
"valid_targets_mean": 2089.7,
"valid_targets_min": 741
},
{
"epoch": 0.3943217665615142,
"grad_norm": 0.5349085473692315,
"learning_rate": 2.2462462462462466e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13460159301757812,
"step": 375,
"valid_targets_mean": 2720.9,
"valid_targets_min": 485
},
{
"epoch": 0.39957939011566773,
"grad_norm": 0.6373080512649653,
"learning_rate": 2.2762762762762765e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.181401789188385,
"step": 380,
"valid_targets_mean": 2664.4,
"valid_targets_min": 927
},
{
"epoch": 0.4048370136698212,
"grad_norm": 0.815663581320817,
"learning_rate": 2.3063063063063065e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19424355030059814,
"step": 385,
"valid_targets_mean": 2010.2,
"valid_targets_min": 534
},
{
"epoch": 0.41009463722397477,
"grad_norm": 0.6746297245872371,
"learning_rate": 2.3363363363363364e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19251810014247894,
"step": 390,
"valid_targets_mean": 2467.2,
"valid_targets_min": 847
},
{
"epoch": 0.4153522607781283,
"grad_norm": 0.6317551272807292,
"learning_rate": 2.3663663663663664e-05,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18690259754657745,
"step": 395,
"valid_targets_mean": 2629.9,
"valid_targets_min": 940
},
{
"epoch": 0.4206098843322818,
"grad_norm": 0.5930390638966087,
"learning_rate": 2.3963963963963967e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17946986854076385,
"step": 400,
"valid_targets_mean": 2703.4,
"valid_targets_min": 689
},
{
"epoch": 0.42586750788643535,
"grad_norm": 0.722799696829428,
"learning_rate": 2.4264264264264267e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2141094207763672,
"step": 405,
"valid_targets_mean": 2128.2,
"valid_targets_min": 712
},
{
"epoch": 0.43112513144058884,
"grad_norm": 0.760671547292989,
"learning_rate": 2.4564564564564566e-05,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19687330722808838,
"step": 410,
"valid_targets_mean": 1751.6,
"valid_targets_min": 638
},
{
"epoch": 0.4363827549947424,
"grad_norm": 0.6909768606370942,
"learning_rate": 2.4864864864864866e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2088453322649002,
"step": 415,
"valid_targets_mean": 2239.5,
"valid_targets_min": 478
},
{
"epoch": 0.4416403785488959,
"grad_norm": 0.5903366376741392,
"learning_rate": 2.5165165165165165e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1566462516784668,
"step": 420,
"valid_targets_mean": 2530.4,
"valid_targets_min": 816
},
{
"epoch": 0.4468980021030494,
"grad_norm": 0.6147737168498079,
"learning_rate": 2.5465465465465465e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.175796240568161,
"step": 425,
"valid_targets_mean": 2636.4,
"valid_targets_min": 744
},
{
"epoch": 0.45215562565720296,
"grad_norm": 0.7187613599477839,
"learning_rate": 2.5765765765765768e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1862875074148178,
"step": 430,
"valid_targets_mean": 2198.9,
"valid_targets_min": 649
},
{
"epoch": 0.45741324921135645,
"grad_norm": 0.5974366789403296,
"learning_rate": 2.6066066066066067e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20132970809936523,
"step": 435,
"valid_targets_mean": 2388.2,
"valid_targets_min": 718
},
{
"epoch": 0.46267087276551,
"grad_norm": 0.7290863107759993,
"learning_rate": 2.6366366366366367e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1937723457813263,
"step": 440,
"valid_targets_mean": 2251.8,
"valid_targets_min": 682
},
{
"epoch": 0.4679284963196635,
"grad_norm": 0.7201505656839541,
"learning_rate": 2.6666666666666667e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20128653943538666,
"step": 445,
"valid_targets_mean": 2351.4,
"valid_targets_min": 797
},
{
"epoch": 0.47318611987381703,
"grad_norm": 0.7538369265177368,
"learning_rate": 2.6966966966966966e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18841460347175598,
"step": 450,
"valid_targets_mean": 1894.8,
"valid_targets_min": 909
},
{
"epoch": 0.4784437434279706,
"grad_norm": 0.6855349353613355,
"learning_rate": 2.726726726726727e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1809961497783661,
"step": 455,
"valid_targets_mean": 2314.8,
"valid_targets_min": 645
},
{
"epoch": 0.48370136698212407,
"grad_norm": 0.557578493597873,
"learning_rate": 2.756756756756757e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15485841035842896,
"step": 460,
"valid_targets_mean": 2608.8,
"valid_targets_min": 526
},
{
"epoch": 0.4889589905362776,
"grad_norm": 0.5943630435783159,
"learning_rate": 2.786786786786787e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17757076025009155,
"step": 465,
"valid_targets_mean": 2493.2,
"valid_targets_min": 734
},
{
"epoch": 0.4942166140904311,
"grad_norm": 0.6835416043237226,
"learning_rate": 2.8168168168168168e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16320756077766418,
"step": 470,
"valid_targets_mean": 1887.7,
"valid_targets_min": 722
},
{
"epoch": 0.49947423764458465,
"grad_norm": 0.7077909962188252,
"learning_rate": 2.8468468468468467e-05,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1896069049835205,
"step": 475,
"valid_targets_mean": 1849.9,
"valid_targets_min": 711
},
{
"epoch": 0.5047318611987381,
"grad_norm": 0.6617014641404008,
"learning_rate": 2.8768768768768774e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17856386303901672,
"step": 480,
"valid_targets_mean": 2606.5,
"valid_targets_min": 757
},
{
"epoch": 0.5099894847528917,
"grad_norm": 0.7315452586981643,
"learning_rate": 2.9069069069069073e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21579106152057648,
"step": 485,
"valid_targets_mean": 2144.4,
"valid_targets_min": 591
},
{
"epoch": 0.5152471083070452,
"grad_norm": 0.7395163140849079,
"learning_rate": 2.9369369369369373e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20368653535842896,
"step": 490,
"valid_targets_mean": 1992.6,
"valid_targets_min": 851
},
{
"epoch": 0.5205047318611987,
"grad_norm": 0.6422630720939135,
"learning_rate": 2.9669669669669673e-05,
"loss": 0.1869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24187633395195007,
"step": 495,
"valid_targets_mean": 2486.3,
"valid_targets_min": 770
},
{
"epoch": 0.5257623554153522,
"grad_norm": 0.7367030484019584,
"learning_rate": 2.9969969969969976e-05,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13721273839473724,
"step": 500,
"valid_targets_mean": 2497.6,
"valid_targets_min": 862
},
{
"epoch": 0.5310199789695058,
"grad_norm": 0.6497925578020836,
"learning_rate": 3.0270270270270275e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16397172212600708,
"step": 505,
"valid_targets_mean": 1927.3,
"valid_targets_min": 614
},
{
"epoch": 0.5362776025236593,
"grad_norm": 0.6420648792656638,
"learning_rate": 3.0570570570570575e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1578940749168396,
"step": 510,
"valid_targets_mean": 2199.2,
"valid_targets_min": 550
},
{
"epoch": 0.5415352260778128,
"grad_norm": 0.6323088462269795,
"learning_rate": 3.0870870870870874e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1881733536720276,
"step": 515,
"valid_targets_mean": 2238.9,
"valid_targets_min": 736
},
{
"epoch": 0.5467928496319664,
"grad_norm": 0.6071581287757932,
"learning_rate": 3.1171171171171174e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.161208838224411,
"step": 520,
"valid_targets_mean": 2443.1,
"valid_targets_min": 909
},
{
"epoch": 0.5520504731861199,
"grad_norm": 0.5722165896765079,
"learning_rate": 3.1471471471471473e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628541648387909,
"step": 525,
"valid_targets_mean": 2472.2,
"valid_targets_min": 424
},
{
"epoch": 0.5573080967402734,
"grad_norm": 0.5718409638706886,
"learning_rate": 3.177177177177177e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16681770980358124,
"step": 530,
"valid_targets_mean": 2387.2,
"valid_targets_min": 676
},
{
"epoch": 0.562565720294427,
"grad_norm": 0.7034879401845234,
"learning_rate": 3.207207207207207e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1751999855041504,
"step": 535,
"valid_targets_mean": 2111.0,
"valid_targets_min": 692
},
{
"epoch": 0.5678233438485805,
"grad_norm": 0.9071190797548387,
"learning_rate": 3.237237237237238e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1928257793188095,
"step": 540,
"valid_targets_mean": 2259.1,
"valid_targets_min": 767
},
{
"epoch": 0.573080967402734,
"grad_norm": 0.6957506105580801,
"learning_rate": 3.267267267267268e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19071762263774872,
"step": 545,
"valid_targets_mean": 2100.1,
"valid_targets_min": 593
},
{
"epoch": 0.5783385909568874,
"grad_norm": 0.7884429234830329,
"learning_rate": 3.297297297297298e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18166415393352509,
"step": 550,
"valid_targets_mean": 1668.4,
"valid_targets_min": 673
},
{
"epoch": 0.583596214511041,
"grad_norm": 0.5737532599035816,
"learning_rate": 3.327327327327328e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15513579547405243,
"step": 555,
"valid_targets_mean": 2771.8,
"valid_targets_min": 710
},
{
"epoch": 0.5888538380651945,
"grad_norm": 0.5734107825488577,
"learning_rate": 3.357357357357358e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18644770979881287,
"step": 560,
"valid_targets_mean": 2491.6,
"valid_targets_min": 658
},
{
"epoch": 0.594111461619348,
"grad_norm": 0.5553995753854393,
"learning_rate": 3.387387387387388e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17800036072731018,
"step": 565,
"valid_targets_mean": 2598.2,
"valid_targets_min": 1126
},
{
"epoch": 0.5993690851735016,
"grad_norm": 0.6360637990611876,
"learning_rate": 3.4174174174174176e-05,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16586969792842865,
"step": 570,
"valid_targets_mean": 2114.4,
"valid_targets_min": 632
},
{
"epoch": 0.6046267087276551,
"grad_norm": 0.599463088721673,
"learning_rate": 3.4474474474474476e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1638803482055664,
"step": 575,
"valid_targets_mean": 2169.0,
"valid_targets_min": 851
},
{
"epoch": 0.6098843322818086,
"grad_norm": 0.7816240205612559,
"learning_rate": 3.4774774774774776e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21671947836875916,
"step": 580,
"valid_targets_mean": 1645.6,
"valid_targets_min": 781
},
{
"epoch": 0.6151419558359621,
"grad_norm": 0.7398920407442463,
"learning_rate": 3.5075075075075075e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20531770586967468,
"step": 585,
"valid_targets_mean": 2567.9,
"valid_targets_min": 523
},
{
"epoch": 0.6203995793901157,
"grad_norm": 0.49902272883171905,
"learning_rate": 3.5375375375375375e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13718831539154053,
"step": 590,
"valid_targets_mean": 2637.8,
"valid_targets_min": 484
},
{
"epoch": 0.6256572029442692,
"grad_norm": 0.6814272166124004,
"learning_rate": 3.567567567567568e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1921451985836029,
"step": 595,
"valid_targets_mean": 2228.6,
"valid_targets_min": 786
},
{
"epoch": 0.6309148264984227,
"grad_norm": 0.5437394859533489,
"learning_rate": 3.597597597597598e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18390172719955444,
"step": 600,
"valid_targets_mean": 2788.6,
"valid_targets_min": 1249
},
{
"epoch": 0.6361724500525763,
"grad_norm": 0.7445833625193122,
"learning_rate": 3.627627627627628e-05,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20908337831497192,
"step": 605,
"valid_targets_mean": 1758.6,
"valid_targets_min": 559
},
{
"epoch": 0.6414300736067298,
"grad_norm": 0.7236716425859328,
"learning_rate": 3.657657657657658e-05,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20160071551799774,
"step": 610,
"valid_targets_mean": 1882.8,
"valid_targets_min": 788
},
{
"epoch": 0.6466876971608833,
"grad_norm": 0.681907959030046,
"learning_rate": 3.687687687687688e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19641152024269104,
"step": 615,
"valid_targets_mean": 2132.7,
"valid_targets_min": 724
},
{
"epoch": 0.6519453207150369,
"grad_norm": 0.45721078622016703,
"learning_rate": 3.717717717717718e-05,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13573741912841797,
"step": 620,
"valid_targets_mean": 3075.2,
"valid_targets_min": 788
},
{
"epoch": 0.6572029442691903,
"grad_norm": 0.6225687786900717,
"learning_rate": 3.747747747747748e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18571923673152924,
"step": 625,
"valid_targets_mean": 2183.8,
"valid_targets_min": 700
},
{
"epoch": 0.6624605678233438,
"grad_norm": 0.6009341475358304,
"learning_rate": 3.777777777777778e-05,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1731058955192566,
"step": 630,
"valid_targets_mean": 2362.7,
"valid_targets_min": 804
},
{
"epoch": 0.6677181913774973,
"grad_norm": 0.6464808668170543,
"learning_rate": 3.807807807807808e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1671919822692871,
"step": 635,
"valid_targets_mean": 1980.8,
"valid_targets_min": 592
},
{
"epoch": 0.6729758149316509,
"grad_norm": 0.5632651786349206,
"learning_rate": 3.837837837837838e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18203315138816833,
"step": 640,
"valid_targets_mean": 2670.2,
"valid_targets_min": 750
},
{
"epoch": 0.6782334384858044,
"grad_norm": 0.5810773855761291,
"learning_rate": 3.8678678678678684e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18520139157772064,
"step": 645,
"valid_targets_mean": 2278.9,
"valid_targets_min": 787
},
{
"epoch": 0.6834910620399579,
"grad_norm": 0.6150283734943846,
"learning_rate": 3.897897897897898e-05,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14168278872966766,
"step": 650,
"valid_targets_mean": 2230.8,
"valid_targets_min": 722
},
{
"epoch": 0.6887486855941115,
"grad_norm": 0.5645102322077462,
"learning_rate": 3.927927927927928e-05,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16727334260940552,
"step": 655,
"valid_targets_mean": 2240.4,
"valid_targets_min": 773
},
{
"epoch": 0.694006309148265,
"grad_norm": 0.5281592910351098,
"learning_rate": 3.957957957957958e-05,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15454602241516113,
"step": 660,
"valid_targets_mean": 2391.4,
"valid_targets_min": 785
},
{
"epoch": 0.6992639327024185,
"grad_norm": 0.5959270183647,
"learning_rate": 3.987987987987988e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17326083779335022,
"step": 665,
"valid_targets_mean": 2328.1,
"valid_targets_min": 841
},
{
"epoch": 0.704521556256572,
"grad_norm": 0.6339966781689561,
"learning_rate": 3.9999975251805184e-05,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16850808262825012,
"step": 670,
"valid_targets_mean": 2042.2,
"valid_targets_min": 777
},
{
"epoch": 0.7097791798107256,
"grad_norm": 0.5987674114964633,
"learning_rate": 3.9999824013058675e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16761921346187592,
"step": 675,
"valid_targets_mean": 2518.4,
"valid_targets_min": 760
},
{
"epoch": 0.7150368033648791,
"grad_norm": 0.635898070816828,
"learning_rate": 3.99995352856012e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20546624064445496,
"step": 680,
"valid_targets_mean": 2519.9,
"valid_targets_min": 985
},
{
"epoch": 0.7202944269190326,
"grad_norm": 0.5704696477449783,
"learning_rate": 3.999910907141761e-05,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16397696733474731,
"step": 685,
"valid_targets_mean": 2938.4,
"valid_targets_min": 921
},
{
"epoch": 0.7255520504731862,
"grad_norm": 0.5893660568484972,
"learning_rate": 3.9998545373437924e-05,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19878719747066498,
"step": 690,
"valid_targets_mean": 2286.5,
"valid_targets_min": 623
},
{
"epoch": 0.7308096740273397,
"grad_norm": 0.6433652331608646,
"learning_rate": 3.999784419553728e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15845108032226562,
"step": 695,
"valid_targets_mean": 1922.4,
"valid_targets_min": 563
},
{
"epoch": 0.7360672975814931,
"grad_norm": 0.4487958100841574,
"learning_rate": 3.9997005542535916e-05,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13349756598472595,
"step": 700,
"valid_targets_mean": 3132.7,
"valid_targets_min": 777
},
{
"epoch": 0.7413249211356467,
"grad_norm": 0.5017683246837674,
"learning_rate": 3.9996029420199154e-05,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14281517267227173,
"step": 705,
"valid_targets_mean": 3116.9,
"valid_targets_min": 768
},
{
"epoch": 0.7465825446898002,
"grad_norm": 0.6680436188387587,
"learning_rate": 3.9994915835237336e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16415849328041077,
"step": 710,
"valid_targets_mean": 1991.9,
"valid_targets_min": 622
},
{
"epoch": 0.7518401682439537,
"grad_norm": 0.5786349741556408,
"learning_rate": 3.999366479530581e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2101982682943344,
"step": 715,
"valid_targets_mean": 2443.0,
"valid_targets_min": 750
},
{
"epoch": 0.7570977917981072,
"grad_norm": 0.6321178555432165,
"learning_rate": 3.999227630900483e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14732156693935394,
"step": 720,
"valid_targets_mean": 2187.8,
"valid_targets_min": 645
},
{
"epoch": 0.7623554153522608,
"grad_norm": 0.5873468724272303,
"learning_rate": 3.9990750385879554e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1809384822845459,
"step": 725,
"valid_targets_mean": 2686.9,
"valid_targets_min": 759
},
{
"epoch": 0.7676130389064143,
"grad_norm": 0.770293637713331,
"learning_rate": 3.998908703641993e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19991716742515564,
"step": 730,
"valid_targets_mean": 1949.1,
"valid_targets_min": 544
},
{
"epoch": 0.7728706624605678,
"grad_norm": 0.544064862966594,
"learning_rate": 3.9987286272060644e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14638791978359222,
"step": 735,
"valid_targets_mean": 2426.7,
"valid_targets_min": 794
},
{
"epoch": 0.7781282860147214,
"grad_norm": 0.5444828725185055,
"learning_rate": 3.998534810518104e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1417040228843689,
"step": 740,
"valid_targets_mean": 2386.8,
"valid_targets_min": 1117
},
{
"epoch": 0.7833859095688749,
"grad_norm": 0.6403914222370137,
"learning_rate": 3.998327254910504e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2143629491329193,
"step": 745,
"valid_targets_mean": 1959.9,
"valid_targets_min": 1044
},
{
"epoch": 0.7886435331230284,
"grad_norm": 0.5028262785941544,
"learning_rate": 3.998105961810105e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15218302607536316,
"step": 750,
"valid_targets_mean": 2712.9,
"valid_targets_min": 691
},
{
"epoch": 0.7939011566771819,
"grad_norm": 0.7306148472705972,
"learning_rate": 3.997870932738187e-05,
"loss": 0.1879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1602567732334137,
"step": 755,
"valid_targets_mean": 2521.6,
"valid_targets_min": 731
},
{
"epoch": 0.7991587802313355,
"grad_norm": 0.5832513468291718,
"learning_rate": 3.997622169310454e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18383777141571045,
"step": 760,
"valid_targets_mean": 2134.2,
"valid_targets_min": 655
},
{
"epoch": 0.804416403785489,
"grad_norm": 0.6242876619796933,
"learning_rate": 3.9973596732370296e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1778438687324524,
"step": 765,
"valid_targets_mean": 1782.9,
"valid_targets_min": 490
},
{
"epoch": 0.8096740273396424,
"grad_norm": 0.696908627361147,
"learning_rate": 3.997083446322443e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18748943507671356,
"step": 770,
"valid_targets_mean": 1747.4,
"valid_targets_min": 697
},
{
"epoch": 0.814931650893796,
"grad_norm": 0.7540305921918701,
"learning_rate": 3.9967934904656145e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19418692588806152,
"step": 775,
"valid_targets_mean": 1872.0,
"valid_targets_min": 754
},
{
"epoch": 0.8201892744479495,
"grad_norm": 0.6401412864858457,
"learning_rate": 3.9964898076598445e-05,
"loss": 0.1676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17221704125404358,
"step": 780,
"valid_targets_mean": 1849.5,
"valid_targets_min": 717
},
{
"epoch": 0.825446898002103,
"grad_norm": 0.5747510347430306,
"learning_rate": 3.996172399992799e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18032671511173248,
"step": 785,
"valid_targets_mean": 2206.8,
"valid_targets_min": 721
},
{
"epoch": 0.8307045215562566,
"grad_norm": 0.5179693444755097,
"learning_rate": 3.995841269646496e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442815214395523,
"step": 790,
"valid_targets_mean": 2437.4,
"valid_targets_min": 711
},
{
"epoch": 0.8359621451104101,
"grad_norm": 0.5889811942367722,
"learning_rate": 3.995496418897291e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15919098258018494,
"step": 795,
"valid_targets_mean": 2093.8,
"valid_targets_min": 573
},
{
"epoch": 0.8412197686645636,
"grad_norm": 0.48159733784105707,
"learning_rate": 3.995137850115856e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1566462367773056,
"step": 800,
"valid_targets_mean": 2729.2,
"valid_targets_min": 1026
},
{
"epoch": 0.8464773922187171,
"grad_norm": 0.45889986939992605,
"learning_rate": 3.994765565767174e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15732339024543762,
"step": 805,
"valid_targets_mean": 2682.2,
"valid_targets_min": 902
},
{
"epoch": 0.8517350157728707,
"grad_norm": 0.5920820501188195,
"learning_rate": 3.9943795684105104e-05,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16061899065971375,
"step": 810,
"valid_targets_mean": 2266.4,
"valid_targets_min": 711
},
{
"epoch": 0.8569926393270242,
"grad_norm": 0.49656435706906604,
"learning_rate": 3.993979860699403e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17811651527881622,
"step": 815,
"valid_targets_mean": 2735.4,
"valid_targets_min": 833
},
{
"epoch": 0.8622502628811777,
"grad_norm": 0.4581859924468785,
"learning_rate": 3.993566445381641e-05,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1335049718618393,
"step": 820,
"valid_targets_mean": 2790.2,
"valid_targets_min": 446
},
{
"epoch": 0.8675078864353313,
"grad_norm": 0.5895950662286351,
"learning_rate": 3.9931393252992454e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17721489071846008,
"step": 825,
"valid_targets_mean": 2180.7,
"valid_targets_min": 683
},
{
"epoch": 0.8727655099894848,
"grad_norm": 0.5802489189400181,
"learning_rate": 3.992698503388453e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15258771181106567,
"step": 830,
"valid_targets_mean": 2000.4,
"valid_targets_min": 518
},
{
"epoch": 0.8780231335436383,
"grad_norm": 0.4993161271086695,
"learning_rate": 3.992243982679691e-05,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15528042614459991,
"step": 835,
"valid_targets_mean": 2338.6,
"valid_targets_min": 664
},
{
"epoch": 0.8832807570977917,
"grad_norm": 0.49788813008883437,
"learning_rate": 3.991775766297562e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17193055152893066,
"step": 840,
"valid_targets_mean": 2463.5,
"valid_targets_min": 521
},
{
"epoch": 0.8885383806519453,
"grad_norm": 0.62190442322264,
"learning_rate": 3.991293857460815e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14908094704151154,
"step": 845,
"valid_targets_mean": 2454.8,
"valid_targets_min": 747
},
{
"epoch": 0.8937960042060988,
"grad_norm": 0.564106713835091,
"learning_rate": 3.9907982594823326e-05,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14456875622272491,
"step": 850,
"valid_targets_mean": 1942.8,
"valid_targets_min": 337
},
{
"epoch": 0.8990536277602523,
"grad_norm": 0.5652238802710153,
"learning_rate": 3.9902889757691e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15603473782539368,
"step": 855,
"valid_targets_mean": 2479.9,
"valid_targets_min": 449
},
{
"epoch": 0.9043112513144059,
"grad_norm": 0.5557854689743138,
"learning_rate": 3.9897660098221866e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1946299523115158,
"step": 860,
"valid_targets_mean": 2797.2,
"valid_targets_min": 1127
},
{
"epoch": 0.9095688748685594,
"grad_norm": 0.47848415326154364,
"learning_rate": 3.98922936523672e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15333466231822968,
"step": 865,
"valid_targets_mean": 2642.8,
"valid_targets_min": 748
},
{
"epoch": 0.9148264984227129,
"grad_norm": 0.5477124486710891,
"learning_rate": 3.9886790457018604e-05,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1455027163028717,
"step": 870,
"valid_targets_mean": 2130.8,
"valid_targets_min": 554
},
{
"epoch": 0.9200841219768665,
"grad_norm": 0.482463002665872,
"learning_rate": 3.9881150550007776e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15480923652648926,
"step": 875,
"valid_targets_mean": 2639.6,
"valid_targets_min": 746
},
{
"epoch": 0.92534174553102,
"grad_norm": 0.6091923554351032,
"learning_rate": 3.987537397010624e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18330509960651398,
"step": 880,
"valid_targets_mean": 1815.5,
"valid_targets_min": 803
},
{
"epoch": 0.9305993690851735,
"grad_norm": 0.5769865256429234,
"learning_rate": 3.9869460757025064e-05,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15766553580760956,
"step": 885,
"valid_targets_mean": 2084.2,
"valid_targets_min": 677
},
{
"epoch": 0.935856992639327,
"grad_norm": 0.46131201133569494,
"learning_rate": 3.9863410951414616e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14745357632637024,
"step": 890,
"valid_targets_mean": 2944.2,
"valid_targets_min": 855
},
{
"epoch": 0.9411146161934806,
"grad_norm": 0.617416236613489,
"learning_rate": 3.985722459486425e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1965213119983673,
"step": 895,
"valid_targets_mean": 1945.8,
"valid_targets_min": 639
},
{
"epoch": 0.9463722397476341,
"grad_norm": 0.6068341327737703,
"learning_rate": 3.985090172990206e-05,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1689082831144333,
"step": 900,
"valid_targets_mean": 2248.5,
"valid_targets_min": 684
},
{
"epoch": 0.9516298633017876,
"grad_norm": 0.5912572095950641,
"learning_rate": 3.984444239999455e-05,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16497471928596497,
"step": 905,
"valid_targets_mean": 1847.9,
"valid_targets_min": 566
},
{
"epoch": 0.9568874868559412,
"grad_norm": 0.5841589712639083,
"learning_rate": 3.9837846649546354e-05,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18890559673309326,
"step": 910,
"valid_targets_mean": 2282.3,
"valid_targets_min": 549
},
{
"epoch": 0.9621451104100947,
"grad_norm": 0.5007366217729837,
"learning_rate": 3.9831114523899945e-05,
"loss": 0.1627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1335860937833786,
"step": 915,
"valid_targets_mean": 2242.7,
"valid_targets_min": 539
},
{
"epoch": 0.9674027339642481,
"grad_norm": 0.6870618813935128,
"learning_rate": 3.982424606933529e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15983468294143677,
"step": 920,
"valid_targets_mean": 1903.2,
"valid_targets_min": 486
},
{
"epoch": 0.9726603575184016,
"grad_norm": 0.5199752289946125,
"learning_rate": 3.981724133306954e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1660923957824707,
"step": 925,
"valid_targets_mean": 2608.4,
"valid_targets_min": 847
},
{
"epoch": 0.9779179810725552,
"grad_norm": 0.5424070805126671,
"learning_rate": 3.981010036325674e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15435153245925903,
"step": 930,
"valid_targets_mean": 1866.8,
"valid_targets_min": 526
},
{
"epoch": 0.9831756046267087,
"grad_norm": 0.4825716591165228,
"learning_rate": 3.980282320898746e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14119663834571838,
"step": 935,
"valid_targets_mean": 2298.9,
"valid_targets_min": 802
},
{
"epoch": 0.9884332281808622,
"grad_norm": 0.5588624288109972,
"learning_rate": 3.9795409920288456e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20035411417484283,
"step": 940,
"valid_targets_mean": 2405.1,
"valid_targets_min": 667
},
{
"epoch": 0.9936908517350158,
"grad_norm": 0.5412933819885745,
"learning_rate": 3.978786054812236e-05,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15584760904312134,
"step": 945,
"valid_targets_mean": 2029.0,
"valid_targets_min": 641
},
{
"epoch": 0.9989484752891693,
"grad_norm": 0.5590037279130108,
"learning_rate": 3.9780175144387304e-05,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18622665107250214,
"step": 950,
"valid_targets_mean": 2303.4,
"valid_targets_min": 751
},
{
"epoch": 1.0042060988433228,
"grad_norm": 0.4913941844630526,
"learning_rate": 3.977235376191656e-05,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13712620735168457,
"step": 955,
"valid_targets_mean": 2234.4,
"valid_targets_min": 697
},
{
"epoch": 1.0094637223974763,
"grad_norm": 0.5574044477571565,
"learning_rate": 3.9764396454478195e-05,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1726335883140564,
"step": 960,
"valid_targets_mean": 2338.3,
"valid_targets_min": 696
},
{
"epoch": 1.0147213459516298,
"grad_norm": 0.5770000978677239,
"learning_rate": 3.975630327677468e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1890842169523239,
"step": 965,
"valid_targets_mean": 2206.1,
"valid_targets_min": 776
},
{
"epoch": 1.0199789695057835,
"grad_norm": 0.6739464685570162,
"learning_rate": 3.974807428444254e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16731727123260498,
"step": 970,
"valid_targets_mean": 1820.7,
"valid_targets_min": 796
},
{
"epoch": 1.025236593059937,
"grad_norm": 0.5005618630147292,
"learning_rate": 3.973970953405195e-05,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13522601127624512,
"step": 975,
"valid_targets_mean": 2267.5,
"valid_targets_min": 767
},
{
"epoch": 1.0304942166140905,
"grad_norm": 0.5342310903126117,
"learning_rate": 3.9731209083106354e-05,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15838786959648132,
"step": 980,
"valid_targets_mean": 2170.8,
"valid_targets_min": 337
},
{
"epoch": 1.035751840168244,
"grad_norm": 0.5422313577106275,
"learning_rate": 3.972257299004206e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16515782475471497,
"step": 985,
"valid_targets_mean": 2289.5,
"valid_targets_min": 771
},
{
"epoch": 1.0410094637223974,
"grad_norm": 0.5515823157763934,
"learning_rate": 3.9713801314227867e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17059384286403656,
"step": 990,
"valid_targets_mean": 1878.6,
"valid_targets_min": 246
},
{
"epoch": 1.046267087276551,
"grad_norm": 0.47915626914547066,
"learning_rate": 3.9704894115964615e-05,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13370344042778015,
"step": 995,
"valid_targets_mean": 2246.9,
"valid_targets_min": 760
},
{
"epoch": 1.0515247108307044,
"grad_norm": 0.43390148331658024,
"learning_rate": 3.9695851456484805e-05,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14509449899196625,
"step": 1000,
"valid_targets_mean": 3186.6,
"valid_targets_min": 1045
},
{
"epoch": 1.0567823343848581,
"grad_norm": 0.571701063259449,
"learning_rate": 3.968667339795218e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15463784337043762,
"step": 1005,
"valid_targets_mean": 2025.8,
"valid_targets_min": 699
},
{
"epoch": 1.0620399579390116,
"grad_norm": 0.5766098090902164,
"learning_rate": 3.9677360003461246e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14297954738140106,
"step": 1010,
"valid_targets_mean": 1722.7,
"valid_targets_min": 612
},
{
"epoch": 1.0672975814931651,
"grad_norm": 0.4849722094117099,
"learning_rate": 3.966791133703691e-05,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15411697328090668,
"step": 1015,
"valid_targets_mean": 2515.6,
"valid_targets_min": 663
},
{
"epoch": 1.0725552050473186,
"grad_norm": 0.5469032580772873,
"learning_rate": 3.965832746363397e-05,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1780654788017273,
"step": 1020,
"valid_targets_mean": 2291.1,
"valid_targets_min": 721
},
{
"epoch": 1.077812828601472,
"grad_norm": 0.4579539501403899,
"learning_rate": 3.964860844913676e-05,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14604100584983826,
"step": 1025,
"valid_targets_mean": 2671.9,
"valid_targets_min": 784
},
{
"epoch": 1.0830704521556256,
"grad_norm": 0.45572251214805365,
"learning_rate": 3.9638754360358585e-05,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15409834682941437,
"step": 1030,
"valid_targets_mean": 2830.2,
"valid_targets_min": 754
},
{
"epoch": 1.088328075709779,
"grad_norm": 0.5630656693781774,
"learning_rate": 3.962876526504134e-05,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15992572903633118,
"step": 1035,
"valid_targets_mean": 2036.1,
"valid_targets_min": 560
},
{
"epoch": 1.0935856992639328,
"grad_norm": 0.623107144555327,
"learning_rate": 3.961864123185502e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15125590562820435,
"step": 1040,
"valid_targets_mean": 1604.8,
"valid_targets_min": 568
},
{
"epoch": 1.0988433228180863,
"grad_norm": 0.5078151422910574,
"learning_rate": 3.9608382330397265e-05,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.131246879696846,
"step": 1045,
"valid_targets_mean": 2134.9,
"valid_targets_min": 535
},
{
"epoch": 1.1041009463722398,
"grad_norm": 0.5419586812634338,
"learning_rate": 3.959798863119284e-05,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17790265381336212,
"step": 1050,
"valid_targets_mean": 2206.5,
"valid_targets_min": 635
},
{
"epoch": 1.1093585699263933,
"grad_norm": 0.42872401583713005,
"learning_rate": 3.9587460205693194e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11107654869556427,
"step": 1055,
"valid_targets_mean": 2629.1,
"valid_targets_min": 853
},
{
"epoch": 1.1146161934805467,
"grad_norm": 0.4812693528779981,
"learning_rate": 3.9576797126275945e-05,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15019483864307404,
"step": 1060,
"valid_targets_mean": 2700.4,
"valid_targets_min": 606
},
{
"epoch": 1.1198738170347002,
"grad_norm": 0.441257293011989,
"learning_rate": 3.9565999466244384e-05,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14144045114517212,
"step": 1065,
"valid_targets_mean": 2790.8,
"valid_targets_min": 804
},
{
"epoch": 1.125131440588854,
"grad_norm": 0.5990886150338299,
"learning_rate": 3.955506729982699e-05,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20643794536590576,
"step": 1070,
"valid_targets_mean": 1939.9,
"valid_targets_min": 572
},
{
"epoch": 1.1303890641430074,
"grad_norm": 0.49092829702841184,
"learning_rate": 3.9544000702176896e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16491742432117462,
"step": 1075,
"valid_targets_mean": 2971.6,
"valid_targets_min": 645
},
{
"epoch": 1.135646687697161,
"grad_norm": 0.595178819783364,
"learning_rate": 3.953279974937139e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17017915844917297,
"step": 1080,
"valid_targets_mean": 2023.4,
"valid_targets_min": 806
},
{
"epoch": 1.1409043112513144,
"grad_norm": 0.5445377847711285,
"learning_rate": 3.9521464518411356e-05,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1510683000087738,
"step": 1085,
"valid_targets_mean": 1929.0,
"valid_targets_min": 700
},
{
"epoch": 1.146161934805468,
"grad_norm": 0.4914239190639807,
"learning_rate": 3.950999508722082e-05,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14013531804084778,
"step": 1090,
"valid_targets_mean": 2581.4,
"valid_targets_min": 706
},
{
"epoch": 1.1514195583596214,
"grad_norm": 0.5449959755108419,
"learning_rate": 3.9498391534646325e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1524956226348877,
"step": 1095,
"valid_targets_mean": 2219.2,
"valid_targets_min": 660
},
{
"epoch": 1.1566771819137749,
"grad_norm": 0.45182769202454204,
"learning_rate": 3.948665394045646e-05,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13435500860214233,
"step": 1100,
"valid_targets_mean": 2639.7,
"valid_targets_min": 911
},
{
"epoch": 1.1619348054679284,
"grad_norm": 0.4960432951831983,
"learning_rate": 3.9474782385341255e-05,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14274129271507263,
"step": 1105,
"valid_targets_mean": 2265.6,
"valid_targets_min": 493
},
{
"epoch": 1.167192429022082,
"grad_norm": 0.4180641784123541,
"learning_rate": 3.9462776950911684e-05,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12849754095077515,
"step": 1110,
"valid_targets_mean": 2983.8,
"valid_targets_min": 893
},
{
"epoch": 1.1724500525762356,
"grad_norm": 0.5659956360723372,
"learning_rate": 3.9450637719699046e-05,
"loss": 0.1602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16112183034420013,
"step": 1115,
"valid_targets_mean": 1966.4,
"valid_targets_min": 612
},
{
"epoch": 1.177707676130389,
"grad_norm": 0.43420634299325733,
"learning_rate": 3.9438364775154436e-05,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11898370087146759,
"step": 1120,
"valid_targets_mean": 2543.1,
"valid_targets_min": 632
},
{
"epoch": 1.1829652996845426,
"grad_norm": 0.5586253038415747,
"learning_rate": 3.942595820164818e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16678744554519653,
"step": 1125,
"valid_targets_mean": 2127.7,
"valid_targets_min": 796
},
{
"epoch": 1.188222923238696,
"grad_norm": 0.4532370160765986,
"learning_rate": 3.94134180844692e-05,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13639366626739502,
"step": 1130,
"valid_targets_mean": 2682.5,
"valid_targets_min": 728
},
{
"epoch": 1.1934805467928495,
"grad_norm": 0.4478218887214927,
"learning_rate": 3.940074450982449e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11848050355911255,
"step": 1135,
"valid_targets_mean": 2773.8,
"valid_targets_min": 746
},
{
"epoch": 1.1987381703470033,
"grad_norm": 0.6019738194115937,
"learning_rate": 3.93879375648385e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19964569807052612,
"step": 1140,
"valid_targets_mean": 2764.6,
"valid_targets_min": 523
},
{
"epoch": 1.2039957939011567,
"grad_norm": 0.6086044259404536,
"learning_rate": 3.9374997337552496e-05,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15948590636253357,
"step": 1145,
"valid_targets_mean": 1668.8,
"valid_targets_min": 557
},
{
"epoch": 1.2092534174553102,
"grad_norm": 0.3925842189469582,
"learning_rate": 3.936192391692404e-05,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12689751386642456,
"step": 1150,
"valid_targets_mean": 2989.9,
"valid_targets_min": 910
},
{
"epoch": 1.2145110410094637,
"grad_norm": 0.5477920484644458,
"learning_rate": 3.9348717392826306e-05,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.176341250538826,
"step": 1155,
"valid_targets_mean": 2156.2,
"valid_targets_min": 753
},
{
"epoch": 1.2197686645636172,
"grad_norm": 0.523259215501025,
"learning_rate": 3.933537785604748e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15306803584098816,
"step": 1160,
"valid_targets_mean": 2222.0,
"valid_targets_min": 593
},
{
"epoch": 1.2250262881177707,
"grad_norm": 0.505929491947455,
"learning_rate": 3.932190539829018e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15849801898002625,
"step": 1165,
"valid_targets_mean": 2339.6,
"valid_targets_min": 851
},
{
"epoch": 1.2302839116719242,
"grad_norm": 0.60608527053194,
"learning_rate": 3.9308300112170735e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17203304171562195,
"step": 1170,
"valid_targets_mean": 1741.6,
"valid_targets_min": 684
},
{
"epoch": 1.235541535226078,
"grad_norm": 0.49371457829657883,
"learning_rate": 3.929456209121865e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14522910118103027,
"step": 1175,
"valid_targets_mean": 2302.8,
"valid_targets_min": 635
},
{
"epoch": 1.2407991587802314,
"grad_norm": 0.5143315716049925,
"learning_rate": 3.928069142987589e-05,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1450309455394745,
"step": 1180,
"valid_targets_mean": 2335.0,
"valid_targets_min": 707
},
{
"epoch": 1.2460567823343849,
"grad_norm": 0.6352431597142808,
"learning_rate": 3.926668822349625e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20668178796768188,
"step": 1185,
"valid_targets_mean": 1585.6,
"valid_targets_min": 734
},
{
"epoch": 1.2513144058885384,
"grad_norm": 0.5083380849868259,
"learning_rate": 3.925255256834474e-05,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1606515496969223,
"step": 1190,
"valid_targets_mean": 2409.8,
"valid_targets_min": 759
},
{
"epoch": 1.2565720294426919,
"grad_norm": 0.4040707060838454,
"learning_rate": 3.923828456159685e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11984424293041229,
"step": 1195,
"valid_targets_mean": 2802.8,
"valid_targets_min": 623
},
{
"epoch": 1.2618296529968454,
"grad_norm": 0.43208527395499524,
"learning_rate": 3.922388430133793e-05,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1419583261013031,
"step": 1200,
"valid_targets_mean": 2662.6,
"valid_targets_min": 1125
},
{
"epoch": 1.267087276550999,
"grad_norm": 0.5543534851610293,
"learning_rate": 3.9209351886562535e-05,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17189328372478485,
"step": 1205,
"valid_targets_mean": 1997.5,
"valid_targets_min": 457
},
{
"epoch": 1.2723449001051526,
"grad_norm": 0.46557909010572596,
"learning_rate": 3.919468741717367e-05,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1330093890428543,
"step": 1210,
"valid_targets_mean": 2614.4,
"valid_targets_min": 994
},
{
"epoch": 1.277602523659306,
"grad_norm": 0.48752943215991795,
"learning_rate": 3.9179890993982186e-05,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14586924016475677,
"step": 1215,
"valid_targets_mean": 2471.2,
"valid_targets_min": 819
},
{
"epoch": 1.2828601472134595,
"grad_norm": 0.5652684979113541,
"learning_rate": 3.916496271870603e-05,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15604804456233978,
"step": 1220,
"valid_targets_mean": 1788.2,
"valid_targets_min": 596
},
{
"epoch": 1.288117770767613,
"grad_norm": 0.5497344054874691,
"learning_rate": 3.914990269396957e-05,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13384535908699036,
"step": 1225,
"valid_targets_mean": 2010.0,
"valid_targets_min": 776
},
{
"epoch": 1.2933753943217665,
"grad_norm": 0.48779520430533513,
"learning_rate": 3.913471102330288e-05,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1322687268257141,
"step": 1230,
"valid_targets_mean": 2307.1,
"valid_targets_min": 731
},
{
"epoch": 1.29863301787592,
"grad_norm": 0.4463700279712265,
"learning_rate": 3.911938781114105e-05,
"loss": 0.1371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1255062222480774,
"step": 1235,
"valid_targets_mean": 2305.5,
"valid_targets_min": 534
},
{
"epoch": 1.3038906414300735,
"grad_norm": 0.6614464423156223,
"learning_rate": 3.910393316282345e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21906360983848572,
"step": 1240,
"valid_targets_mean": 1905.9,
"valid_targets_min": 485
},
{
"epoch": 1.3091482649842272,
"grad_norm": 0.5049346086179223,
"learning_rate": 3.9088347184592974e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14003358781337738,
"step": 1245,
"valid_targets_mean": 2203.8,
"valid_targets_min": 564
},
{
"epoch": 1.3144058885383807,
"grad_norm": 0.4343623017250803,
"learning_rate": 3.907262998359539e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13102751970291138,
"step": 1250,
"valid_targets_mean": 2605.8,
"valid_targets_min": 773
},
{
"epoch": 1.3196635120925342,
"grad_norm": 0.5209468839527972,
"learning_rate": 3.905678166787852e-05,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16362372040748596,
"step": 1255,
"valid_targets_mean": 2132.3,
"valid_targets_min": 482
},
{
"epoch": 1.3249211356466877,
"grad_norm": 0.492330059639802,
"learning_rate": 3.9040802346391555e-05,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1356244832277298,
"step": 1260,
"valid_targets_mean": 1977.9,
"valid_targets_min": 779
},
{
"epoch": 1.3301787592008412,
"grad_norm": 0.41651714887501695,
"learning_rate": 3.902469212898427e-05,
"loss": 0.1412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11109089106321335,
"step": 1265,
"valid_targets_mean": 2564.5,
"valid_targets_min": 742
},
{
"epoch": 1.3354363827549949,
"grad_norm": 0.5895499209659201,
"learning_rate": 3.900845112640631e-05,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1631077229976654,
"step": 1270,
"valid_targets_mean": 2024.9,
"valid_targets_min": 629
},
{
"epoch": 1.3406940063091484,
"grad_norm": 0.5477993349332434,
"learning_rate": 3.8992079450306355e-05,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1507028192281723,
"step": 1275,
"valid_targets_mean": 2162.8,
"valid_targets_min": 650
},
{
"epoch": 1.3459516298633019,
"grad_norm": 0.5121261948599832,
"learning_rate": 3.897557721323145e-05,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17162734270095825,
"step": 1280,
"valid_targets_mean": 2294.5,
"valid_targets_min": 855
},
{
"epoch": 1.3512092534174553,
"grad_norm": 0.4511211509373639,
"learning_rate": 3.895894452862614e-05,
"loss": 0.1234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13311448693275452,
"step": 1285,
"valid_targets_mean": 2522.4,
"valid_targets_min": 795
},
{
"epoch": 1.3564668769716088,
"grad_norm": 0.5006143250460527,
"learning_rate": 3.894218151083176e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20667588710784912,
"step": 1290,
"valid_targets_mean": 2397.5,
"valid_targets_min": 824
},
{
"epoch": 1.3617245005257623,
"grad_norm": 0.7061602708002128,
"learning_rate": 3.892528827508562e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19911471009254456,
"step": 1295,
"valid_targets_mean": 1638.8,
"valid_targets_min": 665
},
{
"epoch": 1.3669821240799158,
"grad_norm": 0.5508593363955756,
"learning_rate": 3.890826493752018e-05,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17751124501228333,
"step": 1300,
"valid_targets_mean": 2020.2,
"valid_targets_min": 623
},
{
"epoch": 1.3722397476340693,
"grad_norm": 0.5755999421111012,
"learning_rate": 3.8891111615162314e-05,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15987738966941833,
"step": 1305,
"valid_targets_mean": 1651.8,
"valid_targets_min": 458
},
{
"epoch": 1.3774973711882228,
"grad_norm": 0.5039376806620596,
"learning_rate": 3.8873828425932486e-05,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12485198676586151,
"step": 1310,
"valid_targets_mean": 1892.3,
"valid_targets_min": 598
},
{
"epoch": 1.3827549947423765,
"grad_norm": 0.6010676327777069,
"learning_rate": 3.8856415488643885e-05,
"loss": 0.1371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15700513124465942,
"step": 1315,
"valid_targets_mean": 2039.7,
"valid_targets_min": 585
},
{
"epoch": 1.38801261829653,
"grad_norm": 0.49489475140621403,
"learning_rate": 3.88388729230017e-05,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13475683331489563,
"step": 1320,
"valid_targets_mean": 2251.7,
"valid_targets_min": 649
},
{
"epoch": 1.3932702418506835,
"grad_norm": 0.4579000074165094,
"learning_rate": 3.8821200849602215e-05,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13412441313266754,
"step": 1325,
"valid_targets_mean": 2511.9,
"valid_targets_min": 492
},
{
"epoch": 1.398527865404837,
"grad_norm": 0.5554232332296529,
"learning_rate": 3.880339938993204e-05,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17779545485973358,
"step": 1330,
"valid_targets_mean": 2224.8,
"valid_targets_min": 727
},
{
"epoch": 1.4037854889589905,
"grad_norm": 0.4786923955032469,
"learning_rate": 3.878546866636724e-05,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1452464759349823,
"step": 1335,
"valid_targets_mean": 2291.9,
"valid_targets_min": 553
},
{
"epoch": 1.4090431125131442,
"grad_norm": 0.43106947675657575,
"learning_rate": 3.876740880217248e-05,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11492572724819183,
"step": 1340,
"valid_targets_mean": 2898.8,
"valid_targets_min": 639
},
{
"epoch": 1.4143007360672977,
"grad_norm": 0.5665214216964269,
"learning_rate": 3.874921992150026e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1824207901954651,
"step": 1345,
"valid_targets_mean": 2328.7,
"valid_targets_min": 787
},
{
"epoch": 1.4195583596214512,
"grad_norm": 0.6373178617906868,
"learning_rate": 3.873090214938994e-05,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14647290110588074,
"step": 1350,
"valid_targets_mean": 1876.3,
"valid_targets_min": 516
},
{
"epoch": 1.4248159831756047,
"grad_norm": 0.48330050653953466,
"learning_rate": 3.871245561176698e-05,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13250577449798584,
"step": 1355,
"valid_targets_mean": 2409.4,
"valid_targets_min": 711
},
{
"epoch": 1.4300736067297581,
"grad_norm": 0.48702556306514433,
"learning_rate": 3.869388043544204e-05,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16086526215076447,
"step": 1360,
"valid_targets_mean": 2460.9,
"valid_targets_min": 564
},
{
"epoch": 1.4353312302839116,
"grad_norm": 0.45568931764300974,
"learning_rate": 3.8675176748110076e-05,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12848922610282898,
"step": 1365,
"valid_targets_mean": 2733.8,
"valid_targets_min": 1002
},
{
"epoch": 1.4405888538380651,
"grad_norm": 0.4233365491022964,
"learning_rate": 3.865634467834953e-05,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11810208857059479,
"step": 1370,
"valid_targets_mean": 2603.2,
"valid_targets_min": 757
},
{
"epoch": 1.4458464773922186,
"grad_norm": 0.6425781993163098,
"learning_rate": 3.863738435562139e-05,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15976637601852417,
"step": 1375,
"valid_targets_mean": 1802.4,
"valid_targets_min": 764
},
{
"epoch": 1.4511041009463723,
"grad_norm": 0.47116356563697187,
"learning_rate": 3.8618295910268316e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15315991640090942,
"step": 1380,
"valid_targets_mean": 2527.4,
"valid_targets_min": 694
},
{
"epoch": 1.4563617245005258,
"grad_norm": 0.42654991784477303,
"learning_rate": 3.859907947351374e-05,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1342701017856598,
"step": 1385,
"valid_targets_mean": 2513.1,
"valid_targets_min": 727
},
{
"epoch": 1.4616193480546793,
"grad_norm": 0.5811636897559682,
"learning_rate": 3.8579735177460994e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17021822929382324,
"step": 1390,
"valid_targets_mean": 2342.8,
"valid_targets_min": 877
},
{
"epoch": 1.4668769716088328,
"grad_norm": 0.5528552217400138,
"learning_rate": 3.856026315509236e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18569661676883698,
"step": 1395,
"valid_targets_mean": 2027.5,
"valid_targets_min": 661
},
{
"epoch": 1.4721345951629863,
"grad_norm": 0.44820836371016154,
"learning_rate": 3.8540663540268175e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14447733759880066,
"step": 1400,
"valid_targets_mean": 2271.6,
"valid_targets_min": 504
},
{
"epoch": 1.4773922187171398,
"grad_norm": 0.5195966640549234,
"learning_rate": 3.852093646772592e-05,
"loss": 0.137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14088033139705658,
"step": 1405,
"valid_targets_mean": 2280.4,
"valid_targets_min": 631
},
{
"epoch": 1.4826498422712935,
"grad_norm": 0.511140988879075,
"learning_rate": 3.850108207307927e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15610060095787048,
"step": 1410,
"valid_targets_mean": 2253.1,
"valid_targets_min": 1041
},
{
"epoch": 1.487907465825447,
"grad_norm": 0.5626239953999536,
"learning_rate": 3.848110049281719e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14686822891235352,
"step": 1415,
"valid_targets_mean": 1738.8,
"valid_targets_min": 724
},
{
"epoch": 1.4931650893796005,
"grad_norm": 0.45419612637605666,
"learning_rate": 3.846099186430297e-05,
"loss": 0.1436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1240888386964798,
"step": 1420,
"valid_targets_mean": 2130.2,
"valid_targets_min": 679
},
{
"epoch": 1.498422712933754,
"grad_norm": 0.4351700229892183,
"learning_rate": 3.8440756325773296e-05,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12879678606987,
"step": 1425,
"valid_targets_mean": 2529.8,
"valid_targets_min": 542
},
{
"epoch": 1.5036803364879074,
"grad_norm": 0.5260099569797893,
"learning_rate": 3.84203940163373e-05,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15119123458862305,
"step": 1430,
"valid_targets_mean": 2252.4,
"valid_targets_min": 764
},
{
"epoch": 1.508937960042061,
"grad_norm": 0.702275732972416,
"learning_rate": 3.83999050759756e-05,
"loss": 0.1698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20185378193855286,
"step": 1435,
"valid_targets_mean": 1654.4,
"valid_targets_min": 543
},
{
"epoch": 1.5141955835962144,
"grad_norm": 0.503833869356007,
"learning_rate": 3.837928964553933e-05,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14579704403877258,
"step": 1440,
"valid_targets_mean": 2116.2,
"valid_targets_min": 802
},
{
"epoch": 1.519453207150368,
"grad_norm": 0.5200791456643497,
"learning_rate": 3.835854786674918e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1617119014263153,
"step": 1445,
"valid_targets_mean": 2073.2,
"valid_targets_min": 714
},
{
"epoch": 1.5247108307045214,
"grad_norm": 0.5470358551289737,
"learning_rate": 3.8337679882194443e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1686500757932663,
"step": 1450,
"valid_targets_mean": 1898.4,
"valid_targets_min": 605
},
{
"epoch": 1.5299684542586751,
"grad_norm": 0.5225253746397357,
"learning_rate": 3.8316685835331984e-05,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1774263083934784,
"step": 1455,
"valid_targets_mean": 2032.9,
"valid_targets_min": 484
},
{
"epoch": 1.5352260778128286,
"grad_norm": 0.43300310632000233,
"learning_rate": 3.8295565870485295e-05,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12071298062801361,
"step": 1460,
"valid_targets_mean": 2565.9,
"valid_targets_min": 810
},
{
"epoch": 1.540483701366982,
"grad_norm": 0.5393950203820551,
"learning_rate": 3.827432013284349e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1655823290348053,
"step": 1465,
"valid_targets_mean": 2102.7,
"valid_targets_min": 701
},
{
"epoch": 1.5457413249211358,
"grad_norm": 0.4757485508866357,
"learning_rate": 3.825294876846031e-05,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14885063469409943,
"step": 1470,
"valid_targets_mean": 2354.3,
"valid_targets_min": 631
},
{
"epoch": 1.5509989484752893,
"grad_norm": 0.5416280302684693,
"learning_rate": 3.823145192425313e-05,
"loss": 0.1396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13655738532543182,
"step": 1475,
"valid_targets_mean": 2512.6,
"valid_targets_min": 622
},
{
"epoch": 1.5562565720294428,
"grad_norm": 0.6229583310323635,
"learning_rate": 3.8209829748001894e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17115293443202972,
"step": 1480,
"valid_targets_mean": 1718.1,
"valid_targets_min": 710
},
{
"epoch": 1.5615141955835963,
"grad_norm": 0.519409879750345,
"learning_rate": 3.8188082388348186e-05,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17206339538097382,
"step": 1485,
"valid_targets_mean": 2301.4,
"valid_targets_min": 760
},
{
"epoch": 1.5667718191377498,
"grad_norm": 0.46667895425451783,
"learning_rate": 3.816620999479413e-05,
"loss": 0.162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12790817022323608,
"step": 1490,
"valid_targets_mean": 2259.9,
"valid_targets_min": 492
},
{
"epoch": 1.5720294426919033,
"grad_norm": 0.5220018902821102,
"learning_rate": 3.8144212717701424e-05,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16024719178676605,
"step": 1495,
"valid_targets_mean": 2243.8,
"valid_targets_min": 937
},
{
"epoch": 1.5772870662460567,
"grad_norm": 0.46071983556767643,
"learning_rate": 3.812209070829025e-05,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12235837429761887,
"step": 1500,
"valid_targets_mean": 2669.8,
"valid_targets_min": 656
},
{
"epoch": 1.5825446898002102,
"grad_norm": 0.559304595141797,
"learning_rate": 3.809984411863828e-05,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1550862044095993,
"step": 1505,
"valid_targets_mean": 1869.9,
"valid_targets_min": 673
},
{
"epoch": 1.5878023133543637,
"grad_norm": 0.6225497021218658,
"learning_rate": 3.80774731016796e-05,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1890285164117813,
"step": 1510,
"valid_targets_mean": 1925.2,
"valid_targets_min": 611
},
{
"epoch": 1.5930599369085172,
"grad_norm": 0.4436472576665815,
"learning_rate": 3.805497781120369e-05,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13567166030406952,
"step": 1515,
"valid_targets_mean": 2568.1,
"valid_targets_min": 845
},
{
"epoch": 1.598317560462671,
"grad_norm": 0.7038720866935955,
"learning_rate": 3.8032358401854315e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2125886231660843,
"step": 1520,
"valid_targets_mean": 1661.3,
"valid_targets_min": 680
},
{
"epoch": 1.6035751840168244,
"grad_norm": 0.4228259736234144,
"learning_rate": 3.800961502912854e-05,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12922674417495728,
"step": 1525,
"valid_targets_mean": 2306.6,
"valid_targets_min": 654
},
{
"epoch": 1.608832807570978,
"grad_norm": 0.5484483778701249,
"learning_rate": 3.798674784937557e-05,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15941087901592255,
"step": 1530,
"valid_targets_mean": 2061.1,
"valid_targets_min": 635
},
{
"epoch": 1.6140904311251314,
"grad_norm": 0.4770810525091347,
"learning_rate": 3.7963757019795756e-05,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12932509183883667,
"step": 1535,
"valid_targets_mean": 2397.7,
"valid_targets_min": 615
},
{
"epoch": 1.619348054679285,
"grad_norm": 0.5004936276439662,
"learning_rate": 3.794064269843946e-05,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14063172042369843,
"step": 1540,
"valid_targets_mean": 2006.1,
"valid_targets_min": 814
},
{
"epoch": 1.6246056782334386,
"grad_norm": 0.5097411431283284,
"learning_rate": 3.791740504420599e-05,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.145649254322052,
"step": 1545,
"valid_targets_mean": 1994.4,
"valid_targets_min": 782
},
{
"epoch": 1.629863301787592,
"grad_norm": 0.40331204148126387,
"learning_rate": 3.789404421684251e-05,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12102833390235901,
"step": 1550,
"valid_targets_mean": 2933.8,
"valid_targets_min": 705
},
{
"epoch": 1.6351209253417456,
"grad_norm": 0.3753680666356623,
"learning_rate": 3.787056037694293e-05,
"loss": 0.1428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11178039014339447,
"step": 1555,
"valid_targets_mean": 2994.1,
"valid_targets_min": 950
},
{
"epoch": 1.640378548895899,
"grad_norm": 0.3784757429266007,
"learning_rate": 3.784695368594682e-05,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11730167269706726,
"step": 1560,
"valid_targets_mean": 3059.6,
"valid_targets_min": 698
},
{
"epoch": 1.6456361724500526,
"grad_norm": 0.46791378953283935,
"learning_rate": 3.782322430613828e-05,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1434706747531891,
"step": 1565,
"valid_targets_mean": 2098.8,
"valid_targets_min": 549
},
{
"epoch": 1.650893796004206,
"grad_norm": 0.5131913623298254,
"learning_rate": 3.779937240064484e-05,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17528071999549866,
"step": 1570,
"valid_targets_mean": 2479.7,
"valid_targets_min": 734
},
{
"epoch": 1.6561514195583595,
"grad_norm": 0.4787676239528799,
"learning_rate": 3.777539813343634e-05,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1525578796863556,
"step": 1575,
"valid_targets_mean": 2419.9,
"valid_targets_min": 655
},
{
"epoch": 1.661409043112513,
"grad_norm": 0.5097454193957103,
"learning_rate": 3.7751301669323776e-05,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1515212506055832,
"step": 1580,
"valid_targets_mean": 2156.2,
"valid_targets_min": 837
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.44848135346744805,
"learning_rate": 3.772708317395818e-05,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15940351784229279,
"step": 1585,
"valid_targets_mean": 2610.3,
"valid_targets_min": 617
},
{
"epoch": 1.6719242902208202,
"grad_norm": 0.4809853729383809,
"learning_rate": 3.770274281382952e-05,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1557113528251648,
"step": 1590,
"valid_targets_mean": 2268.4,
"valid_targets_min": 514
},
{
"epoch": 1.6771819137749737,
"grad_norm": 0.546072311066789,
"learning_rate": 3.767828075626551e-05,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1509373039007187,
"step": 1595,
"valid_targets_mean": 1996.9,
"valid_targets_min": 825
},
{
"epoch": 1.6824395373291272,
"grad_norm": 1.1263729491732608,
"learning_rate": 3.7653697169430456e-05,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1749960035085678,
"step": 1600,
"valid_targets_mean": 1937.6,
"valid_targets_min": 707
},
{
"epoch": 1.687697160883281,
"grad_norm": 0.5565429344508764,
"learning_rate": 3.762899222232413e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15961700677871704,
"step": 1605,
"valid_targets_mean": 1760.7,
"valid_targets_min": 740
},
{
"epoch": 1.6929547844374344,
"grad_norm": 0.4796990499082493,
"learning_rate": 3.760416608478061e-05,
"loss": 0.143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15107330679893494,
"step": 1610,
"valid_targets_mean": 2156.3,
"valid_targets_min": 760
},
{
"epoch": 1.698212407991588,
"grad_norm": 0.453284399681182,
"learning_rate": 3.7579218927467044e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15035119652748108,
"step": 1615,
"valid_targets_mean": 2370.3,
"valid_targets_min": 858
},
{
"epoch": 1.7034700315457414,
"grad_norm": 0.5609207278755044,
"learning_rate": 3.7554150921882596e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1658046543598175,
"step": 1620,
"valid_targets_mean": 2289.4,
"valid_targets_min": 594
},
{
"epoch": 1.7087276550998949,
"grad_norm": 0.489528722517424,
"learning_rate": 3.752896224035716e-05,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14376391470432281,
"step": 1625,
"valid_targets_mean": 2270.4,
"valid_targets_min": 447
},
{
"epoch": 1.7139852786540484,
"grad_norm": 0.5757880157204146,
"learning_rate": 3.750365305605024e-05,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15369608998298645,
"step": 1630,
"valid_targets_mean": 1842.8,
"valid_targets_min": 520
},
{
"epoch": 1.7192429022082019,
"grad_norm": 0.6199804316674978,
"learning_rate": 3.7478223542949704e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23520562052726746,
"step": 1635,
"valid_targets_mean": 1732.6,
"valid_targets_min": 544
},
{
"epoch": 1.7245005257623554,
"grad_norm": 0.6234013940743057,
"learning_rate": 3.745267387587065e-05,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14816375076770782,
"step": 1640,
"valid_targets_mean": 2256.4,
"valid_targets_min": 784
},
{
"epoch": 1.7297581493165088,
"grad_norm": 0.39606806833065256,
"learning_rate": 3.742700423045416e-05,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11933799833059311,
"step": 1645,
"valid_targets_mean": 2799.9,
"valid_targets_min": 790
},
{
"epoch": 1.7350157728706623,
"grad_norm": 0.41853999709419526,
"learning_rate": 3.7401214783166116e-05,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12586048245429993,
"step": 1650,
"valid_targets_mean": 2299.3,
"valid_targets_min": 449
},
{
"epoch": 1.7402733964248158,
"grad_norm": 0.4665163153226736,
"learning_rate": 3.737530571129596e-05,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1512151062488556,
"step": 1655,
"valid_targets_mean": 2344.2,
"valid_targets_min": 711
},
{
"epoch": 1.7455310199789695,
"grad_norm": 0.4972080448544214,
"learning_rate": 3.734927719295551e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14359167218208313,
"step": 1660,
"valid_targets_mean": 2295.5,
"valid_targets_min": 933
},
{
"epoch": 1.750788643533123,
"grad_norm": 0.43461253492401125,
"learning_rate": 3.732312940707772e-05,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17093902826309204,
"step": 1665,
"valid_targets_mean": 2810.1,
"valid_targets_min": 664
},
{
"epoch": 1.7560462670872765,
"grad_norm": 0.48535144756133497,
"learning_rate": 3.729686253341543e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13613176345825195,
"step": 1670,
"valid_targets_mean": 1979.6,
"valid_targets_min": 714
},
{
"epoch": 1.7613038906414302,
"grad_norm": 0.4781604460296353,
"learning_rate": 3.7270476752540163e-05,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1583690345287323,
"step": 1675,
"valid_targets_mean": 2193.4,
"valid_targets_min": 720
},
{
"epoch": 1.7665615141955837,
"grad_norm": 0.4636953366985517,
"learning_rate": 3.724397224584086e-05,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1320091038942337,
"step": 1680,
"valid_targets_mean": 2121.1,
"valid_targets_min": 567
},
{
"epoch": 1.7718191377497372,
"grad_norm": 0.45235219741823857,
"learning_rate": 3.7217349195522656e-05,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1375328004360199,
"step": 1685,
"valid_targets_mean": 2287.0,
"valid_targets_min": 752
},
{
"epoch": 1.7770767613038907,
"grad_norm": 0.5279603918969447,
"learning_rate": 3.7190607784605604e-05,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14660730957984924,
"step": 1690,
"valid_targets_mean": 2240.7,
"valid_targets_min": 798
},
{
"epoch": 1.7823343848580442,
"grad_norm": 0.41329114609770984,
"learning_rate": 3.716374819692341e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15471050143241882,
"step": 1695,
"valid_targets_mean": 2950.4,
"valid_targets_min": 837
},
{
"epoch": 1.7875920084121977,
"grad_norm": 0.48618523616643183,
"learning_rate": 3.713677061712223e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14447468519210815,
"step": 1700,
"valid_targets_mean": 2012.0,
"valid_targets_min": 638
},
{
"epoch": 1.7928496319663512,
"grad_norm": 0.4507089705375839,
"learning_rate": 3.7109675230659316e-05,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15283942222595215,
"step": 1705,
"valid_targets_mean": 2564.6,
"valid_targets_min": 622
},
{
"epoch": 1.7981072555205047,
"grad_norm": 0.7337028383217412,
"learning_rate": 3.7082462223801784e-05,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1652950644493103,
"step": 1710,
"valid_targets_mean": 1482.8,
"valid_targets_min": 525
},
{
"epoch": 1.8033648790746581,
"grad_norm": 0.4112594232596541,
"learning_rate": 3.7055131783625364e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14620056748390198,
"step": 1715,
"valid_targets_mean": 3001.4,
"valid_targets_min": 847
},
{
"epoch": 1.8086225026288116,
"grad_norm": 0.4449486795859238,
"learning_rate": 3.702768409801304e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15046781301498413,
"step": 1720,
"valid_targets_mean": 2618.0,
"valid_targets_min": 798
},
{
"epoch": 1.8138801261829653,
"grad_norm": 0.506351232875529,
"learning_rate": 3.700011935565384e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13286535441875458,
"step": 1725,
"valid_targets_mean": 2428.1,
"valid_targets_min": 546
},
{
"epoch": 1.8191377497371188,
"grad_norm": 0.48214377667694075,
"learning_rate": 3.697243774604145e-05,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12532919645309448,
"step": 1730,
"valid_targets_mean": 2073.8,
"valid_targets_min": 759
},
{
"epoch": 1.8243953732912723,
"grad_norm": 0.4955432033829991,
"learning_rate": 3.6944639459473e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.133253276348114,
"step": 1735,
"valid_targets_mean": 2046.4,
"valid_targets_min": 805
},
{
"epoch": 1.8296529968454258,
"grad_norm": 0.4714543593923112,
"learning_rate": 3.69167246870477e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15946990251541138,
"step": 1740,
"valid_targets_mean": 2243.0,
"valid_targets_min": 646
},
{
"epoch": 1.8349106203995795,
"grad_norm": 0.4606924941630629,
"learning_rate": 3.6888693620665546e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1744510531425476,
"step": 1745,
"valid_targets_mean": 2670.9,
"valid_targets_min": 725
},
{
"epoch": 1.840168243953733,
"grad_norm": 0.5201006931571852,
"learning_rate": 3.686054645302598e-05,
"loss": 0.1414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1766928732395172,
"step": 1750,
"valid_targets_mean": 2316.8,
"valid_targets_min": 1075
},
{
"epoch": 1.8454258675078865,
"grad_norm": 0.4129815771962509,
"learning_rate": 3.6832283377626603e-05,
"loss": 0.1373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13509492576122284,
"step": 1755,
"valid_targets_mean": 2487.6,
"valid_targets_min": 850
},
{
"epoch": 1.85068349106204,
"grad_norm": 0.5756252784309024,
"learning_rate": 3.680390458876182e-05,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17633795738220215,
"step": 1760,
"valid_targets_mean": 1864.7,
"valid_targets_min": 511
},
{
"epoch": 1.8559411146161935,
"grad_norm": 0.44562070679854765,
"learning_rate": 3.67754102815215e-05,
"loss": 0.1357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1346631944179535,
"step": 1765,
"valid_targets_mean": 2271.6,
"valid_targets_min": 770
},
{
"epoch": 1.861198738170347,
"grad_norm": 0.4161437501373808,
"learning_rate": 3.6746800651789636e-05,
"loss": 0.1513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12186533212661743,
"step": 1770,
"valid_targets_mean": 2435.9,
"valid_targets_min": 810
},
{
"epoch": 1.8664563617245005,
"grad_norm": 0.5775706994653773,
"learning_rate": 3.671807589624302e-05,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1577707976102829,
"step": 1775,
"valid_targets_mean": 1631.6,
"valid_targets_min": 524
},
{
"epoch": 1.871713985278654,
"grad_norm": 0.48258766681087256,
"learning_rate": 3.6689236212349865e-05,
"loss": 0.1356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15474461019039154,
"step": 1780,
"valid_targets_mean": 2626.8,
"valid_targets_min": 727
},
{
"epoch": 1.8769716088328074,
"grad_norm": 0.6044542061499013,
"learning_rate": 3.6660281798368485e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17260998487472534,
"step": 1785,
"valid_targets_mean": 1687.1,
"valid_targets_min": 676
},
{
"epoch": 1.882229232386961,
"grad_norm": 0.4151710265798618,
"learning_rate": 3.663121285334586e-05,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14284290373325348,
"step": 1790,
"valid_targets_mean": 2609.9,
"valid_targets_min": 665
},
{
"epoch": 1.8874868559411146,
"grad_norm": 0.5325140969298698,
"learning_rate": 3.660202957711635e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16473495960235596,
"step": 1795,
"valid_targets_mean": 2058.4,
"valid_targets_min": 668
},
{
"epoch": 1.8927444794952681,
"grad_norm": 0.5215486027809936,
"learning_rate": 3.657273217030026e-05,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19604501128196716,
"step": 1800,
"valid_targets_mean": 2170.8,
"valid_targets_min": 486
},
{
"epoch": 1.8980021030494216,
"grad_norm": 1.9357247443695407,
"learning_rate": 3.654332083430252e-05,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10836437344551086,
"step": 1805,
"valid_targets_mean": 2348.1,
"valid_targets_min": 635
},
{
"epoch": 1.9032597266035753,
"grad_norm": 0.5001717909983574,
"learning_rate": 3.651379577131121e-05,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1701362431049347,
"step": 1810,
"valid_targets_mean": 2189.1,
"valid_targets_min": 635
},
{
"epoch": 1.9085173501577288,
"grad_norm": 0.4480450755045227,
"learning_rate": 3.648415718429629e-05,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15512478351593018,
"step": 1815,
"valid_targets_mean": 2763.6,
"valid_targets_min": 703
},
{
"epoch": 1.9137749737118823,
"grad_norm": 0.4520564240954849,
"learning_rate": 3.6454405277008087e-05,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14041677117347717,
"step": 1820,
"valid_targets_mean": 2520.4,
"valid_targets_min": 845
},
{
"epoch": 1.9190325972660358,
"grad_norm": 0.4069217501261934,
"learning_rate": 3.6424540253975985e-05,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1304551661014557,
"step": 1825,
"valid_targets_mean": 2595.4,
"valid_targets_min": 647
},
{
"epoch": 1.9242902208201893,
"grad_norm": 0.5475187771011519,
"learning_rate": 3.6394562320506955e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1664676070213318,
"step": 1830,
"valid_targets_mean": 2688.9,
"valid_targets_min": 909
},
{
"epoch": 1.9295478443743428,
"grad_norm": 0.5416559309008887,
"learning_rate": 3.636447168268419e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1847115308046341,
"step": 1835,
"valid_targets_mean": 2223.1,
"valid_targets_min": 554
},
{
"epoch": 1.9348054679284963,
"grad_norm": 0.45198125327378663,
"learning_rate": 3.633426854736566e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15288934111595154,
"step": 1840,
"valid_targets_mean": 2307.6,
"valid_targets_min": 689
},
{
"epoch": 1.9400630914826498,
"grad_norm": 0.49718358102815036,
"learning_rate": 3.6303953122182695e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17160025238990784,
"step": 1845,
"valid_targets_mean": 2595.4,
"valid_targets_min": 745
},
{
"epoch": 1.9453207150368033,
"grad_norm": 0.5932074393640244,
"learning_rate": 3.6273525615538564e-05,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17138652503490448,
"step": 1850,
"valid_targets_mean": 1705.4,
"valid_targets_min": 896
},
{
"epoch": 1.9505783385909568,
"grad_norm": 0.4838557067188173,
"learning_rate": 3.6242986236607046e-05,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1822124868631363,
"step": 1855,
"valid_targets_mean": 2238.8,
"valid_targets_min": 928
},
{
"epoch": 1.9558359621451105,
"grad_norm": 0.5008302577532774,
"learning_rate": 3.6212335195330976e-05,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17570628225803375,
"step": 1860,
"valid_targets_mean": 2048.1,
"valid_targets_min": 720
},
{
"epoch": 1.961093585699264,
"grad_norm": 0.4096575459462327,
"learning_rate": 3.618157270242082e-05,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12385016679763794,
"step": 1865,
"valid_targets_mean": 2401.0,
"valid_targets_min": 656
},
{
"epoch": 1.9663512092534174,
"grad_norm": 0.4354302816924471,
"learning_rate": 3.615069896935321e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13620790839195251,
"step": 1870,
"valid_targets_mean": 2298.9,
"valid_targets_min": 705
},
{
"epoch": 1.971608832807571,
"grad_norm": 0.4422162817001818,
"learning_rate": 3.6119714208369506e-05,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1441817283630371,
"step": 1875,
"valid_targets_mean": 2163.5,
"valid_targets_min": 842
},
{
"epoch": 1.9768664563617246,
"grad_norm": 0.38037559250128045,
"learning_rate": 3.608861863247432e-05,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.125374436378479,
"step": 1880,
"valid_targets_mean": 2816.2,
"valid_targets_min": 1085
},
{
"epoch": 1.9821240799158781,
"grad_norm": 0.4279345920030894,
"learning_rate": 3.6057412455434075e-05,
"loss": 0.1292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1381811499595642,
"step": 1885,
"valid_targets_mean": 2501.2,
"valid_targets_min": 775
},
{
"epoch": 1.9873817034700316,
"grad_norm": 0.4242817265694865,
"learning_rate": 3.6026095891775494e-05,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1506459265947342,
"step": 1890,
"valid_targets_mean": 2550.9,
"valid_targets_min": 826
},
{
"epoch": 1.9926393270241851,
"grad_norm": 0.5151468554817712,
"learning_rate": 3.5994669156784184e-05,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16714484989643097,
"step": 1895,
"valid_targets_mean": 2281.9,
"valid_targets_min": 705
},
{
"epoch": 1.9978969505783386,
"grad_norm": 0.41782599593456177,
"learning_rate": 3.5963132466503107e-05,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12775075435638428,
"step": 1900,
"valid_targets_mean": 2439.4,
"valid_targets_min": 738
},
{
"epoch": 2.003154574132492,
"grad_norm": 0.4165370010370444,
"learning_rate": 3.593148603773111e-05,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11981405317783356,
"step": 1905,
"valid_targets_mean": 2356.5,
"valid_targets_min": 662
},
{
"epoch": 2.0084121976866456,
"grad_norm": 0.4882073231063211,
"learning_rate": 3.5899730088021455e-05,
"loss": 0.1319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12051345407962799,
"step": 1910,
"valid_targets_mean": 2324.1,
"valid_targets_min": 796
},
{
"epoch": 2.013669821240799,
"grad_norm": 0.5074815735614124,
"learning_rate": 3.586786483568028e-05,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16859525442123413,
"step": 1915,
"valid_targets_mean": 2066.3,
"valid_targets_min": 772
},
{
"epoch": 2.0189274447949526,
"grad_norm": 0.42950139192766656,
"learning_rate": 3.583589049976514e-05,
"loss": 0.1213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11452405154705048,
"step": 1920,
"valid_targets_mean": 2316.4,
"valid_targets_min": 663
},
{
"epoch": 2.024185068349106,
"grad_norm": 0.38708359130884057,
"learning_rate": 3.580380730008348e-05,
"loss": 0.1227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08783847093582153,
"step": 1925,
"valid_targets_mean": 2917.4,
"valid_targets_min": 605
},
{
"epoch": 2.0294426919032595,
"grad_norm": 0.4962443253703049,
"learning_rate": 3.577161545719113e-05,
"loss": 0.1319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1337311565876007,
"step": 1930,
"valid_targets_mean": 2157.9,
"valid_targets_min": 809
},
{
"epoch": 2.034700315457413,
"grad_norm": 0.45862104770317996,
"learning_rate": 3.573931519239079e-05,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1386127471923828,
"step": 1935,
"valid_targets_mean": 2262.4,
"valid_targets_min": 820
},
{
"epoch": 2.039957939011567,
"grad_norm": 0.5549444717886148,
"learning_rate": 3.5706906727730496e-05,
"loss": 0.1296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13468411564826965,
"step": 1940,
"valid_targets_mean": 1934.9,
"valid_targets_min": 950
},
{
"epoch": 2.0452155625657205,
"grad_norm": 0.5070987988138339,
"learning_rate": 3.567439028600211e-05,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14278246462345123,
"step": 1945,
"valid_targets_mean": 2418.1,
"valid_targets_min": 949
},
{
"epoch": 2.050473186119874,
"grad_norm": 0.45731591837081925,
"learning_rate": 3.564176609073979e-05,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14413893222808838,
"step": 1950,
"valid_targets_mean": 2671.4,
"valid_targets_min": 615
},
{
"epoch": 2.0557308096740274,
"grad_norm": 0.5123913667295944,
"learning_rate": 3.5609034366218426e-05,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1473674178123474,
"step": 1955,
"valid_targets_mean": 2359.5,
"valid_targets_min": 926
},
{
"epoch": 2.060988433228181,
"grad_norm": 0.4780785072793604,
"learning_rate": 3.5576195337452146e-05,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12123583257198334,
"step": 1960,
"valid_targets_mean": 2013.9,
"valid_targets_min": 702
},
{
"epoch": 2.0662460567823344,
"grad_norm": 0.3815864367478656,
"learning_rate": 3.55432492301927e-05,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1051771491765976,
"step": 1965,
"valid_targets_mean": 2731.7,
"valid_targets_min": 772
},
{
"epoch": 2.071503680336488,
"grad_norm": 0.46772429283695915,
"learning_rate": 3.551019627092799e-05,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13175570964813232,
"step": 1970,
"valid_targets_mean": 2440.7,
"valid_targets_min": 677
},
{
"epoch": 2.0767613038906414,
"grad_norm": 0.556231018219464,
"learning_rate": 3.547703668688044e-05,
"loss": 0.1188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13067355751991272,
"step": 1975,
"valid_targets_mean": 1788.6,
"valid_targets_min": 687
},
{
"epoch": 2.082018927444795,
"grad_norm": 0.5408633758543436,
"learning_rate": 3.544377070600549e-05,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15026794373989105,
"step": 1980,
"valid_targets_mean": 2042.7,
"valid_targets_min": 712
},
{
"epoch": 2.0872765509989484,
"grad_norm": 0.47754843928115875,
"learning_rate": 3.541039855699e-05,
"loss": 0.1194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12666237354278564,
"step": 1985,
"valid_targets_mean": 2131.7,
"valid_targets_min": 836
},
{
"epoch": 2.092534174553102,
"grad_norm": 0.43168005253830566,
"learning_rate": 3.537692046925065e-05,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11582004278898239,
"step": 1990,
"valid_targets_mean": 2472.6,
"valid_targets_min": 826
},
{
"epoch": 2.0977917981072554,
"grad_norm": 0.5380064357290384,
"learning_rate": 3.534333667293244e-05,
"loss": 0.121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13713784515857697,
"step": 1995,
"valid_targets_mean": 2021.4,
"valid_targets_min": 637
},
{
"epoch": 2.103049421661409,
"grad_norm": 0.5845972184708509,
"learning_rate": 3.5309647398907056e-05,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1710910052061081,
"step": 2000,
"valid_targets_mean": 1991.2,
"valid_targets_min": 738
},
{
"epoch": 2.108307045215563,
"grad_norm": 0.6249776196883474,
"learning_rate": 3.527585287877125e-05,
"loss": 0.1341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11936753243207932,
"step": 2005,
"valid_targets_mean": 2236.9,
"valid_targets_min": 812
},
{
"epoch": 2.1135646687697163,
"grad_norm": 0.4626009802451835,
"learning_rate": 3.5241953344845345e-05,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11106312274932861,
"step": 2010,
"valid_targets_mean": 2144.8,
"valid_targets_min": 551
},
{
"epoch": 2.1188222923238698,
"grad_norm": 0.4507578603910488,
"learning_rate": 3.520794903017153e-05,
"loss": 0.1338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1228797659277916,
"step": 2015,
"valid_targets_mean": 2368.6,
"valid_targets_min": 826
},
{
"epoch": 2.1240799158780233,
"grad_norm": 0.4590026027765624,
"learning_rate": 3.517384016851235e-05,
"loss": 0.133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13244223594665527,
"step": 2020,
"valid_targets_mean": 2675.6,
"valid_targets_min": 663
},
{
"epoch": 2.1293375394321767,
"grad_norm": 0.5106300807003196,
"learning_rate": 3.513962699434903e-05,
"loss": 0.1347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14137056469917297,
"step": 2025,
"valid_targets_mean": 2193.9,
"valid_targets_min": 621
},
{
"epoch": 2.1345951629863302,
"grad_norm": 0.4223421034280718,
"learning_rate": 3.5105309742879894e-05,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11488351225852966,
"step": 2030,
"valid_targets_mean": 2716.0,
"valid_targets_min": 744
},
{
"epoch": 2.1398527865404837,
"grad_norm": 0.4726773189930089,
"learning_rate": 3.507088865001876e-05,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12050914764404297,
"step": 2035,
"valid_targets_mean": 2316.9,
"valid_targets_min": 697
},
{
"epoch": 2.145110410094637,
"grad_norm": 0.40285060808881745,
"learning_rate": 3.5036363952393296e-05,
"loss": 0.1209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10139887034893036,
"step": 2040,
"valid_targets_mean": 2308.3,
"valid_targets_min": 765
},
{
"epoch": 2.1503680336487907,
"grad_norm": 0.5783542833364608,
"learning_rate": 3.500173588734339e-05,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442745476961136,
"step": 2045,
"valid_targets_mean": 1760.6,
"valid_targets_min": 784
},
{
"epoch": 2.155625657202944,
"grad_norm": 0.4527249070861431,
"learning_rate": 3.4967004692919555e-05,
"loss": 0.1204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12106870114803314,
"step": 2050,
"valid_targets_mean": 2406.2,
"valid_targets_min": 728
},
{
"epoch": 2.1608832807570977,
"grad_norm": 0.4602957888289968,
"learning_rate": 3.4932170607881226e-05,
"loss": 0.1274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14271163940429688,
"step": 2055,
"valid_targets_mean": 2614.0,
"valid_targets_min": 800
},
{
"epoch": 2.166140904311251,
"grad_norm": 0.4306041008958775,
"learning_rate": 3.4897233871695205e-05,
"loss": 0.1259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1112859696149826,
"step": 2060,
"valid_targets_mean": 2409.6,
"valid_targets_min": 919
},
{
"epoch": 2.1713985278654047,
"grad_norm": 0.39117994337061757,
"learning_rate": 3.4862194724533934e-05,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1018102765083313,
"step": 2065,
"valid_targets_mean": 3024.4,
"valid_targets_min": 615
},
{
"epoch": 2.176656151419558,
"grad_norm": 0.5193252628270868,
"learning_rate": 3.4827053407273894e-05,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16743426024913788,
"step": 2070,
"valid_targets_mean": 2178.8,
"valid_targets_min": 900
},
{
"epoch": 2.181913774973712,
"grad_norm": 0.4773644910737866,
"learning_rate": 3.4791810161493935e-05,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11436664313077927,
"step": 2075,
"valid_targets_mean": 2165.2,
"valid_targets_min": 564
},
{
"epoch": 2.1871713985278656,
"grad_norm": 0.49019952779097675,
"learning_rate": 3.47564652294736e-05,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1278860867023468,
"step": 2080,
"valid_targets_mean": 2144.4,
"valid_targets_min": 790
},
{
"epoch": 2.192429022082019,
"grad_norm": 0.45905165358912653,
"learning_rate": 3.472101885419149e-05,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10517239570617676,
"step": 2085,
"valid_targets_mean": 2574.6,
"valid_targets_min": 916
},
{
"epoch": 2.1976866456361726,
"grad_norm": 0.4057615533224451,
"learning_rate": 3.468547127932358e-05,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10115516185760498,
"step": 2090,
"valid_targets_mean": 2422.2,
"valid_targets_min": 720
},
{
"epoch": 2.202944269190326,
"grad_norm": 0.469340057308021,
"learning_rate": 3.4649822749241525e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12604938447475433,
"step": 2095,
"valid_targets_mean": 2676.9,
"valid_targets_min": 490
},
{
"epoch": 2.2082018927444795,
"grad_norm": 0.6505534050622875,
"learning_rate": 3.4614073509011e-05,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13901427388191223,
"step": 2100,
"valid_targets_mean": 1320.7,
"valid_targets_min": 594
},
{
"epoch": 2.213459516298633,
"grad_norm": 0.4383173264208626,
"learning_rate": 3.4578223804390026e-05,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10560506582260132,
"step": 2105,
"valid_targets_mean": 2229.6,
"valid_targets_min": 694
},
{
"epoch": 2.2187171398527865,
"grad_norm": 0.6069740713094931,
"learning_rate": 3.454227388182725e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24115046858787537,
"step": 2110,
"valid_targets_mean": 1657.2,
"valid_targets_min": 812
},
{
"epoch": 2.22397476340694,
"grad_norm": 0.43533617110430645,
"learning_rate": 3.450622398846026e-05,
"loss": 0.1284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12046660482883453,
"step": 2115,
"valid_targets_mean": 2715.1,
"valid_targets_min": 746
},
{
"epoch": 2.2292323869610935,
"grad_norm": 0.599359561496524,
"learning_rate": 3.447007437211392e-05,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14519494771957397,
"step": 2120,
"valid_targets_mean": 1855.6,
"valid_targets_min": 598
},
{
"epoch": 2.234490010515247,
"grad_norm": 0.38420244117190716,
"learning_rate": 3.443382528129862e-05,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11376230418682098,
"step": 2125,
"valid_targets_mean": 2770.0,
"valid_targets_min": 781
},
{
"epoch": 2.2397476340694005,
"grad_norm": 0.4896507218182568,
"learning_rate": 3.4397476965208604e-05,
"loss": 0.1273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1241091936826706,
"step": 2130,
"valid_targets_mean": 2216.6,
"valid_targets_min": 524
},
{
"epoch": 2.245005257623554,
"grad_norm": 0.4650364241948299,
"learning_rate": 3.43610296737202e-05,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12122425436973572,
"step": 2135,
"valid_targets_mean": 2123.4,
"valid_targets_min": 734
},
{
"epoch": 2.250262881177708,
"grad_norm": 0.5977926020048738,
"learning_rate": 3.432448365739019e-05,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14992423355579376,
"step": 2140,
"valid_targets_mean": 1818.1,
"valid_targets_min": 669
},
{
"epoch": 2.2555205047318614,
"grad_norm": 0.4837572047226774,
"learning_rate": 3.4287839167454016e-05,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1280701458454132,
"step": 2145,
"valid_targets_mean": 2250.2,
"valid_targets_min": 682
},
{
"epoch": 2.260778128286015,
"grad_norm": 0.5125748737367186,
"learning_rate": 3.4251096455824076e-05,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1362539529800415,
"step": 2150,
"valid_targets_mean": 2222.9,
"valid_targets_min": 1144
},
{
"epoch": 2.2660357518401684,
"grad_norm": 0.5179245122239554,
"learning_rate": 3.421425577508799e-05,
"loss": 0.1234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12561476230621338,
"step": 2155,
"valid_targets_mean": 1877.7,
"valid_targets_min": 627
},
{
"epoch": 2.271293375394322,
"grad_norm": 0.572251612705651,
"learning_rate": 3.417731737850687e-05,
"loss": 0.1369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14186495542526245,
"step": 2160,
"valid_targets_mean": 1725.6,
"valid_targets_min": 507
},
{
"epoch": 2.2765509989484753,
"grad_norm": 0.5609206474550744,
"learning_rate": 3.4140281520013595e-05,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1495792269706726,
"step": 2165,
"valid_targets_mean": 1738.9,
"valid_targets_min": 598
},
{
"epoch": 2.281808622502629,
"grad_norm": 0.4291383467964329,
"learning_rate": 3.4103148454211017e-05,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11707118153572083,
"step": 2170,
"valid_targets_mean": 2785.3,
"valid_targets_min": 802
},
{
"epoch": 2.2870662460567823,
"grad_norm": 0.45233604821609774,
"learning_rate": 3.4065918436370244e-05,
"loss": 0.1183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12072920054197311,
"step": 2175,
"valid_targets_mean": 2427.9,
"valid_targets_min": 743
},
{
"epoch": 2.292323869610936,
"grad_norm": 0.5262996722238373,
"learning_rate": 3.402859172242889e-05,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12840887904167175,
"step": 2180,
"valid_targets_mean": 2301.5,
"valid_targets_min": 647
},
{
"epoch": 2.2975814931650893,
"grad_norm": 0.4828494742963766,
"learning_rate": 3.399116856898931e-05,
"loss": 0.1281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1163383424282074,
"step": 2185,
"valid_targets_mean": 1966.8,
"valid_targets_min": 671
},
{
"epoch": 2.302839116719243,
"grad_norm": 0.4408567104646948,
"learning_rate": 3.395364923331681e-05,
"loss": 0.1201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11785329878330231,
"step": 2190,
"valid_targets_mean": 2664.4,
"valid_targets_min": 333
},
{
"epoch": 2.3080967402733963,
"grad_norm": 0.46781551370442137,
"learning_rate": 3.391603397333793e-05,
"loss": 0.1257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1327618658542633,
"step": 2195,
"valid_targets_mean": 2295.9,
"valid_targets_min": 980
},
{
"epoch": 2.3133543638275498,
"grad_norm": 0.461624610712435,
"learning_rate": 3.387832304763861e-05,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1282767653465271,
"step": 2200,
"valid_targets_mean": 2335.7,
"valid_targets_min": 937
},
{
"epoch": 2.3186119873817033,
"grad_norm": 0.47052356903787107,
"learning_rate": 3.384051671546247e-05,
"loss": 0.1329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11978121846914291,
"step": 2205,
"valid_targets_mean": 2129.2,
"valid_targets_min": 690
},
{
"epoch": 2.3238696109358568,
"grad_norm": 0.5583559171870117,
"learning_rate": 3.380261523670899e-05,
"loss": 0.129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14906030893325806,
"step": 2210,
"valid_targets_mean": 1948.1,
"valid_targets_min": 759
},
{
"epoch": 2.3291272344900107,
"grad_norm": 0.4414407548790824,
"learning_rate": 3.376461887193173e-05,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1148625984787941,
"step": 2215,
"valid_targets_mean": 2430.5,
"valid_targets_min": 589
},
{
"epoch": 2.334384858044164,
"grad_norm": 0.4772414705822393,
"learning_rate": 3.372652788233656e-05,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14924514293670654,
"step": 2220,
"valid_targets_mean": 2866.3,
"valid_targets_min": 1286
},
{
"epoch": 2.3396424815983177,
"grad_norm": 0.5095114198475202,
"learning_rate": 3.368834252977982e-05,
"loss": 0.1239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1499393880367279,
"step": 2225,
"valid_targets_mean": 2038.2,
"valid_targets_min": 569
},
{
"epoch": 2.344900105152471,
"grad_norm": 0.5492758789004418,
"learning_rate": 3.3650063076766586e-05,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13819925487041473,
"step": 2230,
"valid_targets_mean": 2024.1,
"valid_targets_min": 681
},
{
"epoch": 2.3501577287066246,
"grad_norm": 0.5599938825560205,
"learning_rate": 3.3611689786448786e-05,
"loss": 0.127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12143988907337189,
"step": 2235,
"valid_targets_mean": 2295.2,
"valid_targets_min": 560
},
{
"epoch": 2.355415352260778,
"grad_norm": 0.4764121806434522,
"learning_rate": 3.357322292262346e-05,
"loss": 0.1381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14417289197444916,
"step": 2240,
"valid_targets_mean": 2300.9,
"valid_targets_min": 585
},
{
"epoch": 2.3606729758149316,
"grad_norm": 0.41294962937457674,
"learning_rate": 3.353466274973092e-05,
"loss": 0.128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13291729986667633,
"step": 2245,
"valid_targets_mean": 2764.4,
"valid_targets_min": 673
},
{
"epoch": 2.365930599369085,
"grad_norm": 0.6155898043722726,
"learning_rate": 3.3496009532852907e-05,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16557329893112183,
"step": 2250,
"valid_targets_mean": 1606.2,
"valid_targets_min": 702
},
{
"epoch": 2.3711882229232386,
"grad_norm": 0.44913851343093436,
"learning_rate": 3.345726353771082e-05,
"loss": 0.1329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1271086186170578,
"step": 2255,
"valid_targets_mean": 2099.0,
"valid_targets_min": 612
},
{
"epoch": 2.376445846477392,
"grad_norm": 0.4152659533284206,
"learning_rate": 3.341842503066384e-05,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10442264378070831,
"step": 2260,
"valid_targets_mean": 2427.3,
"valid_targets_min": 816
},
{
"epoch": 2.3817034700315456,
"grad_norm": 0.4398070682209434,
"learning_rate": 3.3379494278707136e-05,
"loss": 0.128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13010065257549286,
"step": 2265,
"valid_targets_mean": 2532.3,
"valid_targets_min": 719
},
{
"epoch": 2.386961093585699,
"grad_norm": 0.41513624638668983,
"learning_rate": 3.334047154947e-05,
"loss": 0.1256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12492187321186066,
"step": 2270,
"valid_targets_mean": 2769.9,
"valid_targets_min": 776
},
{
"epoch": 2.392218717139853,
"grad_norm": 0.5673060841263946,
"learning_rate": 3.330135711121404e-05,
"loss": 0.1301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13597270846366882,
"step": 2275,
"valid_targets_mean": 1809.6,
"valid_targets_min": 701
},
{
"epoch": 2.3974763406940065,
"grad_norm": 0.49355202092433315,
"learning_rate": 3.32621512328313e-05,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13019579648971558,
"step": 2280,
"valid_targets_mean": 2124.6,
"valid_targets_min": 617
},
{
"epoch": 2.40273396424816,
"grad_norm": 0.450817274315313,
"learning_rate": 3.3222854183842434e-05,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11162659525871277,
"step": 2285,
"valid_targets_mean": 2170.4,
"valid_targets_min": 722
},
{
"epoch": 2.4079915878023135,
"grad_norm": 0.47578870750920976,
"learning_rate": 3.318346623439486e-05,
"loss": 0.1197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.120580293238163,
"step": 2290,
"valid_targets_mean": 2150.6,
"valid_targets_min": 203
},
{
"epoch": 2.413249211356467,
"grad_norm": 0.5302285404249144,
"learning_rate": 3.314398765526087e-05,
"loss": 0.1267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13867713510990143,
"step": 2295,
"valid_targets_mean": 2153.8,
"valid_targets_min": 724
},
{
"epoch": 2.4185068349106205,
"grad_norm": 0.5674673130410676,
"learning_rate": 3.310441871783581e-05,
"loss": 0.1341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15291212499141693,
"step": 2300,
"valid_targets_mean": 1910.3,
"valid_targets_min": 772
},
{
"epoch": 2.423764458464774,
"grad_norm": 0.37856761450775467,
"learning_rate": 3.3064759694136165e-05,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10432924330234528,
"step": 2305,
"valid_targets_mean": 3020.6,
"valid_targets_min": 1076
},
{
"epoch": 2.4290220820189274,
"grad_norm": 0.5086169310332803,
"learning_rate": 3.302501085679776e-05,
"loss": 0.1296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13484901189804077,
"step": 2310,
"valid_targets_mean": 2347.6,
"valid_targets_min": 982
},
{
"epoch": 2.434279705573081,
"grad_norm": 0.5309705554750334,
"learning_rate": 3.29851724790738e-05,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16106128692626953,
"step": 2315,
"valid_targets_mean": 2332.8,
"valid_targets_min": 786
},
{
"epoch": 2.4395373291272344,
"grad_norm": 0.5216922839752293,
"learning_rate": 3.294524483483306e-05,
"loss": 0.1201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12702396512031555,
"step": 2320,
"valid_targets_mean": 1755.4,
"valid_targets_min": 623
},
{
"epoch": 2.444794952681388,
"grad_norm": 0.5380436931117779,
"learning_rate": 3.290522819855799e-05,
"loss": 0.1328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14177465438842773,
"step": 2325,
"valid_targets_mean": 2111.9,
"valid_targets_min": 663
},
{
"epoch": 2.4500525762355414,
"grad_norm": 0.569671408989822,
"learning_rate": 3.2865122845342776e-05,
"loss": 0.1329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17413151264190674,
"step": 2330,
"valid_targets_mean": 2052.1,
"valid_targets_min": 792
},
{
"epoch": 2.455310199789695,
"grad_norm": 0.4973580982001922,
"learning_rate": 3.282492905089151e-05,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12970225512981415,
"step": 2335,
"valid_targets_mean": 1919.8,
"valid_targets_min": 703
},
{
"epoch": 2.4605678233438484,
"grad_norm": 0.535683558284658,
"learning_rate": 3.2784647091516285e-05,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13729405403137207,
"step": 2340,
"valid_targets_mean": 2092.4,
"valid_targets_min": 901
},
{
"epoch": 2.465825446898002,
"grad_norm": 0.5350141288116025,
"learning_rate": 3.274427724413527e-05,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18814143538475037,
"step": 2345,
"valid_targets_mean": 1991.1,
"valid_targets_min": 796
},
{
"epoch": 2.471083070452156,
"grad_norm": 0.46916322154103374,
"learning_rate": 3.270381978627081e-05,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12381716817617416,
"step": 2350,
"valid_targets_mean": 2520.6,
"valid_targets_min": 903
},
{
"epoch": 2.4763406940063093,
"grad_norm": 0.41841785116112407,
"learning_rate": 3.266327499604755e-05,
"loss": 0.1227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13207407295703888,
"step": 2355,
"valid_targets_mean": 2773.9,
"valid_targets_min": 967
},
{
"epoch": 2.481598317560463,
"grad_norm": 0.370764477658884,
"learning_rate": 3.262264315219049e-05,
"loss": 0.1235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09727045893669128,
"step": 2360,
"valid_targets_mean": 2640.9,
"valid_targets_min": 728
},
{
"epoch": 2.4868559411146163,
"grad_norm": 0.49322867372756224,
"learning_rate": 3.258192453402306e-05,
"loss": 0.1353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13653698563575745,
"step": 2365,
"valid_targets_mean": 2480.3,
"valid_targets_min": 619
},
{
"epoch": 2.4921135646687698,
"grad_norm": 0.6000008792945966,
"learning_rate": 3.254111942146526e-05,
"loss": 0.1419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17861872911453247,
"step": 2370,
"valid_targets_mean": 2338.8,
"valid_targets_min": 724
},
{
"epoch": 2.4973711882229233,
"grad_norm": 0.6244983815523586,
"learning_rate": 3.2500228095031677e-05,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1728927344083786,
"step": 2375,
"valid_targets_mean": 1750.2,
"valid_targets_min": 654
},
{
"epoch": 2.5026288117770767,
"grad_norm": 0.45085743143190754,
"learning_rate": 3.2459250835829553e-05,
"loss": 0.1289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12541204690933228,
"step": 2380,
"valid_targets_mean": 2501.1,
"valid_targets_min": 875
},
{
"epoch": 2.5078864353312302,
"grad_norm": 0.5607166281402027,
"learning_rate": 3.241818792555692e-05,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14313367009162903,
"step": 2385,
"valid_targets_mean": 1766.9,
"valid_targets_min": 622
},
{
"epoch": 2.5131440588853837,
"grad_norm": 0.349230123314275,
"learning_rate": 3.2377039646500565e-05,
"loss": 0.1298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10430118441581726,
"step": 2390,
"valid_targets_mean": 3307.1,
"valid_targets_min": 652
},
{
"epoch": 2.518401682439537,
"grad_norm": 0.4417621172341899,
"learning_rate": 3.2335806281534195e-05,
"loss": 0.1303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11151588708162308,
"step": 2395,
"valid_targets_mean": 2447.7,
"valid_targets_min": 656
},
{
"epoch": 2.5236593059936907,
"grad_norm": 0.49931457443472277,
"learning_rate": 3.229448811411639e-05,
"loss": 0.1327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12890373170375824,
"step": 2400,
"valid_targets_mean": 2252.1,
"valid_targets_min": 625
},
{
"epoch": 2.5289169295478446,
"grad_norm": 0.7942673110753607,
"learning_rate": 3.225308542828874e-05,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19666960835456848,
"step": 2405,
"valid_targets_mean": 1578.9,
"valid_targets_min": 572
},
{
"epoch": 2.534174553101998,
"grad_norm": 0.51248329231455,
"learning_rate": 3.221159850867385e-05,
"loss": 0.1337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1459226906299591,
"step": 2410,
"valid_targets_mean": 2156.8,
"valid_targets_min": 509
},
{
"epoch": 2.5394321766561516,
"grad_norm": 0.49317302567320126,
"learning_rate": 3.217002764047338e-05,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11925698071718216,
"step": 2415,
"valid_targets_mean": 2903.6,
"valid_targets_min": 800
},
{
"epoch": 2.544689800210305,
"grad_norm": 0.4393291901406591,
"learning_rate": 3.212837310946609e-05,
"loss": 0.1233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12763074040412903,
"step": 2420,
"valid_targets_mean": 2780.6,
"valid_targets_min": 1164
},
{
"epoch": 2.5499474237644586,
"grad_norm": 0.4716747925974937,
"learning_rate": 3.20866352020059e-05,
"loss": 0.1229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12626245617866516,
"step": 2425,
"valid_targets_mean": 1949.4,
"valid_targets_min": 714
},
{
"epoch": 2.555205047318612,
"grad_norm": 0.5235167266244677,
"learning_rate": 3.204481420501989e-05,
"loss": 0.1272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14741046726703644,
"step": 2430,
"valid_targets_mean": 2202.5,
"valid_targets_min": 854
},
{
"epoch": 2.5604626708727656,
"grad_norm": 0.4269687559337652,
"learning_rate": 3.200291040600632e-05,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1541425883769989,
"step": 2435,
"valid_targets_mean": 2509.3,
"valid_targets_min": 1171
},
{
"epoch": 2.565720294426919,
"grad_norm": 0.44445840751802473,
"learning_rate": 3.196092409303272e-05,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1255953013896942,
"step": 2440,
"valid_targets_mean": 2813.1,
"valid_targets_min": 970
},
{
"epoch": 2.5709779179810726,
"grad_norm": 0.577425782298681,
"learning_rate": 3.1918855554733804e-05,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1654086410999298,
"step": 2445,
"valid_targets_mean": 1792.1,
"valid_targets_min": 482
},
{
"epoch": 2.576235541535226,
"grad_norm": 0.5646865981120427,
"learning_rate": 3.187670508030959e-05,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12331168353557587,
"step": 2450,
"valid_targets_mean": 2131.4,
"valid_targets_min": 634
},
{
"epoch": 2.5814931650893795,
"grad_norm": 0.4210411659881901,
"learning_rate": 3.183447295952334e-05,
"loss": 0.1209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12410222738981247,
"step": 2455,
"valid_targets_mean": 2511.1,
"valid_targets_min": 635
},
{
"epoch": 2.586750788643533,
"grad_norm": 0.5143315136141954,
"learning_rate": 3.1792159482699606e-05,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13157877326011658,
"step": 2460,
"valid_targets_mean": 2035.7,
"valid_targets_min": 333
},
{
"epoch": 2.5920084121976865,
"grad_norm": 0.4927887120879855,
"learning_rate": 3.174976494072222e-05,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12919488549232483,
"step": 2465,
"valid_targets_mean": 2004.0,
"valid_targets_min": 652
},
{
"epoch": 2.59726603575184,
"grad_norm": 0.5610440503495874,
"learning_rate": 3.170728962503227e-05,
"loss": 0.1358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13205116987228394,
"step": 2470,
"valid_targets_mean": 1937.8,
"valid_targets_min": 706
},
{
"epoch": 2.6025236593059935,
"grad_norm": 0.44492199722204956,
"learning_rate": 3.1664733827626174e-05,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11554092913866043,
"step": 2475,
"valid_targets_mean": 2413.4,
"valid_targets_min": 746
},
{
"epoch": 2.607781282860147,
"grad_norm": 0.4157640745535471,
"learning_rate": 3.1622097841053574e-05,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1235933005809784,
"step": 2480,
"valid_targets_mean": 2683.9,
"valid_targets_min": 799
},
{
"epoch": 2.6130389064143005,
"grad_norm": 0.5745930299468012,
"learning_rate": 3.15793819584154e-05,
"loss": 0.1275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14433233439922333,
"step": 2485,
"valid_targets_mean": 2245.2,
"valid_targets_min": 739
},
{
"epoch": 2.6182965299684544,
"grad_norm": 0.469643202711402,
"learning_rate": 3.1536586473361815e-05,
"loss": 0.1381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13549131155014038,
"step": 2490,
"valid_targets_mean": 2644.9,
"valid_targets_min": 323
},
{
"epoch": 2.623554153522608,
"grad_norm": 0.48888303913649117,
"learning_rate": 3.149371168009022e-05,
"loss": 0.1289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1277773380279541,
"step": 2495,
"valid_targets_mean": 2266.4,
"valid_targets_min": 741
},
{
"epoch": 2.6288117770767614,
"grad_norm": 0.46544848382238063,
"learning_rate": 3.145075787334319e-05,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1833849549293518,
"step": 2500,
"valid_targets_mean": 2318.6,
"valid_targets_min": 623
},
{
"epoch": 2.634069400630915,
"grad_norm": 0.4568665677588512,
"learning_rate": 3.140772534840652e-05,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12838146090507507,
"step": 2505,
"valid_targets_mean": 2301.1,
"valid_targets_min": 639
},
{
"epoch": 2.6393270241850684,
"grad_norm": 0.46751738504389234,
"learning_rate": 3.1364614401107126e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12055309116840363,
"step": 2510,
"valid_targets_mean": 2212.8,
"valid_targets_min": 816
},
{
"epoch": 2.644584647739222,
"grad_norm": 0.43672126320010757,
"learning_rate": 3.1321425327811044e-05,
"loss": 0.1257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1180083304643631,
"step": 2515,
"valid_targets_mean": 2219.2,
"valid_targets_min": 837
},
{
"epoch": 2.6498422712933754,
"grad_norm": 0.4515973901786908,
"learning_rate": 3.127815842542138e-05,
"loss": 0.1277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1234833151102066,
"step": 2520,
"valid_targets_mean": 2426.4,
"valid_targets_min": 700
},
{
"epoch": 2.655099894847529,
"grad_norm": 0.5307805703940389,
"learning_rate": 3.1234813991376296e-05,
"loss": 0.1354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1535000205039978,
"step": 2525,
"valid_targets_mean": 2139.4,
"valid_targets_min": 751
},
{
"epoch": 2.6603575184016823,
"grad_norm": 0.5082195572812225,
"learning_rate": 3.119139232364693e-05,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14292414486408234,
"step": 2530,
"valid_targets_mean": 2131.5,
"valid_targets_min": 732
},
{
"epoch": 2.665615141955836,
"grad_norm": 0.5632757976378782,
"learning_rate": 3.1147893720735356e-05,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13347192108631134,
"step": 2535,
"valid_targets_mean": 1798.6,
"valid_targets_min": 541
},
{
"epoch": 2.6708727655099898,
"grad_norm": 0.4999263753768626,
"learning_rate": 3.110431848167255e-05,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1604682207107544,
"step": 2540,
"valid_targets_mean": 2195.6,
"valid_targets_min": 492
},
{
"epoch": 2.6761303890641432,
"grad_norm": 0.4846247046942896,
"learning_rate": 3.106066690601633e-05,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1544347107410431,
"step": 2545,
"valid_targets_mean": 2396.6,
"valid_targets_min": 734
},
{
"epoch": 2.6813880126182967,
"grad_norm": 0.5031037870288574,
"learning_rate": 3.101693929384927e-05,
"loss": 0.1235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12892138957977295,
"step": 2550,
"valid_targets_mean": 2153.6,
"valid_targets_min": 660
},
{
"epoch": 2.6866456361724502,
"grad_norm": 0.4237681668530756,
"learning_rate": 3.097313594577667e-05,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10954263061285019,
"step": 2555,
"valid_targets_mean": 2281.6,
"valid_targets_min": 523
},
{
"epoch": 2.6919032597266037,
"grad_norm": 0.5025501202207807,
"learning_rate": 3.092925716292447e-05,
"loss": 0.1273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14490699768066406,
"step": 2560,
"valid_targets_mean": 2398.4,
"valid_targets_min": 911
},
{
"epoch": 2.697160883280757,
"grad_norm": 1.4413956671661858,
"learning_rate": 3.088530324693719e-05,
"loss": 0.1222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11001194268465042,
"step": 2565,
"valid_targets_mean": 2059.5,
"valid_targets_min": 696
},
{
"epoch": 2.7024185068349107,
"grad_norm": 0.48597301218526534,
"learning_rate": 3.0841274499975855e-05,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1456114798784256,
"step": 2570,
"valid_targets_mean": 2436.7,
"valid_targets_min": 928
},
{
"epoch": 2.707676130389064,
"grad_norm": 0.4292422973469116,
"learning_rate": 3.079717122471591e-05,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11817838251590729,
"step": 2575,
"valid_targets_mean": 2428.1,
"valid_targets_min": 676
},
{
"epoch": 2.7129337539432177,
"grad_norm": 0.47480229911956606,
"learning_rate": 3.075299372434515e-05,
"loss": 0.142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15318870544433594,
"step": 2580,
"valid_targets_mean": 2268.4,
"valid_targets_min": 820
},
{
"epoch": 2.718191377497371,
"grad_norm": 0.36940081662494484,
"learning_rate": 3.0708742302561606e-05,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10757045447826385,
"step": 2585,
"valid_targets_mean": 2752.0,
"valid_targets_min": 959
},
{
"epoch": 2.7234490010515247,
"grad_norm": 0.47949596398229655,
"learning_rate": 3.066441726357153e-05,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12207190692424774,
"step": 2590,
"valid_targets_mean": 2475.9,
"valid_targets_min": 774
},
{
"epoch": 2.728706624605678,
"grad_norm": 0.5433743165382702,
"learning_rate": 3.062001891208721e-05,
"loss": 0.1402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13814394176006317,
"step": 2595,
"valid_targets_mean": 1810.8,
"valid_targets_min": 666
},
{
"epoch": 2.7339642481598316,
"grad_norm": 0.42922263122322435,
"learning_rate": 3.0575547553324944e-05,
"loss": 0.1325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12289388477802277,
"step": 2600,
"valid_targets_mean": 2449.1,
"valid_targets_min": 808
},
{
"epoch": 2.739221871713985,
"grad_norm": 0.4559709205563668,
"learning_rate": 3.053100349300291e-05,
"loss": 0.1229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13742108643054962,
"step": 2605,
"valid_targets_mean": 2324.9,
"valid_targets_min": 807
},
{
"epoch": 2.7444794952681386,
"grad_norm": 0.4608957789790409,
"learning_rate": 3.0486387037339074e-05,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1124209314584732,
"step": 2610,
"valid_targets_mean": 2033.6,
"valid_targets_min": 683
},
{
"epoch": 2.749737118822292,
"grad_norm": 0.4474527329817486,
"learning_rate": 3.0441698493049078e-05,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11497777700424194,
"step": 2615,
"valid_targets_mean": 2339.6,
"valid_targets_min": 742
},
{
"epoch": 2.7549947423764456,
"grad_norm": 0.4465578093674148,
"learning_rate": 3.0396938167344153e-05,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12491779774427414,
"step": 2620,
"valid_targets_mean": 2372.3,
"valid_targets_min": 774
},
{
"epoch": 2.7602523659305995,
"grad_norm": 0.4658548438561309,
"learning_rate": 3.0352106367928974e-05,
"loss": 0.1402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15467898547649384,
"step": 2625,
"valid_targets_mean": 2353.6,
"valid_targets_min": 575
},
{
"epoch": 2.765509989484753,
"grad_norm": 0.4181555161891978,
"learning_rate": 3.030720340299957e-05,
"loss": 0.1328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11631730198860168,
"step": 2630,
"valid_targets_mean": 2602.1,
"valid_targets_min": 675
},
{
"epoch": 2.7707676130389065,
"grad_norm": 0.4806825998275714,
"learning_rate": 3.0262229581241197e-05,
"loss": 0.1192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14768224954605103,
"step": 2635,
"valid_targets_mean": 2436.3,
"valid_targets_min": 820
},
{
"epoch": 2.77602523659306,
"grad_norm": 0.4619431814251294,
"learning_rate": 3.0217185211826218e-05,
"loss": 0.1154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11479765176773071,
"step": 2640,
"valid_targets_mean": 2398.8,
"valid_targets_min": 474
},
{
"epoch": 2.7812828601472135,
"grad_norm": 0.3863010970690241,
"learning_rate": 3.0172070604411957e-05,
"loss": 0.1299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09624399244785309,
"step": 2645,
"valid_targets_mean": 2566.4,
"valid_targets_min": 635
},
{
"epoch": 2.786540483701367,
"grad_norm": 0.44834440185749524,
"learning_rate": 3.0126886069138623e-05,
"loss": 0.1197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11984342336654663,
"step": 2650,
"valid_targets_mean": 2300.4,
"valid_targets_min": 612
},
{
"epoch": 2.7917981072555205,
"grad_norm": 0.41833862281237577,
"learning_rate": 3.0081631916627114e-05,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1254144012928009,
"step": 2655,
"valid_targets_mean": 2775.9,
"valid_targets_min": 751
},
{
"epoch": 2.797055730809674,
"grad_norm": 0.4173736679292746,
"learning_rate": 3.003630845797693e-05,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11636321246623993,
"step": 2660,
"valid_targets_mean": 2720.7,
"valid_targets_min": 805
},
{
"epoch": 2.8023133543638274,
"grad_norm": 0.4875903392535986,
"learning_rate": 2.9990916004763996e-05,
"loss": 0.1305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13238069415092468,
"step": 2665,
"valid_targets_mean": 2333.6,
"valid_targets_min": 531
},
{
"epoch": 2.807570977917981,
"grad_norm": 0.5067468193901491,
"learning_rate": 2.9945454869038562e-05,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1356458216905594,
"step": 2670,
"valid_targets_mean": 2160.2,
"valid_targets_min": 633
},
{
"epoch": 2.812828601472135,
"grad_norm": 0.4018575460234702,
"learning_rate": 2.9899925363323022e-05,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12325941026210785,
"step": 2675,
"valid_targets_mean": 2961.1,
"valid_targets_min": 830
},
{
"epoch": 2.8180862250262884,
"grad_norm": 0.46583410321410484,
"learning_rate": 2.9854327800609775e-05,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.131715327501297,
"step": 2680,
"valid_targets_mean": 2380.8,
"valid_targets_min": 814
},
{
"epoch": 2.823343848580442,
"grad_norm": 0.5874155649350631,
"learning_rate": 2.98086624943591e-05,
"loss": 0.1269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12297909706830978,
"step": 2685,
"valid_targets_mean": 2154.3,
"valid_targets_min": 705
},
{
"epoch": 2.8286014721345953,
"grad_norm": 0.46409664192737776,
"learning_rate": 2.976292975849696e-05,
"loss": 0.1204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1120598092675209,
"step": 2690,
"valid_targets_mean": 1963.8,
"valid_targets_min": 721
},
{
"epoch": 2.833859095688749,
"grad_norm": 0.4807255437981375,
"learning_rate": 2.9717129907412857e-05,
"loss": 0.1291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1193617582321167,
"step": 2695,
"valid_targets_mean": 2133.3,
"valid_targets_min": 740
},
{
"epoch": 2.8391167192429023,
"grad_norm": 0.3876768477055061,
"learning_rate": 2.9671263255957697e-05,
"loss": 0.1277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1101631447672844,
"step": 2700,
"valid_targets_mean": 2324.4,
"valid_targets_min": 764
},
{
"epoch": 2.844374342797056,
"grad_norm": 0.5004065842328297,
"learning_rate": 2.9625330119441584e-05,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14245113730430603,
"step": 2705,
"valid_targets_mean": 2310.9,
"valid_targets_min": 727
},
{
"epoch": 2.8496319663512093,
"grad_norm": 0.4025325302705115,
"learning_rate": 2.957933081363169e-05,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10665883123874664,
"step": 2710,
"valid_targets_mean": 2454.0,
"valid_targets_min": 837
},
{
"epoch": 2.854889589905363,
"grad_norm": 0.45621458151474187,
"learning_rate": 2.953326565475006e-05,
"loss": 0.128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1329360008239746,
"step": 2715,
"valid_targets_mean": 2548.8,
"valid_targets_min": 613
},
{
"epoch": 2.8601472134595163,
"grad_norm": 0.5558163985537915,
"learning_rate": 2.9487134959471445e-05,
"loss": 0.1297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1478731483221054,
"step": 2720,
"valid_targets_mean": 1797.7,
"valid_targets_min": 880
},
{
"epoch": 2.8654048370136698,
"grad_norm": 0.5819274616316016,
"learning_rate": 2.944093904492113e-05,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1630917191505432,
"step": 2725,
"valid_targets_mean": 2108.3,
"valid_targets_min": 593
},
{
"epoch": 2.8706624605678233,
"grad_norm": 0.45059487900938333,
"learning_rate": 2.9394678228672737e-05,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13295793533325195,
"step": 2730,
"valid_targets_mean": 2183.7,
"valid_targets_min": 722
},
{
"epoch": 2.8759200841219767,
"grad_norm": 0.44736809629231983,
"learning_rate": 2.9348352828746076e-05,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12000765651464462,
"step": 2735,
"valid_targets_mean": 2359.3,
"valid_targets_min": 718
},
{
"epoch": 2.8811777076761302,
"grad_norm": 0.40189987125458787,
"learning_rate": 2.9301963163604916e-05,
"loss": 0.1296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11780589818954468,
"step": 2740,
"valid_targets_mean": 2646.6,
"valid_targets_min": 908
},
{
"epoch": 2.8864353312302837,
"grad_norm": 0.4240789658342137,
"learning_rate": 2.925550955215483e-05,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11626739054918289,
"step": 2745,
"valid_targets_mean": 2335.8,
"valid_targets_min": 554
},
{
"epoch": 2.891692954784437,
"grad_norm": 0.43067987985146305,
"learning_rate": 2.9208992313740993e-05,
"loss": 0.1279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12096014618873596,
"step": 2750,
"valid_targets_mean": 2477.1,
"valid_targets_min": 794
},
{
"epoch": 2.8969505783385907,
"grad_norm": 0.4508477485181296,
"learning_rate": 2.916241176814596e-05,
"loss": 0.1239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12107770889997482,
"step": 2755,
"valid_targets_mean": 2193.9,
"valid_targets_min": 588
},
{
"epoch": 2.9022082018927446,
"grad_norm": 0.45469066694036736,
"learning_rate": 2.9115768235587526e-05,
"loss": 0.1185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12227421998977661,
"step": 2760,
"valid_targets_mean": 2110.3,
"valid_targets_min": 549
},
{
"epoch": 2.907465825446898,
"grad_norm": 0.4102525643163261,
"learning_rate": 2.9069062036716454e-05,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13152821362018585,
"step": 2765,
"valid_targets_mean": 2510.9,
"valid_targets_min": 494
},
{
"epoch": 2.9127234490010516,
"grad_norm": 0.48551869290981703,
"learning_rate": 2.9022293492614334e-05,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13426774740219116,
"step": 2770,
"valid_targets_mean": 2137.8,
"valid_targets_min": 717
},
{
"epoch": 2.917981072555205,
"grad_norm": 0.6232267022329183,
"learning_rate": 2.8975462924791334e-05,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15056556463241577,
"step": 2775,
"valid_targets_mean": 1371.2,
"valid_targets_min": 737
},
{
"epoch": 2.9232386961093586,
"grad_norm": 0.44024417305390795,
"learning_rate": 2.892857065518401e-05,
"loss": 0.1408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14012862741947174,
"step": 2780,
"valid_targets_mean": 2567.3,
"valid_targets_min": 1045
},
{
"epoch": 2.928496319663512,
"grad_norm": 0.4342553995532047,
"learning_rate": 2.8881617006153072e-05,
"loss": 0.1233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1255347728729248,
"step": 2785,
"valid_targets_mean": 2145.8,
"valid_targets_min": 700
},
{
"epoch": 2.9337539432176656,
"grad_norm": 0.39849941747351697,
"learning_rate": 2.8834602300481207e-05,
"loss": 0.1341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1139749139547348,
"step": 2790,
"valid_targets_mean": 2767.8,
"valid_targets_min": 940
},
{
"epoch": 2.939011566771819,
"grad_norm": 0.4535674208927001,
"learning_rate": 2.878752686137082e-05,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12091179937124252,
"step": 2795,
"valid_targets_mean": 2344.1,
"valid_targets_min": 697
},
{
"epoch": 2.9442691903259726,
"grad_norm": 0.6266178181873837,
"learning_rate": 2.874039101244183e-05,
"loss": 0.1332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15312370657920837,
"step": 2800,
"valid_targets_mean": 1685.9,
"valid_targets_min": 596
},
{
"epoch": 2.949526813880126,
"grad_norm": 0.5028198193272364,
"learning_rate": 2.869319507772944e-05,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15030145645141602,
"step": 2805,
"valid_targets_mean": 2095.8,
"valid_targets_min": 785
},
{
"epoch": 2.9547844374342795,
"grad_norm": 0.47002781115846476,
"learning_rate": 2.864593938168192e-05,
"loss": 0.1293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09862858802080154,
"step": 2810,
"valid_targets_mean": 2946.2,
"valid_targets_min": 704
},
{
"epoch": 2.9600420609884335,
"grad_norm": 0.4208045480471127,
"learning_rate": 2.8598624249158367e-05,
"loss": 0.127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11026174575090408,
"step": 2815,
"valid_targets_mean": 2354.8,
"valid_targets_min": 1007
},
{
"epoch": 2.965299684542587,
"grad_norm": 0.5032185525146141,
"learning_rate": 2.855125000542647e-05,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1321502923965454,
"step": 2820,
"valid_targets_mean": 2240.6,
"valid_targets_min": 534
},
{
"epoch": 2.9705573080967405,
"grad_norm": 0.5984278705336151,
"learning_rate": 2.8503816976160278e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1949070245027542,
"step": 2825,
"valid_targets_mean": 2030.9,
"valid_targets_min": 617
},
{
"epoch": 2.975814931650894,
"grad_norm": 0.5263266410190764,
"learning_rate": 2.8456325487437966e-05,
"loss": 0.1167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14382363855838776,
"step": 2830,
"valid_targets_mean": 1991.5,
"valid_targets_min": 756
},
{
"epoch": 2.9810725552050474,
"grad_norm": 0.5704973107874455,
"learning_rate": 2.8408775865739578e-05,
"loss": 0.1396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14768922328948975,
"step": 2835,
"valid_targets_mean": 2084.1,
"valid_targets_min": 663
},
{
"epoch": 2.986330178759201,
"grad_norm": 1.354868766169001,
"learning_rate": 2.8361168437944817e-05,
"loss": 0.1294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11687695235013962,
"step": 2840,
"valid_targets_mean": 2189.9,
"valid_targets_min": 770
},
{
"epoch": 2.9915878023133544,
"grad_norm": 0.4454000055536909,
"learning_rate": 2.8313503531330738e-05,
"loss": 0.1322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.116331547498703,
"step": 2845,
"valid_targets_mean": 2591.7,
"valid_targets_min": 567
},
{
"epoch": 2.996845425867508,
"grad_norm": 0.47608492485548193,
"learning_rate": 2.826578147356956e-05,
"loss": 0.1344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14574572443962097,
"step": 2850,
"valid_targets_mean": 2241.3,
"valid_targets_min": 424
},
{
"epoch": 3.0021030494216614,
"grad_norm": 0.37543221439720614,
"learning_rate": 2.8218002592726384e-05,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09042000770568848,
"step": 2855,
"valid_targets_mean": 2471.9,
"valid_targets_min": 800
},
{
"epoch": 3.007360672975815,
"grad_norm": 0.3867744829037715,
"learning_rate": 2.8170167217256934e-05,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09279963374137878,
"step": 2860,
"valid_targets_mean": 2448.3,
"valid_targets_min": 750
},
{
"epoch": 3.0126182965299684,
"grad_norm": 0.6209496442639855,
"learning_rate": 2.8122275676005304e-05,
"loss": 0.11,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10986914485692978,
"step": 2865,
"valid_targets_mean": 2157.0,
"valid_targets_min": 717
},
{
"epoch": 3.017875920084122,
"grad_norm": 0.5264751158942041,
"learning_rate": 2.807432829820171e-05,
"loss": 0.1186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11469864100217819,
"step": 2870,
"valid_targets_mean": 1830.4,
"valid_targets_min": 655
},
{
"epoch": 3.0231335436382754,
"grad_norm": 0.5791651432594616,
"learning_rate": 2.8026325413460215e-05,
"loss": 0.1039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12092810869216919,
"step": 2875,
"valid_targets_mean": 2209.1,
"valid_targets_min": 531
},
{
"epoch": 3.028391167192429,
"grad_norm": 0.4982417563594433,
"learning_rate": 2.7978267351776448e-05,
"loss": 0.1035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11411077529191971,
"step": 2880,
"valid_targets_mean": 2098.4,
"valid_targets_min": 503
},
{
"epoch": 3.0336487907465823,
"grad_norm": 0.5054846435917808,
"learning_rate": 2.7930154443525377e-05,
"loss": 0.1062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10371555387973785,
"step": 2885,
"valid_targets_mean": 2441.1,
"valid_targets_min": 659
},
{
"epoch": 3.0389064143007363,
"grad_norm": 0.5643028378460608,
"learning_rate": 2.7881987019458992e-05,
"loss": 0.1147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11611708253622055,
"step": 2890,
"valid_targets_mean": 2507.9,
"valid_targets_min": 681
},
{
"epoch": 3.0441640378548898,
"grad_norm": 0.46661525602939896,
"learning_rate": 2.7833765410704062e-05,
"loss": 0.1231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10574992001056671,
"step": 2895,
"valid_targets_mean": 2452.1,
"valid_targets_min": 859
},
{
"epoch": 3.0494216614090432,
"grad_norm": 0.5695014108794103,
"learning_rate": 2.778548994875984e-05,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11309127509593964,
"step": 2900,
"valid_targets_mean": 1910.9,
"valid_targets_min": 576
},
{
"epoch": 3.0546792849631967,
"grad_norm": 0.6054482359044839,
"learning_rate": 2.7737160965495794e-05,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1620527058839798,
"step": 2905,
"valid_targets_mean": 1894.4,
"valid_targets_min": 592
},
{
"epoch": 3.0599369085173502,
"grad_norm": 0.42373977784435296,
"learning_rate": 2.768877879314935e-05,
"loss": 0.1065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09606526792049408,
"step": 2910,
"valid_targets_mean": 2880.1,
"valid_targets_min": 754
},
{
"epoch": 3.0651945320715037,
"grad_norm": 0.47407559737469196,
"learning_rate": 2.7640343764323535e-05,
"loss": 0.1129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1279953420162201,
"step": 2915,
"valid_targets_mean": 2508.9,
"valid_targets_min": 844
},
{
"epoch": 3.070452155625657,
"grad_norm": 0.47022824262052126,
"learning_rate": 2.7591856211984783e-05,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10582815110683441,
"step": 2920,
"valid_targets_mean": 2362.6,
"valid_targets_min": 742
},
{
"epoch": 3.0757097791798107,
"grad_norm": 0.5138691239266067,
"learning_rate": 2.7543316469460565e-05,
"loss": 0.1156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12330075353384018,
"step": 2925,
"valid_targets_mean": 2356.2,
"valid_targets_min": 1020
},
{
"epoch": 3.080967402733964,
"grad_norm": 0.5627899531526662,
"learning_rate": 2.7494724870437147e-05,
"loss": 0.0989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10817135870456696,
"step": 2930,
"valid_targets_mean": 1939.3,
"valid_targets_min": 671
},
{
"epoch": 3.0862250262881177,
"grad_norm": 0.48790272469825424,
"learning_rate": 2.7446081748957306e-05,
"loss": 0.1233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12890625,
"step": 2935,
"valid_targets_mean": 2308.4,
"valid_targets_min": 666
},
{
"epoch": 3.091482649842271,
"grad_norm": 0.4767590857823866,
"learning_rate": 2.7397387439417963e-05,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10541529953479767,
"step": 2940,
"valid_targets_mean": 2508.8,
"valid_targets_min": 560
},
{
"epoch": 3.0967402733964247,
"grad_norm": 0.5800784082688102,
"learning_rate": 2.7348642276567973e-05,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10997745394706726,
"step": 2945,
"valid_targets_mean": 2250.3,
"valid_targets_min": 843
},
{
"epoch": 3.101997896950578,
"grad_norm": 0.45880655045888574,
"learning_rate": 2.729984659550576e-05,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11031247675418854,
"step": 2950,
"valid_targets_mean": 2468.1,
"valid_targets_min": 722
},
{
"epoch": 3.107255520504732,
"grad_norm": 0.41165328973164356,
"learning_rate": 2.7251000731677035e-05,
"loss": 0.1157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11390068382024765,
"step": 2955,
"valid_targets_mean": 3014.0,
"valid_targets_min": 772
},
{
"epoch": 3.1125131440588856,
"grad_norm": 0.45786008725760097,
"learning_rate": 2.72021050208725e-05,
"loss": 0.1058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10765732824802399,
"step": 2960,
"valid_targets_mean": 2507.8,
"valid_targets_min": 942
},
{
"epoch": 3.117770767613039,
"grad_norm": 0.45714302538172386,
"learning_rate": 2.715315979922552e-05,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09677045047283173,
"step": 2965,
"valid_targets_mean": 2182.8,
"valid_targets_min": 663
},
{
"epoch": 3.1230283911671926,
"grad_norm": 0.43615604429160654,
"learning_rate": 2.7104165403209843e-05,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09897886961698532,
"step": 2970,
"valid_targets_mean": 2380.8,
"valid_targets_min": 855
},
{
"epoch": 3.128286014721346,
"grad_norm": 0.51168741619374,
"learning_rate": 2.7055122169637224e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11317049711942673,
"step": 2975,
"valid_targets_mean": 1858.6,
"valid_targets_min": 678
},
{
"epoch": 3.1335436382754995,
"grad_norm": 0.5353005078749653,
"learning_rate": 2.7006030435655205e-05,
"loss": 0.1034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12433994561433792,
"step": 2980,
"valid_targets_mean": 1898.4,
"valid_targets_min": 589
},
{
"epoch": 3.138801261829653,
"grad_norm": 0.528591390961327,
"learning_rate": 2.6956890538744703e-05,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13948772847652435,
"step": 2985,
"valid_targets_mean": 2319.1,
"valid_targets_min": 663
},
{
"epoch": 3.1440588853838065,
"grad_norm": 0.6092445235444702,
"learning_rate": 2.6907702816717742e-05,
"loss": 0.1024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10452305525541306,
"step": 2990,
"valid_targets_mean": 1885.6,
"valid_targets_min": 635
},
{
"epoch": 3.14931650893796,
"grad_norm": 0.4688279763065105,
"learning_rate": 2.685846760771513e-05,
"loss": 0.1129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0946442112326622,
"step": 2995,
"valid_targets_mean": 2200.3,
"valid_targets_min": 524
},
{
"epoch": 3.1545741324921135,
"grad_norm": 0.5277942062913996,
"learning_rate": 2.6809185250204113e-05,
"loss": 0.1192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12642043828964233,
"step": 3000,
"valid_targets_mean": 2345.7,
"valid_targets_min": 739
},
{
"epoch": 3.159831756046267,
"grad_norm": 0.42098600487501703,
"learning_rate": 2.6759856082976066e-05,
"loss": 0.1029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08629012852907181,
"step": 3005,
"valid_targets_mean": 2403.2,
"valid_targets_min": 538
},
{
"epoch": 3.1650893796004205,
"grad_norm": 0.4264989333170223,
"learning_rate": 2.6710480445144145e-05,
"loss": 0.0994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08005677163600922,
"step": 3010,
"valid_targets_mean": 2635.9,
"valid_targets_min": 669
},
{
"epoch": 3.170347003154574,
"grad_norm": 0.4855200009349899,
"learning_rate": 2.666105867614099e-05,
"loss": 0.1087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10743850469589233,
"step": 3015,
"valid_targets_mean": 2048.9,
"valid_targets_min": 740
},
{
"epoch": 3.1756046267087275,
"grad_norm": 0.49414628975394825,
"learning_rate": 2.6611591115716345e-05,
"loss": 0.1085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10523631423711777,
"step": 3020,
"valid_targets_mean": 2077.4,
"valid_targets_min": 765
},
{
"epoch": 3.1808622502628814,
"grad_norm": 0.4827349618984835,
"learning_rate": 2.6562078103934755e-05,
"loss": 0.1132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1223248541355133,
"step": 3025,
"valid_targets_mean": 2798.0,
"valid_targets_min": 761
},
{
"epoch": 3.186119873817035,
"grad_norm": 0.44893822320472543,
"learning_rate": 2.6512519981173238e-05,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11694766581058502,
"step": 3030,
"valid_targets_mean": 2648.8,
"valid_targets_min": 794
},
{
"epoch": 3.1913774973711884,
"grad_norm": 0.456199715287159,
"learning_rate": 2.64629170881189e-05,
"loss": 0.1249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10553974658250809,
"step": 3035,
"valid_targets_mean": 2706.0,
"valid_targets_min": 963
},
{
"epoch": 3.196635120925342,
"grad_norm": 0.556699588025355,
"learning_rate": 2.641326976576664e-05,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1373308151960373,
"step": 3040,
"valid_targets_mean": 1819.5,
"valid_targets_min": 638
},
{
"epoch": 3.2018927444794953,
"grad_norm": 0.4621425994561363,
"learning_rate": 2.6363578355416772e-05,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10977025330066681,
"step": 3045,
"valid_targets_mean": 1999.9,
"valid_targets_min": 606
},
{
"epoch": 3.207150368033649,
"grad_norm": 0.46886508326813897,
"learning_rate": 2.6313843198672712e-05,
"loss": 0.1222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10616603493690491,
"step": 3050,
"valid_targets_mean": 2238.6,
"valid_targets_min": 676
},
{
"epoch": 3.2124079915878023,
"grad_norm": 0.5332609131940856,
"learning_rate": 2.6264064637438585e-05,
"loss": 0.1152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1407933533191681,
"step": 3055,
"valid_targets_mean": 2192.1,
"valid_targets_min": 799
},
{
"epoch": 3.217665615141956,
"grad_norm": 0.4602700556613322,
"learning_rate": 2.6214243013916915e-05,
"loss": 0.1121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11290593445301056,
"step": 3060,
"valid_targets_mean": 2515.7,
"valid_targets_min": 617
},
{
"epoch": 3.2229232386961093,
"grad_norm": 0.5638522514752865,
"learning_rate": 2.616437867060627e-05,
"loss": 0.1124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13324710726737976,
"step": 3065,
"valid_targets_mean": 1787.2,
"valid_targets_min": 827
},
{
"epoch": 3.228180862250263,
"grad_norm": 0.5468573075365044,
"learning_rate": 2.6114471950298853e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13356804847717285,
"step": 3070,
"valid_targets_mean": 2297.2,
"valid_targets_min": 446
},
{
"epoch": 3.2334384858044163,
"grad_norm": 0.5244598391270896,
"learning_rate": 2.6064523196078248e-05,
"loss": 0.1195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11893997341394424,
"step": 3075,
"valid_targets_mean": 2030.5,
"valid_targets_min": 526
},
{
"epoch": 3.2386961093585698,
"grad_norm": 0.4816143508495792,
"learning_rate": 2.6014532751316937e-05,
"loss": 0.1048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11238957941532135,
"step": 3080,
"valid_targets_mean": 2355.4,
"valid_targets_min": 693
},
{
"epoch": 3.2439537329127233,
"grad_norm": 0.4589235822680556,
"learning_rate": 2.5964500959674057e-05,
"loss": 0.1054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1107926219701767,
"step": 3085,
"valid_targets_mean": 2607.0,
"valid_targets_min": 522
},
{
"epoch": 3.249211356466877,
"grad_norm": 0.6111473627885837,
"learning_rate": 2.5914428165092956e-05,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14418260753154755,
"step": 3090,
"valid_targets_mean": 1805.6,
"valid_targets_min": 756
},
{
"epoch": 3.2544689800210307,
"grad_norm": 0.5228830866818445,
"learning_rate": 2.5864314711798856e-05,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1501845270395279,
"step": 3095,
"valid_targets_mean": 2147.2,
"valid_targets_min": 774
},
{
"epoch": 3.259726603575184,
"grad_norm": 0.4137547276710081,
"learning_rate": 2.5814160944296495e-05,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10305169224739075,
"step": 3100,
"valid_targets_mean": 2493.4,
"valid_targets_min": 1067
},
{
"epoch": 3.2649842271293377,
"grad_norm": 0.4875334492181037,
"learning_rate": 2.5763967207367752e-05,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1528482884168625,
"step": 3105,
"valid_targets_mean": 2129.7,
"valid_targets_min": 548
},
{
"epoch": 3.270241850683491,
"grad_norm": 0.42032256315169425,
"learning_rate": 2.5713733846069272e-05,
"loss": 0.1022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11212792992591858,
"step": 3110,
"valid_targets_mean": 3008.8,
"valid_targets_min": 553
},
{
"epoch": 3.2754994742376446,
"grad_norm": 0.5234311888057125,
"learning_rate": 2.56634612057301e-05,
"loss": 0.1141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11078391969203949,
"step": 3115,
"valid_targets_mean": 2355.9,
"valid_targets_min": 727
},
{
"epoch": 3.280757097791798,
"grad_norm": 0.4941605261662112,
"learning_rate": 2.561314963194929e-05,
"loss": 0.121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1029837429523468,
"step": 3120,
"valid_targets_mean": 2144.1,
"valid_targets_min": 577
},
{
"epoch": 3.2860147213459516,
"grad_norm": 0.5397737652200215,
"learning_rate": 2.556279947059358e-05,
"loss": 0.1136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11686725914478302,
"step": 3125,
"valid_targets_mean": 2364.9,
"valid_targets_min": 823
},
{
"epoch": 3.291272344900105,
"grad_norm": 0.5271890184522846,
"learning_rate": 2.551241106779494e-05,
"loss": 0.1157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11344581842422485,
"step": 3130,
"valid_targets_mean": 2355.1,
"valid_targets_min": 780
},
{
"epoch": 3.2965299684542586,
"grad_norm": 0.4828514547087221,
"learning_rate": 2.5461984769948244e-05,
"loss": 0.1011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10826694220304489,
"step": 3135,
"valid_targets_mean": 2397.0,
"valid_targets_min": 682
},
{
"epoch": 3.301787592008412,
"grad_norm": 0.4564616846068297,
"learning_rate": 2.5411520923708874e-05,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10306870192289352,
"step": 3140,
"valid_targets_mean": 2625.2,
"valid_targets_min": 848
},
{
"epoch": 3.3070452155625656,
"grad_norm": 0.5426748992894767,
"learning_rate": 2.536101987599036e-05,
"loss": 0.1231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11682391911745071,
"step": 3145,
"valid_targets_mean": 1922.8,
"valid_targets_min": 719
},
{
"epoch": 3.312302839116719,
"grad_norm": 0.47639365158347863,
"learning_rate": 2.5310481973961935e-05,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10468867421150208,
"step": 3150,
"valid_targets_mean": 2201.1,
"valid_targets_min": 619
},
{
"epoch": 3.3175604626708726,
"grad_norm": 0.6085747776983041,
"learning_rate": 2.5259907565046217e-05,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12527263164520264,
"step": 3155,
"valid_targets_mean": 1836.1,
"valid_targets_min": 724
},
{
"epoch": 3.322818086225026,
"grad_norm": 0.6218410011450068,
"learning_rate": 2.5209296996916774e-05,
"loss": 0.1117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14689847826957703,
"step": 3160,
"valid_targets_mean": 1895.2,
"valid_targets_min": 776
},
{
"epoch": 3.32807570977918,
"grad_norm": 0.4316088953474699,
"learning_rate": 2.5158650617495753e-05,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09639740735292435,
"step": 3165,
"valid_targets_mean": 2720.7,
"valid_targets_min": 825
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.48262081877527613,
"learning_rate": 2.5107968774951504e-05,
"loss": 0.1234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10296712815761566,
"step": 3170,
"valid_targets_mean": 2184.6,
"valid_targets_min": 599
},
{
"epoch": 3.338590956887487,
"grad_norm": 0.5673609650493359,
"learning_rate": 2.5057251817696138e-05,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17327016592025757,
"step": 3175,
"valid_targets_mean": 2122.7,
"valid_targets_min": 668
},
{
"epoch": 3.3438485804416405,
"grad_norm": 0.5457146473443527,
"learning_rate": 2.5006500094383176e-05,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12017304450273514,
"step": 3180,
"valid_targets_mean": 2251.6,
"valid_targets_min": 244
},
{
"epoch": 3.349106203995794,
"grad_norm": 0.5630254459809951,
"learning_rate": 2.4955713953905155e-05,
"loss": 0.1216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11483124643564224,
"step": 3185,
"valid_targets_mean": 1662.8,
"valid_targets_min": 634
},
{
"epoch": 3.3543638275499474,
"grad_norm": 0.381805633766247,
"learning_rate": 2.490489374539118e-05,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09102381765842438,
"step": 3190,
"valid_targets_mean": 2875.4,
"valid_targets_min": 516
},
{
"epoch": 3.359621451104101,
"grad_norm": 0.5433769005754793,
"learning_rate": 2.4854039818204577e-05,
"loss": 0.12,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1219017282128334,
"step": 3195,
"valid_targets_mean": 2152.2,
"valid_targets_min": 795
},
{
"epoch": 3.3648790746582544,
"grad_norm": 0.46582062688416787,
"learning_rate": 2.480315252194047e-05,
"loss": 0.1078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1032124012708664,
"step": 3200,
"valid_targets_mean": 2366.8,
"valid_targets_min": 504
},
{
"epoch": 3.370136698212408,
"grad_norm": 0.528744079370394,
"learning_rate": 2.4752232206423387e-05,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11800310015678406,
"step": 3205,
"valid_targets_mean": 2031.2,
"valid_targets_min": 605
},
{
"epoch": 3.3753943217665614,
"grad_norm": 0.4052584478950322,
"learning_rate": 2.4701279221704812e-05,
"loss": 0.1025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10734105855226517,
"step": 3210,
"valid_targets_mean": 2741.9,
"valid_targets_min": 756
},
{
"epoch": 3.380651945320715,
"grad_norm": 0.5342731178889146,
"learning_rate": 2.4650293918060845e-05,
"loss": 0.1099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12310801446437836,
"step": 3215,
"valid_targets_mean": 2361.0,
"valid_targets_min": 725
},
{
"epoch": 3.3859095688748684,
"grad_norm": 0.4072106829611508,
"learning_rate": 2.4599276645989763e-05,
"loss": 0.1019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09146159887313843,
"step": 3220,
"valid_targets_mean": 2975.6,
"valid_targets_min": 1024
},
{
"epoch": 3.3911671924290223,
"grad_norm": 0.5105330409760318,
"learning_rate": 2.4548227756209593e-05,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11646340042352676,
"step": 3225,
"valid_targets_mean": 2077.1,
"valid_targets_min": 660
},
{
"epoch": 3.396424815983176,
"grad_norm": 0.5041477703196249,
"learning_rate": 2.4497147599655726e-05,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10835779458284378,
"step": 3230,
"valid_targets_mean": 1994.6,
"valid_targets_min": 694
},
{
"epoch": 3.4016824395373293,
"grad_norm": 0.41879217149919973,
"learning_rate": 2.44460365274785e-05,
"loss": 0.112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10331692546606064,
"step": 3235,
"valid_targets_mean": 2441.9,
"valid_targets_min": 722
},
{
"epoch": 3.406940063091483,
"grad_norm": 0.4974378539269013,
"learning_rate": 2.4394894891040774e-05,
"loss": 0.1129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12304258346557617,
"step": 3240,
"valid_targets_mean": 2316.9,
"valid_targets_min": 801
},
{
"epoch": 3.4121976866456363,
"grad_norm": 0.48344036663308226,
"learning_rate": 2.434372304191553e-05,
"loss": 0.115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10580900311470032,
"step": 3245,
"valid_targets_mean": 2243.6,
"valid_targets_min": 518
},
{
"epoch": 3.4174553101997898,
"grad_norm": 0.5659622930062288,
"learning_rate": 2.4292521331883432e-05,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12814448773860931,
"step": 3250,
"valid_targets_mean": 2061.2,
"valid_targets_min": 457
},
{
"epoch": 3.4227129337539433,
"grad_norm": 0.5570555041473756,
"learning_rate": 2.4241290112930448e-05,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09381797164678574,
"step": 3255,
"valid_targets_mean": 2421.0,
"valid_targets_min": 708
},
{
"epoch": 3.4279705573080967,
"grad_norm": 0.39135406975269277,
"learning_rate": 2.4190029737245368e-05,
"loss": 0.1092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08433152735233307,
"step": 3260,
"valid_targets_mean": 2685.0,
"valid_targets_min": 744
},
{
"epoch": 3.4332281808622502,
"grad_norm": 0.41613582732082494,
"learning_rate": 2.4138740557217462e-05,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0847037136554718,
"step": 3265,
"valid_targets_mean": 2542.6,
"valid_targets_min": 1081
},
{
"epoch": 3.4384858044164037,
"grad_norm": 0.5697380084850582,
"learning_rate": 2.4087422925433988e-05,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17015275359153748,
"step": 3270,
"valid_targets_mean": 1940.0,
"valid_targets_min": 744
},
{
"epoch": 3.443743427970557,
"grad_norm": 0.5376585662140428,
"learning_rate": 2.4036077194677803e-05,
"loss": 0.1183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12273421138525009,
"step": 3275,
"valid_targets_mean": 2094.6,
"valid_targets_min": 883
},
{
"epoch": 3.4490010515247107,
"grad_norm": 0.4830615663735012,
"learning_rate": 2.3984703717924932e-05,
"loss": 0.1054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1146085113286972,
"step": 3280,
"valid_targets_mean": 2269.4,
"valid_targets_min": 531
},
{
"epoch": 3.454258675078864,
"grad_norm": 0.4182520811536129,
"learning_rate": 2.3933302848342127e-05,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07924157381057739,
"step": 3285,
"valid_targets_mean": 1966.1,
"valid_targets_min": 672
},
{
"epoch": 3.4595162986330177,
"grad_norm": 0.4179138319288651,
"learning_rate": 2.388187493928447e-05,
"loss": 0.1104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0936025008559227,
"step": 3290,
"valid_targets_mean": 2802.2,
"valid_targets_min": 814
},
{
"epoch": 3.464773922187171,
"grad_norm": 0.3909002047938263,
"learning_rate": 2.3830420344292922e-05,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08706749975681305,
"step": 3295,
"valid_targets_mean": 3199.2,
"valid_targets_min": 779
},
{
"epoch": 3.470031545741325,
"grad_norm": 0.5313132582685511,
"learning_rate": 2.377893941709189e-05,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11644217371940613,
"step": 3300,
"valid_targets_mean": 2117.6,
"valid_targets_min": 662
},
{
"epoch": 3.4752891692954786,
"grad_norm": 0.4134644980708326,
"learning_rate": 2.3727432511586802e-05,
"loss": 0.1043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08773890882730484,
"step": 3305,
"valid_targets_mean": 2414.2,
"valid_targets_min": 536
},
{
"epoch": 3.480546792849632,
"grad_norm": 0.4316140203587372,
"learning_rate": 2.3675899981861675e-05,
"loss": 0.1223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11186422407627106,
"step": 3310,
"valid_targets_mean": 2549.9,
"valid_targets_min": 530
},
{
"epoch": 3.4858044164037856,
"grad_norm": 0.5011652105314757,
"learning_rate": 2.362434218217668e-05,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13110128045082092,
"step": 3315,
"valid_targets_mean": 2335.2,
"valid_targets_min": 484
},
{
"epoch": 3.491062039957939,
"grad_norm": 0.5743042549172922,
"learning_rate": 2.3572759466965706e-05,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13477513194084167,
"step": 3320,
"valid_targets_mean": 1921.1,
"valid_targets_min": 753
},
{
"epoch": 3.4963196635120926,
"grad_norm": 0.5401670010598917,
"learning_rate": 2.3521152190833934e-05,
"loss": 0.111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13402019441127777,
"step": 3325,
"valid_targets_mean": 1708.1,
"valid_targets_min": 715
},
{
"epoch": 3.501577287066246,
"grad_norm": 0.43785527071182206,
"learning_rate": 2.346952070855537e-05,
"loss": 0.1043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09364502131938934,
"step": 3330,
"valid_targets_mean": 2542.5,
"valid_targets_min": 727
},
{
"epoch": 3.5068349106203995,
"grad_norm": 0.506466021212808,
"learning_rate": 2.3417865375070433e-05,
"loss": 0.1134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11375842988491058,
"step": 3335,
"valid_targets_mean": 2114.2,
"valid_targets_min": 758
},
{
"epoch": 3.512092534174553,
"grad_norm": 0.4688424357662533,
"learning_rate": 2.336618654548352e-05,
"loss": 0.111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11045517772436142,
"step": 3340,
"valid_targets_mean": 2478.2,
"valid_targets_min": 729
},
{
"epoch": 3.5173501577287065,
"grad_norm": 0.42670263102723194,
"learning_rate": 2.331448457506053e-05,
"loss": 0.1185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09782717376947403,
"step": 3345,
"valid_targets_mean": 2741.0,
"valid_targets_min": 726
},
{
"epoch": 3.52260778128286,
"grad_norm": 0.43500495067088274,
"learning_rate": 2.326275981922645e-05,
"loss": 0.1076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09490084648132324,
"step": 3350,
"valid_targets_mean": 2736.9,
"valid_targets_min": 858
},
{
"epoch": 3.527865404837014,
"grad_norm": 0.5319946974987949,
"learning_rate": 2.3211012633562923e-05,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11997735500335693,
"step": 3355,
"valid_targets_mean": 1953.1,
"valid_targets_min": 424
},
{
"epoch": 3.5331230283911674,
"grad_norm": 0.49363023614899704,
"learning_rate": 2.3159243373805764e-05,
"loss": 0.129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12348274141550064,
"step": 3360,
"valid_targets_mean": 2254.8,
"valid_targets_min": 871
},
{
"epoch": 3.538380651945321,
"grad_norm": 0.42833169020835166,
"learning_rate": 2.3107452395842542e-05,
"loss": 0.1092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0981355607509613,
"step": 3365,
"valid_targets_mean": 2488.3,
"valid_targets_min": 744
},
{
"epoch": 3.5436382754994744,
"grad_norm": 0.5084986816088525,
"learning_rate": 2.3055640055710132e-05,
"loss": 0.1064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12088331580162048,
"step": 3370,
"valid_targets_mean": 2525.2,
"valid_targets_min": 719
},
{
"epoch": 3.548895899053628,
"grad_norm": 0.4693403284495062,
"learning_rate": 2.3003806709592268e-05,
"loss": 0.1118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12300702929496765,
"step": 3375,
"valid_targets_mean": 2723.6,
"valid_targets_min": 918
},
{
"epoch": 3.5541535226077814,
"grad_norm": 0.4701124182890195,
"learning_rate": 2.295195271381707e-05,
"loss": 0.1013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10778406262397766,
"step": 3380,
"valid_targets_mean": 2073.8,
"valid_targets_min": 583
},
{
"epoch": 3.559411146161935,
"grad_norm": 0.42889386294241544,
"learning_rate": 2.290007842485463e-05,
"loss": 0.1188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10507388412952423,
"step": 3385,
"valid_targets_mean": 2516.1,
"valid_targets_min": 1145
},
{
"epoch": 3.5646687697160884,
"grad_norm": 0.41625842374711514,
"learning_rate": 2.2848184199314546e-05,
"loss": 0.1087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09518253058195114,
"step": 3390,
"valid_targets_mean": 2691.8,
"valid_targets_min": 872
},
{
"epoch": 3.569926393270242,
"grad_norm": 0.4387018710353009,
"learning_rate": 2.2796270393943472e-05,
"loss": 0.1215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09436045587062836,
"step": 3395,
"valid_targets_mean": 2296.1,
"valid_targets_min": 554
},
{
"epoch": 3.5751840168243953,
"grad_norm": 0.5495356752582214,
"learning_rate": 2.274433736562264e-05,
"loss": 0.1244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11270991712808609,
"step": 3400,
"valid_targets_mean": 1764.7,
"valid_targets_min": 647
},
{
"epoch": 3.580441640378549,
"grad_norm": 0.617043044531592,
"learning_rate": 2.2692385471365465e-05,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1819651871919632,
"step": 3405,
"valid_targets_mean": 1844.1,
"valid_targets_min": 512
},
{
"epoch": 3.5856992639327023,
"grad_norm": 0.4855141371569252,
"learning_rate": 2.264041506831503e-05,
"loss": 0.1156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11603636294603348,
"step": 3410,
"valid_targets_mean": 2135.2,
"valid_targets_min": 637
},
{
"epoch": 3.590956887486856,
"grad_norm": 0.8413069803155135,
"learning_rate": 2.258842651374166e-05,
"loss": 0.1098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10120347142219543,
"step": 3415,
"valid_targets_mean": 2140.9,
"valid_targets_min": 588
},
{
"epoch": 3.5962145110410093,
"grad_norm": 0.4302795627289212,
"learning_rate": 2.2536420165040478e-05,
"loss": 0.1156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10650207847356796,
"step": 3420,
"valid_targets_mean": 2953.6,
"valid_targets_min": 800
},
{
"epoch": 3.601472134595163,
"grad_norm": 0.5333965110826944,
"learning_rate": 2.248439637972892e-05,
"loss": 0.1017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10774208605289459,
"step": 3425,
"valid_targets_mean": 2051.7,
"valid_targets_min": 676
},
{
"epoch": 3.6067297581493163,
"grad_norm": 0.6500026102597213,
"learning_rate": 2.2432355515444284e-05,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1189243346452713,
"step": 3430,
"valid_targets_mean": 2236.4,
"valid_targets_min": 689
},
{
"epoch": 3.61198738170347,
"grad_norm": 0.6391587477739512,
"learning_rate": 2.2380297929941296e-05,
"loss": 0.1151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1473112851381302,
"step": 3435,
"valid_targets_mean": 2142.1,
"valid_targets_min": 793
},
{
"epoch": 3.6172450052576237,
"grad_norm": 0.5622590899080744,
"learning_rate": 2.2328223981089613e-05,
"loss": 0.1107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11607543379068375,
"step": 3440,
"valid_targets_mean": 1869.6,
"valid_targets_min": 663
},
{
"epoch": 3.622502628811777,
"grad_norm": 0.5499942253003627,
"learning_rate": 2.2276134026871393e-05,
"loss": 0.1069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10942299664020538,
"step": 3445,
"valid_targets_mean": 1989.9,
"valid_targets_min": 623
},
{
"epoch": 3.6277602523659307,
"grad_norm": 0.4419057507126453,
"learning_rate": 2.222402842537882e-05,
"loss": 0.1214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10143234580755234,
"step": 3450,
"valid_targets_mean": 2870.7,
"valid_targets_min": 828
},
{
"epoch": 3.633017875920084,
"grad_norm": 0.5610153093195461,
"learning_rate": 2.2171907534811652e-05,
"loss": 0.1238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1339399665594101,
"step": 3455,
"valid_targets_mean": 1753.9,
"valid_targets_min": 610
},
{
"epoch": 3.6382754994742377,
"grad_norm": 0.5397426958527057,
"learning_rate": 2.2119771713474732e-05,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15266606211662292,
"step": 3460,
"valid_targets_mean": 2078.9,
"valid_targets_min": 777
},
{
"epoch": 3.643533123028391,
"grad_norm": 0.5005898238491538,
"learning_rate": 2.2067621319775564e-05,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10755124688148499,
"step": 3465,
"valid_targets_mean": 2634.8,
"valid_targets_min": 696
},
{
"epoch": 3.6487907465825447,
"grad_norm": 0.484003042738071,
"learning_rate": 2.201545671222183e-05,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11154371500015259,
"step": 3470,
"valid_targets_mean": 2315.6,
"valid_targets_min": 615
},
{
"epoch": 3.654048370136698,
"grad_norm": 0.5368915771584432,
"learning_rate": 2.1963278249418894e-05,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12409842014312744,
"step": 3475,
"valid_targets_mean": 2165.6,
"valid_targets_min": 680
},
{
"epoch": 3.6593059936908516,
"grad_norm": 0.5311406165106639,
"learning_rate": 2.191108629006742e-05,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14158453047275543,
"step": 3480,
"valid_targets_mean": 2103.0,
"valid_targets_min": 632
},
{
"epoch": 3.664563617245005,
"grad_norm": 0.5172911807540274,
"learning_rate": 2.1858881192960814e-05,
"loss": 0.1381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11360710859298706,
"step": 3485,
"valid_targets_mean": 2339.9,
"valid_targets_min": 736
},
{
"epoch": 3.669821240799159,
"grad_norm": 0.450828554054094,
"learning_rate": 2.180666331698281e-05,
"loss": 0.126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09024304151535034,
"step": 3490,
"valid_targets_mean": 1989.1,
"valid_targets_min": 738
},
{
"epoch": 3.6750788643533125,
"grad_norm": 0.42913794636854274,
"learning_rate": 2.1754433021104985e-05,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09447701275348663,
"step": 3495,
"valid_targets_mean": 2427.8,
"valid_targets_min": 577
},
{
"epoch": 3.680336487907466,
"grad_norm": 0.48945098109108737,
"learning_rate": 2.170219066438431e-05,
"loss": 0.1313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1112595796585083,
"step": 3500,
"valid_targets_mean": 2368.2,
"valid_targets_min": 921
},
{
"epoch": 3.6855941114616195,
"grad_norm": 0.4640547924807341,
"learning_rate": 2.164993660596065e-05,
"loss": 0.1196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10272429883480072,
"step": 3505,
"valid_targets_mean": 2218.4,
"valid_targets_min": 593
},
{
"epoch": 3.690851735015773,
"grad_norm": 0.45129110336924744,
"learning_rate": 2.1597671205054326e-05,
"loss": 0.1199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10291942954063416,
"step": 3510,
"valid_targets_mean": 2482.1,
"valid_targets_min": 790
},
{
"epoch": 3.6961093585699265,
"grad_norm": 0.45704894891573966,
"learning_rate": 2.1545394820963637e-05,
"loss": 0.1075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12160168588161469,
"step": 3515,
"valid_targets_mean": 2036.5,
"valid_targets_min": 811
},
{
"epoch": 3.70136698212408,
"grad_norm": 0.42569844935970896,
"learning_rate": 2.149310781306237e-05,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09846076369285583,
"step": 3520,
"valid_targets_mean": 2688.5,
"valid_targets_min": 888
},
{
"epoch": 3.7066246056782335,
"grad_norm": 0.48318716646802223,
"learning_rate": 2.1440810540797354e-05,
"loss": 0.1193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10648829489946365,
"step": 3525,
"valid_targets_mean": 1977.8,
"valid_targets_min": 734
},
{
"epoch": 3.711882229232387,
"grad_norm": 0.4567306404867012,
"learning_rate": 2.1388503363685985e-05,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09814627468585968,
"step": 3530,
"valid_targets_mean": 2088.6,
"valid_targets_min": 806
},
{
"epoch": 3.7171398527865405,
"grad_norm": 0.4633234764201535,
"learning_rate": 2.133618664131374e-05,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12074621021747589,
"step": 3535,
"valid_targets_mean": 2728.8,
"valid_targets_min": 768
},
{
"epoch": 3.722397476340694,
"grad_norm": 0.5596045588771613,
"learning_rate": 2.1283860733331722e-05,
"loss": 0.1133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12292230129241943,
"step": 3540,
"valid_targets_mean": 1893.4,
"valid_targets_min": 728
},
{
"epoch": 3.7276550998948474,
"grad_norm": 0.5165796220257279,
"learning_rate": 2.123152599945417e-05,
"loss": 0.1053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13469788432121277,
"step": 3545,
"valid_targets_mean": 2299.9,
"valid_targets_min": 711
},
{
"epoch": 3.732912723449001,
"grad_norm": 0.5214436389330018,
"learning_rate": 2.1179182799456024e-05,
"loss": 0.1192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13773241639137268,
"step": 3550,
"valid_targets_mean": 2166.2,
"valid_targets_min": 567
},
{
"epoch": 3.7381703470031544,
"grad_norm": 0.47108735926186085,
"learning_rate": 2.112683149317039e-05,
"loss": 0.1121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10124912858009338,
"step": 3555,
"valid_targets_mean": 2148.1,
"valid_targets_min": 806
},
{
"epoch": 3.743427970557308,
"grad_norm": 0.5298200427399173,
"learning_rate": 2.1074472440486118e-05,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12113603949546814,
"step": 3560,
"valid_targets_mean": 2554.8,
"valid_targets_min": 1019
},
{
"epoch": 3.7486855941114614,
"grad_norm": 0.5287256188647269,
"learning_rate": 2.102210600134531e-05,
"loss": 0.1103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11768949776887894,
"step": 3565,
"valid_targets_mean": 1844.4,
"valid_targets_min": 699
},
{
"epoch": 3.753943217665615,
"grad_norm": 0.5743303600551449,
"learning_rate": 2.096973253574084e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.121823251247406,
"step": 3570,
"valid_targets_mean": 1913.6,
"valid_targets_min": 509
},
{
"epoch": 3.759200841219769,
"grad_norm": 0.5949343625302866,
"learning_rate": 2.09173524037139e-05,
"loss": 0.1254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12200993299484253,
"step": 3575,
"valid_targets_mean": 2039.6,
"valid_targets_min": 549
},
{
"epoch": 3.7644584647739223,
"grad_norm": 0.4963455031579976,
"learning_rate": 2.0864965965351495e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11638784408569336,
"step": 3580,
"valid_targets_mean": 2245.8,
"valid_targets_min": 764
},
{
"epoch": 3.769716088328076,
"grad_norm": 0.4025297249017998,
"learning_rate": 2.081257358078398e-05,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0868837982416153,
"step": 3585,
"valid_targets_mean": 2853.3,
"valid_targets_min": 613
},
{
"epoch": 3.7749737118822293,
"grad_norm": 0.433132265132753,
"learning_rate": 2.0760175610182613e-05,
"loss": 0.1159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09999372065067291,
"step": 3590,
"valid_targets_mean": 2332.7,
"valid_targets_min": 622
},
{
"epoch": 3.780231335436383,
"grad_norm": 0.5475012338379195,
"learning_rate": 2.0707772413757016e-05,
"loss": 0.1092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11299513280391693,
"step": 3595,
"valid_targets_mean": 1802.6,
"valid_targets_min": 700
},
{
"epoch": 3.7854889589905363,
"grad_norm": 0.5507554370926947,
"learning_rate": 2.0655364351752763e-05,
"loss": 0.1112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11380542814731598,
"step": 3600,
"valid_targets_mean": 2031.1,
"valid_targets_min": 605
},
{
"epoch": 3.7907465825446898,
"grad_norm": 0.49997009617727645,
"learning_rate": 2.060295178444887e-05,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11200733482837677,
"step": 3605,
"valid_targets_mean": 2119.8,
"valid_targets_min": 743
},
{
"epoch": 3.7960042060988433,
"grad_norm": 0.4496140670419227,
"learning_rate": 2.055053507215533e-05,
"loss": 0.1184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08896288275718689,
"step": 3610,
"valid_targets_mean": 2048.6,
"valid_targets_min": 570
},
{
"epoch": 3.8012618296529967,
"grad_norm": 0.4047396865904987,
"learning_rate": 2.049811457521061e-05,
"loss": 0.1074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09981025755405426,
"step": 3615,
"valid_targets_mean": 3184.6,
"valid_targets_min": 948
},
{
"epoch": 3.8065194532071502,
"grad_norm": 0.5430555562663548,
"learning_rate": 2.0445690653979216e-05,
"loss": 0.1171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14627373218536377,
"step": 3620,
"valid_targets_mean": 2295.7,
"valid_targets_min": 665
},
{
"epoch": 3.8117770767613037,
"grad_norm": 0.5403404648686355,
"learning_rate": 2.039326366884919e-05,
"loss": 0.1145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12071286886930466,
"step": 3625,
"valid_targets_mean": 2385.2,
"valid_targets_min": 768
},
{
"epoch": 3.8170347003154577,
"grad_norm": 0.4690895172622104,
"learning_rate": 2.034083398022963e-05,
"loss": 0.1157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09785957634449005,
"step": 3630,
"valid_targets_mean": 2378.1,
"valid_targets_min": 741
},
{
"epoch": 3.822292323869611,
"grad_norm": 0.5620241182263188,
"learning_rate": 2.028840194854822e-05,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10536280274391174,
"step": 3635,
"valid_targets_mean": 2182.9,
"valid_targets_min": 791
},
{
"epoch": 3.8275499474237646,
"grad_norm": 0.5190966653328027,
"learning_rate": 2.0235967934248756e-05,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10840453207492828,
"step": 3640,
"valid_targets_mean": 1759.5,
"valid_targets_min": 593
},
{
"epoch": 3.832807570977918,
"grad_norm": 0.5650132555883536,
"learning_rate": 2.018353229778867e-05,
"loss": 0.1061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11311180889606476,
"step": 3645,
"valid_targets_mean": 2058.0,
"valid_targets_min": 720
},
{
"epoch": 3.8380651945320716,
"grad_norm": 0.5538497201770207,
"learning_rate": 2.0131095399636522e-05,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1371322125196457,
"step": 3650,
"valid_targets_mean": 2529.8,
"valid_targets_min": 645
},
{
"epoch": 3.843322818086225,
"grad_norm": 0.4895615071833436,
"learning_rate": 2.0078657600269573e-05,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11361433565616608,
"step": 3655,
"valid_targets_mean": 2241.3,
"valid_targets_min": 874
},
{
"epoch": 3.8485804416403786,
"grad_norm": 0.6588429282327887,
"learning_rate": 2.0026219260171262e-05,
"loss": 0.1119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0961027517914772,
"step": 3660,
"valid_targets_mean": 2566.3,
"valid_targets_min": 851
},
{
"epoch": 3.853838065194532,
"grad_norm": 0.47105340408588986,
"learning_rate": 1.9973780739828748e-05,
"loss": 0.1084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10666951537132263,
"step": 3665,
"valid_targets_mean": 2143.0,
"valid_targets_min": 387
},
{
"epoch": 3.8590956887486856,
"grad_norm": 0.5702963870389707,
"learning_rate": 1.9921342399730433e-05,
"loss": 0.1086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14022137224674225,
"step": 3670,
"valid_targets_mean": 2051.1,
"valid_targets_min": 612
},
{
"epoch": 3.864353312302839,
"grad_norm": 0.5293206117699157,
"learning_rate": 1.9868904600363485e-05,
"loss": 0.1182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12130927294492722,
"step": 3675,
"valid_targets_mean": 2072.1,
"valid_targets_min": 637
},
{
"epoch": 3.8696109358569926,
"grad_norm": 0.4711162921626716,
"learning_rate": 1.9816467702211342e-05,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10494031012058258,
"step": 3680,
"valid_targets_mean": 2328.9,
"valid_targets_min": 591
},
{
"epoch": 3.874868559411146,
"grad_norm": 0.5227397705947019,
"learning_rate": 1.9764032065751248e-05,
"loss": 0.1183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12430229038000107,
"step": 3685,
"valid_targets_mean": 2161.8,
"valid_targets_min": 602
},
{
"epoch": 3.8801261829652995,
"grad_norm": 0.5021498222245417,
"learning_rate": 1.971159805145178e-05,
"loss": 0.1142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09423937648534775,
"step": 3690,
"valid_targets_mean": 2945.0,
"valid_targets_min": 1222
},
{
"epoch": 3.885383806519453,
"grad_norm": 0.5460546825082218,
"learning_rate": 1.965916601977038e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13521108031272888,
"step": 3695,
"valid_targets_mean": 2023.5,
"valid_targets_min": 727
},
{
"epoch": 3.8906414300736065,
"grad_norm": 0.49704541316839473,
"learning_rate": 1.9606736331150812e-05,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15039195120334625,
"step": 3700,
"valid_targets_mean": 2282.1,
"valid_targets_min": 821
},
{
"epoch": 3.89589905362776,
"grad_norm": 0.41486339884353696,
"learning_rate": 1.9554309346020784e-05,
"loss": 0.1023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09099794924259186,
"step": 3705,
"valid_targets_mean": 2675.0,
"valid_targets_min": 702
},
{
"epoch": 3.9011566771819135,
"grad_norm": 0.6737944729650831,
"learning_rate": 1.9501885424789394e-05,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13288956880569458,
"step": 3710,
"valid_targets_mean": 1693.2,
"valid_targets_min": 639
},
{
"epoch": 3.9064143007360674,
"grad_norm": 0.4674025231220049,
"learning_rate": 1.9449464927844677e-05,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11063611507415771,
"step": 3715,
"valid_targets_mean": 2003.1,
"valid_targets_min": 660
},
{
"epoch": 3.911671924290221,
"grad_norm": 0.5231541405838046,
"learning_rate": 1.939704821555113e-05,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14501771330833435,
"step": 3720,
"valid_targets_mean": 2228.4,
"valid_targets_min": 759
},
{
"epoch": 3.9169295478443744,
"grad_norm": 0.4817907114246795,
"learning_rate": 1.9344635648247244e-05,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11101260036230087,
"step": 3725,
"valid_targets_mean": 2157.5,
"valid_targets_min": 838
},
{
"epoch": 3.922187171398528,
"grad_norm": 0.48005352400351275,
"learning_rate": 1.9292227586242994e-05,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09855275601148605,
"step": 3730,
"valid_targets_mean": 2368.6,
"valid_targets_min": 568
},
{
"epoch": 3.9274447949526814,
"grad_norm": 0.494870153962298,
"learning_rate": 1.9239824389817397e-05,
"loss": 0.1136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12282229959964752,
"step": 3735,
"valid_targets_mean": 2194.5,
"valid_targets_min": 842
},
{
"epoch": 3.932702418506835,
"grad_norm": 0.4216307061748337,
"learning_rate": 1.9187426419216026e-05,
"loss": 0.1215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11283373832702637,
"step": 3740,
"valid_targets_mean": 2860.7,
"valid_targets_min": 964
},
{
"epoch": 3.9379600420609884,
"grad_norm": 0.5487288710827547,
"learning_rate": 1.9135034034648515e-05,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10530532896518707,
"step": 3745,
"valid_targets_mean": 2240.8,
"valid_targets_min": 610
},
{
"epoch": 3.943217665615142,
"grad_norm": 0.5334742046006723,
"learning_rate": 1.90826475962861e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1639787256717682,
"step": 3750,
"valid_targets_mean": 2194.3,
"valid_targets_min": 821
},
{
"epoch": 3.9484752891692954,
"grad_norm": 0.44471418938462315,
"learning_rate": 1.9030267464259164e-05,
"loss": 0.1175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09661805629730225,
"step": 3755,
"valid_targets_mean": 2463.7,
"valid_targets_min": 685
},
{
"epoch": 3.953732912723449,
"grad_norm": 0.6863647602242162,
"learning_rate": 1.8977893998654692e-05,
"loss": 0.1257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17349067330360413,
"step": 3760,
"valid_targets_mean": 1545.1,
"valid_targets_min": 727
},
{
"epoch": 3.958990536277603,
"grad_norm": 0.42976635890436815,
"learning_rate": 1.8925527559513886e-05,
"loss": 0.1035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09973946213722229,
"step": 3765,
"valid_targets_mean": 2579.3,
"valid_targets_min": 1034
},
{
"epoch": 3.9642481598317563,
"grad_norm": 0.46378885918678187,
"learning_rate": 1.8873168506829614e-05,
"loss": 0.1263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11329721659421921,
"step": 3770,
"valid_targets_mean": 2522.1,
"valid_targets_min": 990
},
{
"epoch": 3.9695057833859098,
"grad_norm": 0.4320207799742031,
"learning_rate": 1.882081720054398e-05,
"loss": 0.1085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1261582225561142,
"step": 3775,
"valid_targets_mean": 2518.4,
"valid_targets_min": 1007
},
{
"epoch": 3.9747634069400632,
"grad_norm": 0.5393454576994771,
"learning_rate": 1.876847400054583e-05,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11026948690414429,
"step": 3780,
"valid_targets_mean": 1841.8,
"valid_targets_min": 570
},
{
"epoch": 3.9800210304942167,
"grad_norm": 0.47994326215344363,
"learning_rate": 1.8716139266668288e-05,
"loss": 0.1046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.094925656914711,
"step": 3785,
"valid_targets_mean": 2411.9,
"valid_targets_min": 658
},
{
"epoch": 3.9852786540483702,
"grad_norm": 0.47213110501326233,
"learning_rate": 1.8663813358686267e-05,
"loss": 0.1142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13710609078407288,
"step": 3790,
"valid_targets_mean": 2730.3,
"valid_targets_min": 580
},
{
"epoch": 3.9905362776025237,
"grad_norm": 0.5508226364276274,
"learning_rate": 1.8611496636314025e-05,
"loss": 0.1182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10945984721183777,
"step": 3795,
"valid_targets_mean": 2272.2,
"valid_targets_min": 876
},
{
"epoch": 3.995793901156677,
"grad_norm": 0.4802520009795041,
"learning_rate": 1.8559189459202653e-05,
"loss": 0.108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10392237454652786,
"step": 3800,
"valid_targets_mean": 2118.9,
"valid_targets_min": 674
},
{
"epoch": 4.001051524710831,
"grad_norm": 0.6154016743647607,
"learning_rate": 1.8506892186937636e-05,
"loss": 0.1167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12505027651786804,
"step": 3805,
"valid_targets_mean": 1623.6,
"valid_targets_min": 609
},
{
"epoch": 4.006309148264984,
"grad_norm": 0.4187162914832128,
"learning_rate": 1.845460517903637e-05,
"loss": 0.0934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08397223055362701,
"step": 3810,
"valid_targets_mean": 2492.9,
"valid_targets_min": 387
},
{
"epoch": 4.011566771819138,
"grad_norm": 0.4644782379013764,
"learning_rate": 1.8402328794945678e-05,
"loss": 0.0965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08901005983352661,
"step": 3815,
"valid_targets_mean": 2709.0,
"valid_targets_min": 549
},
{
"epoch": 4.016824395373291,
"grad_norm": 0.47504418703541157,
"learning_rate": 1.8350063394039352e-05,
"loss": 0.1018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08746888488531113,
"step": 3820,
"valid_targets_mean": 2359.4,
"valid_targets_min": 858
},
{
"epoch": 4.022082018927445,
"grad_norm": 0.5237048900291029,
"learning_rate": 1.82978093356157e-05,
"loss": 0.0909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09657467901706696,
"step": 3825,
"valid_targets_mean": 2222.1,
"valid_targets_min": 622
},
{
"epoch": 4.027339642481598,
"grad_norm": 0.44291534970251967,
"learning_rate": 1.824556697889502e-05,
"loss": 0.0927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07914161682128906,
"step": 3830,
"valid_targets_mean": 2424.0,
"valid_targets_min": 703
},
{
"epoch": 4.032597266035752,
"grad_norm": 0.4992982667058541,
"learning_rate": 1.8193336683017197e-05,
"loss": 0.1016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09114516526460648,
"step": 3835,
"valid_targets_mean": 2408.9,
"valid_targets_min": 748
},
{
"epoch": 4.037854889589905,
"grad_norm": 0.5092828321740024,
"learning_rate": 1.8141118807039193e-05,
"loss": 0.0958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09602051973342896,
"step": 3840,
"valid_targets_mean": 2687.4,
"valid_targets_min": 869
},
{
"epoch": 4.043112513144059,
"grad_norm": 0.5215237366125056,
"learning_rate": 1.8088913709932582e-05,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12407802045345306,
"step": 3845,
"valid_targets_mean": 2487.4,
"valid_targets_min": 803
},
{
"epoch": 4.048370136698212,
"grad_norm": 0.4260836759080378,
"learning_rate": 1.8036721750581106e-05,
"loss": 0.099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09371296316385269,
"step": 3850,
"valid_targets_mean": 2907.2,
"valid_targets_min": 553
},
{
"epoch": 4.053627760252366,
"grad_norm": 0.3789795718044728,
"learning_rate": 1.7984543287778185e-05,
"loss": 0.0937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07781212031841278,
"step": 3855,
"valid_targets_mean": 3208.1,
"valid_targets_min": 696
},
{
"epoch": 4.058885383806519,
"grad_norm": 0.44988304525289946,
"learning_rate": 1.7932378680224443e-05,
"loss": 0.1012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0846400335431099,
"step": 3860,
"valid_targets_mean": 2850.8,
"valid_targets_min": 664
},
{
"epoch": 4.064143007360673,
"grad_norm": 0.44680963570420906,
"learning_rate": 1.7880228286525275e-05,
"loss": 0.0985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0894576907157898,
"step": 3865,
"valid_targets_mean": 2894.3,
"valid_targets_min": 750
},
{
"epoch": 4.069400630914826,
"grad_norm": 0.4095334570073506,
"learning_rate": 1.782809246518836e-05,
"loss": 0.0866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08346300572156906,
"step": 3870,
"valid_targets_mean": 2864.2,
"valid_targets_min": 964
},
{
"epoch": 4.0746582544689804,
"grad_norm": 0.6237447882734388,
"learning_rate": 1.7775971574621186e-05,
"loss": 0.0955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10113894939422607,
"step": 3875,
"valid_targets_mean": 1858.5,
"valid_targets_min": 767
},
{
"epoch": 4.079915878023134,
"grad_norm": 0.5526198430574176,
"learning_rate": 1.772386597312861e-05,
"loss": 0.0986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09907979518175125,
"step": 3880,
"valid_targets_mean": 1944.2,
"valid_targets_min": 582
},
{
"epoch": 4.085173501577287,
"grad_norm": 0.49989094353990815,
"learning_rate": 1.7671776018910397e-05,
"loss": 0.0955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08454187959432602,
"step": 3885,
"valid_targets_mean": 2620.6,
"valid_targets_min": 1216
},
{
"epoch": 4.090431125131441,
"grad_norm": 0.5384845374319656,
"learning_rate": 1.761970207005871e-05,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09822037816047668,
"step": 3890,
"valid_targets_mean": 1812.9,
"valid_targets_min": 702
},
{
"epoch": 4.095688748685594,
"grad_norm": 0.4751345331625872,
"learning_rate": 1.756764448455572e-05,
"loss": 0.1067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0786370187997818,
"step": 3895,
"valid_targets_mean": 2295.7,
"valid_targets_min": 595
},
{
"epoch": 4.100946372239748,
"grad_norm": 0.6069871024504523,
"learning_rate": 1.7515603620271087e-05,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09270045906305313,
"step": 3900,
"valid_targets_mean": 1902.6,
"valid_targets_min": 783
},
{
"epoch": 4.106203995793901,
"grad_norm": 0.5105586805216777,
"learning_rate": 1.7463579834959525e-05,
"loss": 0.0924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09300537407398224,
"step": 3905,
"valid_targets_mean": 2262.1,
"valid_targets_min": 560
},
{
"epoch": 4.111461619348055,
"grad_norm": 0.4925420404959546,
"learning_rate": 1.7411573486258343e-05,
"loss": 0.1021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10601294785737991,
"step": 3910,
"valid_targets_mean": 2308.6,
"valid_targets_min": 859
},
{
"epoch": 4.116719242902208,
"grad_norm": 0.4891125312268697,
"learning_rate": 1.735958493168498e-05,
"loss": 0.1023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09458284080028534,
"step": 3915,
"valid_targets_mean": 2694.0,
"valid_targets_min": 614
},
{
"epoch": 4.121976866456362,
"grad_norm": 0.5567899507243081,
"learning_rate": 1.730761452863454e-05,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12221285700798035,
"step": 3920,
"valid_targets_mean": 1939.8,
"valid_targets_min": 488
},
{
"epoch": 4.127234490010515,
"grad_norm": 0.5429337348501369,
"learning_rate": 1.7255662634377365e-05,
"loss": 0.0988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08848828077316284,
"step": 3925,
"valid_targets_mean": 2168.9,
"valid_targets_min": 665
},
{
"epoch": 4.132492113564669,
"grad_norm": 0.43123482551876086,
"learning_rate": 1.720372960605654e-05,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07387609779834747,
"step": 3930,
"valid_targets_mean": 2426.4,
"valid_targets_min": 682
},
{
"epoch": 4.137749737118822,
"grad_norm": 0.525743802866739,
"learning_rate": 1.715181580068546e-05,
"loss": 0.1042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09564240276813507,
"step": 3935,
"valid_targets_mean": 2123.9,
"valid_targets_min": 741
},
{
"epoch": 4.143007360672976,
"grad_norm": 0.5431857482684502,
"learning_rate": 1.7099921575145372e-05,
"loss": 0.0859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09785217046737671,
"step": 3940,
"valid_targets_mean": 1977.2,
"valid_targets_min": 880
},
{
"epoch": 4.148264984227129,
"grad_norm": 0.4815253009344995,
"learning_rate": 1.7048047286182945e-05,
"loss": 0.1,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08684001863002777,
"step": 3945,
"valid_targets_mean": 2468.2,
"valid_targets_min": 799
},
{
"epoch": 4.153522607781283,
"grad_norm": 0.48070976206339466,
"learning_rate": 1.6996193290407742e-05,
"loss": 0.1088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11913721263408661,
"step": 3950,
"valid_targets_mean": 2623.4,
"valid_targets_min": 801
},
{
"epoch": 4.158780231335436,
"grad_norm": 0.5051148971559885,
"learning_rate": 1.694435994428987e-05,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09588249027729034,
"step": 3955,
"valid_targets_mean": 2178.3,
"valid_targets_min": 800
},
{
"epoch": 4.16403785488959,
"grad_norm": 0.493804524200127,
"learning_rate": 1.6892547604157464e-05,
"loss": 0.111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10550133883953094,
"step": 3960,
"valid_targets_mean": 2407.4,
"valid_targets_min": 609
},
{
"epoch": 4.169295478443743,
"grad_norm": 0.43098992206363373,
"learning_rate": 1.6840756626194242e-05,
"loss": 0.0995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0775129646062851,
"step": 3965,
"valid_targets_mean": 2808.8,
"valid_targets_min": 698
},
{
"epoch": 4.174553101997897,
"grad_norm": 0.4819574493905566,
"learning_rate": 1.678898736643708e-05,
"loss": 0.0974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08578978478908539,
"step": 3970,
"valid_targets_mean": 2649.3,
"valid_targets_min": 724
},
{
"epoch": 4.17981072555205,
"grad_norm": 0.4841531800469526,
"learning_rate": 1.6737240180773554e-05,
"loss": 0.0977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08698216080665588,
"step": 3975,
"valid_targets_mean": 2274.5,
"valid_targets_min": 661
},
{
"epoch": 4.185068349106204,
"grad_norm": 0.5473968284202807,
"learning_rate": 1.6685515424939478e-05,
"loss": 0.0892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09150893986225128,
"step": 3980,
"valid_targets_mean": 2240.1,
"valid_targets_min": 758
},
{
"epoch": 4.190325972660357,
"grad_norm": 0.5372511554955457,
"learning_rate": 1.6633813454516486e-05,
"loss": 0.105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10967753827571869,
"step": 3985,
"valid_targets_mean": 2407.5,
"valid_targets_min": 627
},
{
"epoch": 4.195583596214511,
"grad_norm": 0.461537896217363,
"learning_rate": 1.658213462492957e-05,
"loss": 0.105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09982563555240631,
"step": 3990,
"valid_targets_mean": 2724.3,
"valid_targets_min": 960
},
{
"epoch": 4.200841219768664,
"grad_norm": 0.5682378401486455,
"learning_rate": 1.6530479291444636e-05,
"loss": 0.102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0959588885307312,
"step": 3995,
"valid_targets_mean": 2118.4,
"valid_targets_min": 959
},
{
"epoch": 4.206098843322818,
"grad_norm": 0.4371959088072071,
"learning_rate": 1.6478847809166066e-05,
"loss": 0.1001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1117955818772316,
"step": 4000,
"valid_targets_mean": 3041.2,
"valid_targets_min": 898
},
{
"epoch": 4.211356466876971,
"grad_norm": 0.5673584626737319,
"learning_rate": 1.64272405330343e-05,
"loss": 0.0971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0908890813589096,
"step": 4005,
"valid_targets_mean": 1950.1,
"valid_targets_min": 722
},
{
"epoch": 4.216614090431126,
"grad_norm": 0.5389092021279812,
"learning_rate": 1.6375657817823323e-05,
"loss": 0.0883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10546024143695831,
"step": 4010,
"valid_targets_mean": 2117.4,
"valid_targets_min": 596
},
{
"epoch": 4.221871713985279,
"grad_norm": 0.5328521389983714,
"learning_rate": 1.6324100018138328e-05,
"loss": 0.1075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10617490112781525,
"step": 4015,
"valid_targets_mean": 2236.5,
"valid_targets_min": 754
},
{
"epoch": 4.2271293375394325,
"grad_norm": 0.463545730273827,
"learning_rate": 1.6272567488413204e-05,
"loss": 0.0966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08383120596408844,
"step": 4020,
"valid_targets_mean": 2362.3,
"valid_targets_min": 687
},
{
"epoch": 4.232386961093586,
"grad_norm": 0.5419587665952631,
"learning_rate": 1.6221060582908115e-05,
"loss": 0.0959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1114029735326767,
"step": 4025,
"valid_targets_mean": 2000.4,
"valid_targets_min": 634
},
{
"epoch": 4.2376445846477395,
"grad_norm": 0.5337355493878079,
"learning_rate": 1.616957965570708e-05,
"loss": 0.0967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09510698914527893,
"step": 4030,
"valid_targets_mean": 2540.3,
"valid_targets_min": 682
},
{
"epoch": 4.242902208201893,
"grad_norm": 0.5131807310811538,
"learning_rate": 1.6118125060715534e-05,
"loss": 0.0963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09756757318973541,
"step": 4035,
"valid_targets_mean": 2316.0,
"valid_targets_min": 516
},
{
"epoch": 4.2481598317560465,
"grad_norm": 0.5842890128017805,
"learning_rate": 1.6066697151657876e-05,
"loss": 0.1032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09377151727676392,
"step": 4040,
"valid_targets_mean": 2363.4,
"valid_targets_min": 1057
},
{
"epoch": 4.2534174553102,
"grad_norm": 0.6029635584302082,
"learning_rate": 1.601529628207508e-05,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11593151837587357,
"step": 4045,
"valid_targets_mean": 2001.6,
"valid_targets_min": 790
},
{
"epoch": 4.2586750788643535,
"grad_norm": 0.5075833178292704,
"learning_rate": 1.5963922805322204e-05,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09981006383895874,
"step": 4050,
"valid_targets_mean": 2532.9,
"valid_targets_min": 663
},
{
"epoch": 4.263932702418507,
"grad_norm": 0.4780454372959979,
"learning_rate": 1.5912577074566016e-05,
"loss": 0.0963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08640825003385544,
"step": 4055,
"valid_targets_mean": 2389.4,
"valid_targets_min": 645
},
{
"epoch": 4.2691903259726605,
"grad_norm": 0.5313076838607088,
"learning_rate": 1.5861259442782548e-05,
"loss": 0.0955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09783901274204254,
"step": 4060,
"valid_targets_mean": 2114.4,
"valid_targets_min": 693
},
{
"epoch": 4.274447949526814,
"grad_norm": 0.616517654658599,
"learning_rate": 1.580997026275464e-05,
"loss": 0.1088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1255756914615631,
"step": 4065,
"valid_targets_mean": 1939.2,
"valid_targets_min": 605
},
{
"epoch": 4.279705573080967,
"grad_norm": 0.45481917819591744,
"learning_rate": 1.5758709887069562e-05,
"loss": 0.0951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.080144502222538,
"step": 4070,
"valid_targets_mean": 2460.1,
"valid_targets_min": 936
},
{
"epoch": 4.284963196635121,
"grad_norm": 0.4352522444525687,
"learning_rate": 1.570747866811658e-05,
"loss": 0.094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08977779000997543,
"step": 4075,
"valid_targets_mean": 2534.4,
"valid_targets_min": 712
},
{
"epoch": 4.290220820189274,
"grad_norm": 0.43320224167988264,
"learning_rate": 1.5656276958084478e-05,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08739292621612549,
"step": 4080,
"valid_targets_mean": 2557.2,
"valid_targets_min": 878
},
{
"epoch": 4.295478443743428,
"grad_norm": 0.5187587814445953,
"learning_rate": 1.560510510895923e-05,
"loss": 0.1034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09790067374706268,
"step": 4085,
"valid_targets_mean": 2257.9,
"valid_targets_min": 689
},
{
"epoch": 4.300736067297581,
"grad_norm": 0.5612092057810208,
"learning_rate": 1.5553963472521506e-05,
"loss": 0.0962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1016916036605835,
"step": 4090,
"valid_targets_mean": 3216.2,
"valid_targets_min": 789
},
{
"epoch": 4.305993690851735,
"grad_norm": 0.4754144964970902,
"learning_rate": 1.5502852400344277e-05,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09235286712646484,
"step": 4095,
"valid_targets_mean": 2406.9,
"valid_targets_min": 792
},
{
"epoch": 4.311251314405888,
"grad_norm": 0.49831080617356127,
"learning_rate": 1.545177224379041e-05,
"loss": 0.0951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08789409697055817,
"step": 4100,
"valid_targets_mean": 2592.8,
"valid_targets_min": 692
},
{
"epoch": 4.316508937960042,
"grad_norm": 0.4729401427746108,
"learning_rate": 1.5400723354010244e-05,
"loss": 0.0966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09665529429912567,
"step": 4105,
"valid_targets_mean": 2757.2,
"valid_targets_min": 720
},
{
"epoch": 4.321766561514195,
"grad_norm": 0.49450294184793975,
"learning_rate": 1.5349706081939158e-05,
"loss": 0.1032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08979354798793793,
"step": 4110,
"valid_targets_mean": 2533.6,
"valid_targets_min": 806
},
{
"epoch": 4.327024185068349,
"grad_norm": 0.5755840128164587,
"learning_rate": 1.5298720778295195e-05,
"loss": 0.1043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10626491159200668,
"step": 4115,
"valid_targets_mean": 1994.1,
"valid_targets_min": 849
},
{
"epoch": 4.332281808622502,
"grad_norm": 0.42348822727191493,
"learning_rate": 1.5247767793576625e-05,
"loss": 0.0946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07282793521881104,
"step": 4120,
"valid_targets_mean": 2663.2,
"valid_targets_min": 539
},
{
"epoch": 4.337539432176656,
"grad_norm": 0.45936948713447534,
"learning_rate": 1.519684747805953e-05,
"loss": 0.091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09010601788759232,
"step": 4125,
"valid_targets_mean": 2681.1,
"valid_targets_min": 733
},
{
"epoch": 4.342797055730809,
"grad_norm": 0.5401190328293503,
"learning_rate": 1.5145960181795421e-05,
"loss": 0.1095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12450847029685974,
"step": 4130,
"valid_targets_mean": 2306.4,
"valid_targets_min": 572
},
{
"epoch": 4.348054679284963,
"grad_norm": 0.4739107220500607,
"learning_rate": 1.509510625460883e-05,
"loss": 0.1014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1023867130279541,
"step": 4135,
"valid_targets_mean": 2806.1,
"valid_targets_min": 727
},
{
"epoch": 4.353312302839116,
"grad_norm": 0.5793612653952754,
"learning_rate": 1.5044286046094851e-05,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10863249003887177,
"step": 4140,
"valid_targets_mean": 2103.9,
"valid_targets_min": 502
},
{
"epoch": 4.358569926393271,
"grad_norm": 0.7763733995462617,
"learning_rate": 1.4993499905616823e-05,
"loss": 0.1004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12005244195461273,
"step": 4145,
"valid_targets_mean": 1644.9,
"valid_targets_min": 743
},
{
"epoch": 4.363827549947424,
"grad_norm": 0.5256860719791939,
"learning_rate": 1.494274818230387e-05,
"loss": 0.1039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09499655663967133,
"step": 4150,
"valid_targets_mean": 2255.0,
"valid_targets_min": 669
},
{
"epoch": 4.369085173501578,
"grad_norm": 0.47678584994963846,
"learning_rate": 1.4892031225048503e-05,
"loss": 0.0971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08429034054279327,
"step": 4155,
"valid_targets_mean": 2325.4,
"valid_targets_min": 650
},
{
"epoch": 4.374342797055731,
"grad_norm": 0.5113954318002024,
"learning_rate": 1.4841349382504247e-05,
"loss": 0.0937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09738793224096298,
"step": 4160,
"valid_targets_mean": 2161.3,
"valid_targets_min": 393
},
{
"epoch": 4.379600420609885,
"grad_norm": 0.4722305024786219,
"learning_rate": 1.4790703003083236e-05,
"loss": 0.0914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09080841392278671,
"step": 4165,
"valid_targets_mean": 2437.1,
"valid_targets_min": 841
},
{
"epoch": 4.384858044164038,
"grad_norm": 0.6859379915481925,
"learning_rate": 1.4740092434953793e-05,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10347820073366165,
"step": 4170,
"valid_targets_mean": 2084.9,
"valid_targets_min": 771
},
{
"epoch": 4.390115667718192,
"grad_norm": 0.5067080772057561,
"learning_rate": 1.4689518026038065e-05,
"loss": 0.0978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10102088004350662,
"step": 4175,
"valid_targets_mean": 2800.9,
"valid_targets_min": 636
},
{
"epoch": 4.395373291272345,
"grad_norm": 0.508213874596892,
"learning_rate": 1.4638980124009649e-05,
"loss": 0.0918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08990977704524994,
"step": 4180,
"valid_targets_mean": 2340.9,
"valid_targets_min": 827
},
{
"epoch": 4.400630914826499,
"grad_norm": 0.5761988282887481,
"learning_rate": 1.458847907629113e-05,
"loss": 0.089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10000157356262207,
"step": 4185,
"valid_targets_mean": 1966.2,
"valid_targets_min": 893
},
{
"epoch": 4.405888538380652,
"grad_norm": 0.530262461172536,
"learning_rate": 1.4538015230051761e-05,
"loss": 0.1023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12000936269760132,
"step": 4190,
"valid_targets_mean": 2091.3,
"valid_targets_min": 909
},
{
"epoch": 4.411146161934806,
"grad_norm": 0.5220984813977081,
"learning_rate": 1.4487588932205072e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09813818335533142,
"step": 4195,
"valid_targets_mean": 2626.4,
"valid_targets_min": 920
},
{
"epoch": 4.416403785488959,
"grad_norm": 0.5116144008783395,
"learning_rate": 1.4437200529406425e-05,
"loss": 0.0926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10012590885162354,
"step": 4200,
"valid_targets_mean": 2199.6,
"valid_targets_min": 531
},
{
"epoch": 4.421661409043113,
"grad_norm": 0.4151629623128838,
"learning_rate": 1.4386850368050706e-05,
"loss": 0.0952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08200868964195251,
"step": 4205,
"valid_targets_mean": 2937.8,
"valid_targets_min": 832
},
{
"epoch": 4.426919032597266,
"grad_norm": 0.48864312129435655,
"learning_rate": 1.433653879426991e-05,
"loss": 0.0972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09346634149551392,
"step": 4210,
"valid_targets_mean": 2246.5,
"valid_targets_min": 789
},
{
"epoch": 4.4321766561514195,
"grad_norm": 0.4359286527388814,
"learning_rate": 1.4286266153930733e-05,
"loss": 0.0915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0775316059589386,
"step": 4215,
"valid_targets_mean": 2769.1,
"valid_targets_min": 734
},
{
"epoch": 4.437434279705573,
"grad_norm": 0.4927731730684629,
"learning_rate": 1.4236032792632251e-05,
"loss": 0.1025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08639310300350189,
"step": 4220,
"valid_targets_mean": 2197.0,
"valid_targets_min": 845
},
{
"epoch": 4.4426919032597265,
"grad_norm": 0.5686740593088553,
"learning_rate": 1.4185839055703511e-05,
"loss": 0.1134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1238737627863884,
"step": 4225,
"valid_targets_mean": 2144.8,
"valid_targets_min": 667
},
{
"epoch": 4.44794952681388,
"grad_norm": 0.602433185219975,
"learning_rate": 1.4135685288201151e-05,
"loss": 0.108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14720064401626587,
"step": 4230,
"valid_targets_mean": 2214.4,
"valid_targets_min": 824
},
{
"epoch": 4.4532071503680335,
"grad_norm": 0.5078558911585165,
"learning_rate": 1.4085571834907046e-05,
"loss": 0.0929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08777768909931183,
"step": 4235,
"valid_targets_mean": 2221.4,
"valid_targets_min": 592
},
{
"epoch": 4.458464773922187,
"grad_norm": 0.6091488215881007,
"learning_rate": 1.4035499040325946e-05,
"loss": 0.1155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11326266825199127,
"step": 4240,
"valid_targets_mean": 1869.6,
"valid_targets_min": 654
},
{
"epoch": 4.4637223974763405,
"grad_norm": 0.43754366834226255,
"learning_rate": 1.3985467248683064e-05,
"loss": 0.0951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07875297963619232,
"step": 4245,
"valid_targets_mean": 2371.3,
"valid_targets_min": 447
},
{
"epoch": 4.468980021030494,
"grad_norm": 0.49752868663224764,
"learning_rate": 1.3935476803921755e-05,
"loss": 0.0921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09022815525531769,
"step": 4250,
"valid_targets_mean": 2247.9,
"valid_targets_min": 525
},
{
"epoch": 4.4742376445846475,
"grad_norm": 0.5101025547005126,
"learning_rate": 1.3885528049701148e-05,
"loss": 0.0909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0945524126291275,
"step": 4255,
"valid_targets_mean": 2284.1,
"valid_targets_min": 705
},
{
"epoch": 4.479495268138801,
"grad_norm": 0.5205417490514214,
"learning_rate": 1.3835621329393738e-05,
"loss": 0.1016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09605126082897186,
"step": 4260,
"valid_targets_mean": 2261.2,
"valid_targets_min": 743
},
{
"epoch": 4.484752891692954,
"grad_norm": 0.4995622499375302,
"learning_rate": 1.3785756986083091e-05,
"loss": 0.0991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1203717291355133,
"step": 4265,
"valid_targets_mean": 2634.0,
"valid_targets_min": 766
},
{
"epoch": 4.490010515247108,
"grad_norm": 0.4886965157495099,
"learning_rate": 1.3735935362561419e-05,
"loss": 0.101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08887738734483719,
"step": 4270,
"valid_targets_mean": 2382.4,
"valid_targets_min": 934
},
{
"epoch": 4.495268138801261,
"grad_norm": 0.6108096582337215,
"learning_rate": 1.3686156801327293e-05,
"loss": 0.0973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08554866909980774,
"step": 4275,
"valid_targets_mean": 2037.9,
"valid_targets_min": 686
},
{
"epoch": 4.500525762355416,
"grad_norm": 0.5246026819941239,
"learning_rate": 1.3636421644583231e-05,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09727829694747925,
"step": 4280,
"valid_targets_mean": 2043.1,
"valid_targets_min": 677
},
{
"epoch": 4.505783385909568,
"grad_norm": 0.4802104884520141,
"learning_rate": 1.3586730234233367e-05,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09578914940357208,
"step": 4285,
"valid_targets_mean": 2729.4,
"valid_targets_min": 856
},
{
"epoch": 4.511041009463723,
"grad_norm": 0.44914677466539615,
"learning_rate": 1.3537082911881106e-05,
"loss": 0.0984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09804667532444,
"step": 4290,
"valid_targets_mean": 2962.4,
"valid_targets_min": 836
},
{
"epoch": 4.516298633017876,
"grad_norm": 0.43893972534711506,
"learning_rate": 1.3487480018826772e-05,
"loss": 0.109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07683141529560089,
"step": 4295,
"valid_targets_mean": 2627.2,
"valid_targets_min": 707
},
{
"epoch": 4.52155625657203,
"grad_norm": 0.47447041458999534,
"learning_rate": 1.343792189606525e-05,
"loss": 0.1029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10103709995746613,
"step": 4300,
"valid_targets_mean": 2409.9,
"valid_targets_min": 762
},
{
"epoch": 4.526813880126183,
"grad_norm": 0.5907813961137309,
"learning_rate": 1.338840888428366e-05,
"loss": 0.1024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1014014482498169,
"step": 4305,
"valid_targets_mean": 1969.4,
"valid_targets_min": 678
},
{
"epoch": 4.532071503680337,
"grad_norm": 0.5486562924204613,
"learning_rate": 1.3338941323859023e-05,
"loss": 0.1006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11533983051776886,
"step": 4310,
"valid_targets_mean": 2122.3,
"valid_targets_min": 632
},
{
"epoch": 4.53732912723449,
"grad_norm": 0.5863172986758325,
"learning_rate": 1.3289519554855858e-05,
"loss": 0.1021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10254557430744171,
"step": 4315,
"valid_targets_mean": 1766.0,
"valid_targets_min": 658
},
{
"epoch": 4.542586750788644,
"grad_norm": 0.5278985712409593,
"learning_rate": 1.3240143917023938e-05,
"loss": 0.0995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10159458965063095,
"step": 4320,
"valid_targets_mean": 2394.6,
"valid_targets_min": 613
},
{
"epoch": 4.547844374342797,
"grad_norm": 0.4774054068903969,
"learning_rate": 1.3190814749795893e-05,
"loss": 0.098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07897340506315231,
"step": 4325,
"valid_targets_mean": 2894.0,
"valid_targets_min": 950
},
{
"epoch": 4.553101997896951,
"grad_norm": 0.5168737209139629,
"learning_rate": 1.3141532392284873e-05,
"loss": 0.1011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08843906968832016,
"step": 4330,
"valid_targets_mean": 2335.8,
"valid_targets_min": 853
},
{
"epoch": 4.558359621451104,
"grad_norm": 0.39551277982685173,
"learning_rate": 1.3092297183282261e-05,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07138287276029587,
"step": 4335,
"valid_targets_mean": 2725.4,
"valid_targets_min": 786
},
{
"epoch": 4.563617245005258,
"grad_norm": 0.5548480950101169,
"learning_rate": 1.3043109461255305e-05,
"loss": 0.1025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11713875830173492,
"step": 4340,
"valid_targets_mean": 2078.0,
"valid_targets_min": 616
},
{
"epoch": 4.568874868559411,
"grad_norm": 0.4924603270925254,
"learning_rate": 1.29939695643448e-05,
"loss": 0.0993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08613575249910355,
"step": 4345,
"valid_targets_mean": 2753.4,
"valid_targets_min": 676
},
{
"epoch": 4.574132492113565,
"grad_norm": 0.49169377368919964,
"learning_rate": 1.2944877830362777e-05,
"loss": 0.0968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09385289996862411,
"step": 4350,
"valid_targets_mean": 2377.4,
"valid_targets_min": 718
},
{
"epoch": 4.579390115667718,
"grad_norm": 0.575683120788377,
"learning_rate": 1.289583459679017e-05,
"loss": 0.0974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11349628120660782,
"step": 4355,
"valid_targets_mean": 1961.9,
"valid_targets_min": 710
},
{
"epoch": 4.584647739221872,
"grad_norm": 0.4434783535916279,
"learning_rate": 1.2846840200774484e-05,
"loss": 0.0897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0868612676858902,
"step": 4360,
"valid_targets_mean": 2524.8,
"valid_targets_min": 492
},
{
"epoch": 4.589905362776025,
"grad_norm": 0.6382905408653129,
"learning_rate": 1.2797894979127503e-05,
"loss": 0.0992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10802309215068817,
"step": 4365,
"valid_targets_mean": 1759.8,
"valid_targets_min": 743
},
{
"epoch": 4.595162986330179,
"grad_norm": 0.5247670703693159,
"learning_rate": 1.2748999268322977e-05,
"loss": 0.0964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09265201538801193,
"step": 4370,
"valid_targets_mean": 2041.3,
"valid_targets_min": 669
},
{
"epoch": 4.600420609884332,
"grad_norm": 0.47283527268539327,
"learning_rate": 1.2700153404494247e-05,
"loss": 0.1048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08191613852977753,
"step": 4375,
"valid_targets_mean": 2473.2,
"valid_targets_min": 655
},
{
"epoch": 4.605678233438486,
"grad_norm": 0.48593794565176385,
"learning_rate": 1.2651357723432027e-05,
"loss": 0.1112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10152431577444077,
"step": 4380,
"valid_targets_mean": 2557.3,
"valid_targets_min": 574
},
{
"epoch": 4.610935856992639,
"grad_norm": 0.4397832835251465,
"learning_rate": 1.2602612560582044e-05,
"loss": 0.0903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08215966075658798,
"step": 4385,
"valid_targets_mean": 2609.4,
"valid_targets_min": 890
},
{
"epoch": 4.616193480546793,
"grad_norm": 0.4947320130064308,
"learning_rate": 1.2553918251042701e-05,
"loss": 0.1011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10161542892456055,
"step": 4390,
"valid_targets_mean": 2460.9,
"valid_targets_min": 627
},
{
"epoch": 4.621451104100946,
"grad_norm": 0.5695165526751769,
"learning_rate": 1.2505275129562851e-05,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14086773991584778,
"step": 4395,
"valid_targets_mean": 2030.6,
"valid_targets_min": 711
},
{
"epoch": 4.6267087276550996,
"grad_norm": 0.5650381504945126,
"learning_rate": 1.2456683530539446e-05,
"loss": 0.096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1077423244714737,
"step": 4400,
"valid_targets_mean": 2253.3,
"valid_targets_min": 722
},
{
"epoch": 4.631966351209253,
"grad_norm": 0.5170946354420293,
"learning_rate": 1.2408143788015225e-05,
"loss": 0.0991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09927581995725632,
"step": 4405,
"valid_targets_mean": 2233.8,
"valid_targets_min": 754
},
{
"epoch": 4.6372239747634065,
"grad_norm": 0.5234400667762248,
"learning_rate": 1.2359656235676468e-05,
"loss": 0.1032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10893240571022034,
"step": 4410,
"valid_targets_mean": 2456.2,
"valid_targets_min": 892
},
{
"epoch": 4.642481598317561,
"grad_norm": 0.44412533521629255,
"learning_rate": 1.231122120685066e-05,
"loss": 0.1054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09738484770059586,
"step": 4415,
"valid_targets_mean": 2819.4,
"valid_targets_min": 775
},
{
"epoch": 4.6477392218717135,
"grad_norm": 0.5434749885366846,
"learning_rate": 1.2262839034504208e-05,
"loss": 0.1113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10426691174507141,
"step": 4420,
"valid_targets_mean": 2262.4,
"valid_targets_min": 647
},
{
"epoch": 4.652996845425868,
"grad_norm": 0.48253506122661793,
"learning_rate": 1.2214510051240164e-05,
"loss": 0.0891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08545523136854172,
"step": 4425,
"valid_targets_mean": 2235.4,
"valid_targets_min": 685
},
{
"epoch": 4.658254468980021,
"grad_norm": 0.4527197792427856,
"learning_rate": 1.2166234589295951e-05,
"loss": 0.0883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07737896591424942,
"step": 4430,
"valid_targets_mean": 2266.4,
"valid_targets_min": 518
},
{
"epoch": 4.663512092534175,
"grad_norm": 0.4998494823076504,
"learning_rate": 1.2118012980541013e-05,
"loss": 0.0984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09616045653820038,
"step": 4435,
"valid_targets_mean": 2290.9,
"valid_targets_min": 851
},
{
"epoch": 4.668769716088328,
"grad_norm": 0.4230991236137391,
"learning_rate": 1.2069845556474626e-05,
"loss": 0.0878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07516521215438843,
"step": 4440,
"valid_targets_mean": 2595.4,
"valid_targets_min": 814
},
{
"epoch": 4.674027339642482,
"grad_norm": 0.590037819654043,
"learning_rate": 1.2021732648223553e-05,
"loss": 0.097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11608242988586426,
"step": 4445,
"valid_targets_mean": 2037.6,
"valid_targets_min": 847
},
{
"epoch": 4.679284963196635,
"grad_norm": 0.43915378094587154,
"learning_rate": 1.1973674586539791e-05,
"loss": 0.1031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09132928401231766,
"step": 4450,
"valid_targets_mean": 2833.8,
"valid_targets_min": 607
},
{
"epoch": 4.684542586750789,
"grad_norm": 0.5710654884244168,
"learning_rate": 1.1925671701798292e-05,
"loss": 0.0929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09262624382972717,
"step": 4455,
"valid_targets_mean": 2008.8,
"valid_targets_min": 591
},
{
"epoch": 4.689800210304942,
"grad_norm": 0.7331837361388599,
"learning_rate": 1.1877724323994704e-05,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10521057993173599,
"step": 4460,
"valid_targets_mean": 2348.8,
"valid_targets_min": 887
},
{
"epoch": 4.695057833859096,
"grad_norm": 0.4043023336963058,
"learning_rate": 1.1829832782743074e-05,
"loss": 0.1053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09723056852817535,
"step": 4465,
"valid_targets_mean": 3220.9,
"valid_targets_min": 1144
},
{
"epoch": 4.700315457413249,
"grad_norm": 0.3896949449984179,
"learning_rate": 1.178199740727362e-05,
"loss": 0.1016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08350640535354614,
"step": 4470,
"valid_targets_mean": 3009.9,
"valid_targets_min": 739
},
{
"epoch": 4.705573080967403,
"grad_norm": 0.521490395157194,
"learning_rate": 1.1734218526430446e-05,
"loss": 0.0986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09911235421895981,
"step": 4475,
"valid_targets_mean": 2304.8,
"valid_targets_min": 542
},
{
"epoch": 4.710830704521556,
"grad_norm": 0.4813048717328619,
"learning_rate": 1.1686496468669269e-05,
"loss": 0.0948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08519215136766434,
"step": 4480,
"valid_targets_mean": 2401.8,
"valid_targets_min": 774
},
{
"epoch": 4.71608832807571,
"grad_norm": 0.5598112043799223,
"learning_rate": 1.1638831562055191e-05,
"loss": 0.1076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.090914286673069,
"step": 4485,
"valid_targets_mean": 1917.9,
"valid_targets_min": 363
},
{
"epoch": 4.721345951629863,
"grad_norm": 0.5246952916607143,
"learning_rate": 1.1591224134260425e-05,
"loss": 0.0947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09370351582765579,
"step": 4490,
"valid_targets_mean": 2400.6,
"valid_targets_min": 804
},
{
"epoch": 4.726603575184017,
"grad_norm": 0.6565003592691423,
"learning_rate": 1.1543674512562037e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12521179020404816,
"step": 4495,
"valid_targets_mean": 2023.5,
"valid_targets_min": 765
},
{
"epoch": 4.73186119873817,
"grad_norm": 0.5427757368927597,
"learning_rate": 1.1496183023839729e-05,
"loss": 0.0855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09612180292606354,
"step": 4500,
"valid_targets_mean": 1967.1,
"valid_targets_min": 647
},
{
"epoch": 4.737118822292324,
"grad_norm": 0.4508204549580782,
"learning_rate": 1.144874999457354e-05,
"loss": 0.0959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09256187081336975,
"step": 4505,
"valid_targets_mean": 2573.9,
"valid_targets_min": 943
},
{
"epoch": 4.742376445846477,
"grad_norm": 0.5049509144729405,
"learning_rate": 1.1401375750841637e-05,
"loss": 0.0975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08873606473207474,
"step": 4510,
"valid_targets_mean": 2558.1,
"valid_targets_min": 848
},
{
"epoch": 4.747634069400631,
"grad_norm": 0.49495600212397534,
"learning_rate": 1.1354060618318086e-05,
"loss": 0.1002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10050778836011887,
"step": 4515,
"valid_targets_mean": 2426.5,
"valid_targets_min": 797
},
{
"epoch": 4.752891692954784,
"grad_norm": 0.5114820141922032,
"learning_rate": 1.1306804922270568e-05,
"loss": 0.1166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0971759557723999,
"step": 4520,
"valid_targets_mean": 2566.6,
"valid_targets_min": 866
},
{
"epoch": 4.758149316508938,
"grad_norm": 0.632053912759659,
"learning_rate": 1.1259608987558175e-05,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12641634047031403,
"step": 4525,
"valid_targets_mean": 2165.0,
"valid_targets_min": 1042
},
{
"epoch": 4.763406940063091,
"grad_norm": 0.6407487997767939,
"learning_rate": 1.1212473138629187e-05,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.129093199968338,
"step": 4530,
"valid_targets_mean": 1567.3,
"valid_targets_min": 635
},
{
"epoch": 4.768664563617245,
"grad_norm": 0.4748727011114625,
"learning_rate": 1.1165397699518797e-05,
"loss": 0.091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09252180904150009,
"step": 4535,
"valid_targets_mean": 2456.8,
"valid_targets_min": 701
},
{
"epoch": 4.773922187171398,
"grad_norm": 0.4941751130576742,
"learning_rate": 1.1118382993846933e-05,
"loss": 0.1042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11116250604391098,
"step": 4540,
"valid_targets_mean": 2394.6,
"valid_targets_min": 626
},
{
"epoch": 4.779179810725552,
"grad_norm": 0.5299027801957493,
"learning_rate": 1.1071429344816003e-05,
"loss": 0.0986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09701026976108551,
"step": 4545,
"valid_targets_mean": 2138.4,
"valid_targets_min": 856
},
{
"epoch": 4.784437434279706,
"grad_norm": 0.5129425286831147,
"learning_rate": 1.102453707520867e-05,
"loss": 0.0972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10163642466068268,
"step": 4550,
"valid_targets_mean": 2204.8,
"valid_targets_min": 770
},
{
"epoch": 4.789695057833859,
"grad_norm": 0.5508142859981414,
"learning_rate": 1.0977706507385673e-05,
"loss": 0.1114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10404539108276367,
"step": 4555,
"valid_targets_mean": 2175.4,
"valid_targets_min": 697
},
{
"epoch": 4.794952681388013,
"grad_norm": 0.5433699061805612,
"learning_rate": 1.0930937963283554e-05,
"loss": 0.0977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09824663400650024,
"step": 4560,
"valid_targets_mean": 2136.2,
"valid_targets_min": 535
},
{
"epoch": 4.8002103049421665,
"grad_norm": 0.6953915966344411,
"learning_rate": 1.088423176441248e-05,
"loss": 0.1142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09402541816234589,
"step": 4565,
"valid_targets_mean": 2570.6,
"valid_targets_min": 559
},
{
"epoch": 4.80546792849632,
"grad_norm": 0.48242146139007297,
"learning_rate": 1.0837588231854044e-05,
"loss": 0.0851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09483704715967178,
"step": 4570,
"valid_targets_mean": 2460.8,
"valid_targets_min": 623
},
{
"epoch": 4.8107255520504735,
"grad_norm": 0.4896295169453218,
"learning_rate": 1.0791007686259019e-05,
"loss": 0.0928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1058853417634964,
"step": 4575,
"valid_targets_mean": 2419.6,
"valid_targets_min": 516
},
{
"epoch": 4.815983175604627,
"grad_norm": 0.5635275786108805,
"learning_rate": 1.0744490447845172e-05,
"loss": 0.0993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10014744102954865,
"step": 4580,
"valid_targets_mean": 2023.0,
"valid_targets_min": 926
},
{
"epoch": 4.8212407991587805,
"grad_norm": 0.5248809216777951,
"learning_rate": 1.0698036836395084e-05,
"loss": 0.1104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09372108429670334,
"step": 4585,
"valid_targets_mean": 2062.7,
"valid_targets_min": 657
},
{
"epoch": 4.826498422712934,
"grad_norm": 0.5282566214001109,
"learning_rate": 1.0651647171253936e-05,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10230812430381775,
"step": 4590,
"valid_targets_mean": 1986.8,
"valid_targets_min": 707
},
{
"epoch": 4.831756046267087,
"grad_norm": 0.4123856622268535,
"learning_rate": 1.0605321771327267e-05,
"loss": 0.0951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07696308195590973,
"step": 4595,
"valid_targets_mean": 3218.1,
"valid_targets_min": 692
},
{
"epoch": 4.837013669821241,
"grad_norm": 0.5238479603664691,
"learning_rate": 1.0559060955078873e-05,
"loss": 0.0932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10284964740276337,
"step": 4600,
"valid_targets_mean": 2373.4,
"valid_targets_min": 790
},
{
"epoch": 4.842271293375394,
"grad_norm": 0.468609075721786,
"learning_rate": 1.0512865040528558e-05,
"loss": 0.0891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08464796841144562,
"step": 4605,
"valid_targets_mean": 2436.6,
"valid_targets_min": 807
},
{
"epoch": 4.847528916929548,
"grad_norm": 0.48328852441064596,
"learning_rate": 1.0466734345249946e-05,
"loss": 0.0915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08199210464954376,
"step": 4610,
"valid_targets_mean": 2194.1,
"valid_targets_min": 744
},
{
"epoch": 4.852786540483701,
"grad_norm": 0.5354458073127093,
"learning_rate": 1.0420669186368311e-05,
"loss": 0.0906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09654032438993454,
"step": 4615,
"valid_targets_mean": 2015.8,
"valid_targets_min": 459
},
{
"epoch": 4.858044164037855,
"grad_norm": 0.5135883795451422,
"learning_rate": 1.0374669880558419e-05,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09381682425737381,
"step": 4620,
"valid_targets_mean": 2450.0,
"valid_targets_min": 534
},
{
"epoch": 4.863301787592008,
"grad_norm": 0.4235909671196331,
"learning_rate": 1.0328736744042311e-05,
"loss": 0.1017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08027419447898865,
"step": 4625,
"valid_targets_mean": 2799.8,
"valid_targets_min": 843
},
{
"epoch": 4.868559411146162,
"grad_norm": 0.4707831943602184,
"learning_rate": 1.0282870092587144e-05,
"loss": 0.087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08368093520402908,
"step": 4630,
"valid_targets_mean": 2812.9,
"valid_targets_min": 909
},
{
"epoch": 4.873817034700315,
"grad_norm": 0.5339909907011945,
"learning_rate": 1.023707024150305e-05,
"loss": 0.0962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11583643406629562,
"step": 4635,
"valid_targets_mean": 2287.1,
"valid_targets_min": 1052
},
{
"epoch": 4.879074658254469,
"grad_norm": 0.5085378577412311,
"learning_rate": 1.0191337505640905e-05,
"loss": 0.0914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1098240539431572,
"step": 4640,
"valid_targets_mean": 2549.8,
"valid_targets_min": 770
},
{
"epoch": 4.884332281808622,
"grad_norm": 0.45220409517830074,
"learning_rate": 1.0145672199390226e-05,
"loss": 0.1036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08148109912872314,
"step": 4645,
"valid_targets_mean": 2461.1,
"valid_targets_min": 533
},
{
"epoch": 4.889589905362776,
"grad_norm": 0.475515183709408,
"learning_rate": 1.010007463667699e-05,
"loss": 0.0903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10368898510932922,
"step": 4650,
"valid_targets_mean": 2331.8,
"valid_targets_min": 612
},
{
"epoch": 4.894847528916929,
"grad_norm": 0.5763158891821861,
"learning_rate": 1.0054545130961441e-05,
"loss": 0.0926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10566672682762146,
"step": 4655,
"valid_targets_mean": 1883.9,
"valid_targets_min": 812
},
{
"epoch": 4.900105152471083,
"grad_norm": 0.43104414608433417,
"learning_rate": 1.0009083995236009e-05,
"loss": 0.0961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08963556587696075,
"step": 4660,
"valid_targets_mean": 2955.2,
"valid_targets_min": 908
},
{
"epoch": 4.905362776025236,
"grad_norm": 0.5445275966774047,
"learning_rate": 9.963691542023079e-06,
"loss": 0.0991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09479817003011703,
"step": 4665,
"valid_targets_mean": 2277.8,
"valid_targets_min": 657
},
{
"epoch": 4.91062039957939,
"grad_norm": 0.5066367629312661,
"learning_rate": 9.918368083372884e-06,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09916972368955612,
"step": 4670,
"valid_targets_mean": 2247.6,
"valid_targets_min": 782
},
{
"epoch": 4.915878023133543,
"grad_norm": 0.4771781629319518,
"learning_rate": 9.87311393086138e-06,
"loss": 0.1065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09766573458909988,
"step": 4675,
"valid_targets_mean": 2661.2,
"valid_targets_min": 827
},
{
"epoch": 4.921135646687697,
"grad_norm": 0.47605099896765274,
"learning_rate": 9.827929395588048e-06,
"loss": 0.0934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10150592029094696,
"step": 4680,
"valid_targets_mean": 2232.2,
"valid_targets_min": 718
},
{
"epoch": 4.926393270241851,
"grad_norm": 0.5272252711411148,
"learning_rate": 9.782814788173787e-06,
"loss": 0.0947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09894594550132751,
"step": 4685,
"valid_targets_mean": 2163.0,
"valid_targets_min": 591
},
{
"epoch": 4.931650893796004,
"grad_norm": 0.6001334349524697,
"learning_rate": 9.737770418758808e-06,
"loss": 0.0969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09525749087333679,
"step": 4690,
"valid_targets_mean": 2034.4,
"valid_targets_min": 195
},
{
"epoch": 4.936908517350158,
"grad_norm": 0.5866759894690932,
"learning_rate": 9.692796597000438e-06,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1112414300441742,
"step": 4695,
"valid_targets_mean": 1976.1,
"valid_targets_min": 684
},
{
"epoch": 4.942166140904312,
"grad_norm": 0.49758985127375477,
"learning_rate": 9.64789363207103e-06,
"loss": 0.103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09018470346927643,
"step": 4700,
"valid_targets_mean": 2658.8,
"valid_targets_min": 516
},
{
"epoch": 4.947423764458465,
"grad_norm": 0.5459854002762042,
"learning_rate": 9.603061832655847e-06,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10367339849472046,
"step": 4705,
"valid_targets_mean": 2151.7,
"valid_targets_min": 531
},
{
"epoch": 4.952681388012619,
"grad_norm": 0.4026824037932101,
"learning_rate": 9.55830150695093e-06,
"loss": 0.0979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08115653693675995,
"step": 4710,
"valid_targets_mean": 2948.0,
"valid_targets_min": 551
},
{
"epoch": 4.957939011566772,
"grad_norm": 0.4550478327591578,
"learning_rate": 9.513612962660935e-06,
"loss": 0.0941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08574287593364716,
"step": 4715,
"valid_targets_mean": 2740.3,
"valid_targets_min": 989
},
{
"epoch": 4.963196635120926,
"grad_norm": 0.535463814722982,
"learning_rate": 9.468996506997093e-06,
"loss": 0.11,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11817488074302673,
"step": 4720,
"valid_targets_mean": 2331.6,
"valid_targets_min": 875
},
{
"epoch": 4.968454258675079,
"grad_norm": 0.5190460495882703,
"learning_rate": 9.424452446675059e-06,
"loss": 0.1078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10049982368946075,
"step": 4725,
"valid_targets_mean": 2304.6,
"valid_targets_min": 663
},
{
"epoch": 4.9737118822292326,
"grad_norm": 0.5604972050064392,
"learning_rate": 9.379981087912795e-06,
"loss": 0.1034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10879268497228622,
"step": 4730,
"valid_targets_mean": 1894.5,
"valid_targets_min": 843
},
{
"epoch": 4.978969505783386,
"grad_norm": 0.5413203799831996,
"learning_rate": 9.33558273642848e-06,
"loss": 0.0963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10227219015359879,
"step": 4735,
"valid_targets_mean": 1804.4,
"valid_targets_min": 647
},
{
"epoch": 4.9842271293375395,
"grad_norm": 0.6441356375017433,
"learning_rate": 9.291257697438393e-06,
"loss": 0.0976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09676170349121094,
"step": 4740,
"valid_targets_mean": 2362.1,
"valid_targets_min": 738
},
{
"epoch": 4.989484752891693,
"grad_norm": 0.5320775542310602,
"learning_rate": 9.247006275654861e-06,
"loss": 0.1033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.104653000831604,
"step": 4745,
"valid_targets_mean": 1971.3,
"valid_targets_min": 507
},
{
"epoch": 4.9947423764458465,
"grad_norm": 0.46856590894197625,
"learning_rate": 9.202828775284101e-06,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0959998071193695,
"step": 4750,
"valid_targets_mean": 2490.2,
"valid_targets_min": 659
},
{
"epoch": 5.0,
"grad_norm": 0.5952484924570117,
"learning_rate": 9.158725500024148e-06,
"loss": 0.1033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11373323947191238,
"step": 4755,
"valid_targets_mean": 1951.9,
"valid_targets_min": 609
},
{
"epoch": 5.0052576235541535,
"grad_norm": 0.4747881902688858,
"learning_rate": 9.114696753062816e-06,
"loss": 0.0872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09556099772453308,
"step": 4760,
"valid_targets_mean": 2731.6,
"valid_targets_min": 1102
},
{
"epoch": 5.010515247108307,
"grad_norm": 0.531060146381296,
"learning_rate": 9.07074283707554e-06,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09349146485328674,
"step": 4765,
"valid_targets_mean": 2682.4,
"valid_targets_min": 800
},
{
"epoch": 5.0157728706624605,
"grad_norm": 0.4803599014963528,
"learning_rate": 9.026864054223337e-06,
"loss": 0.0799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08033661544322968,
"step": 4770,
"valid_targets_mean": 3233.9,
"valid_targets_min": 780
},
{
"epoch": 5.021030494216614,
"grad_norm": 0.5738319263889354,
"learning_rate": 8.98306070615073e-06,
"loss": 0.0896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08915919065475464,
"step": 4775,
"valid_targets_mean": 2011.4,
"valid_targets_min": 492
},
{
"epoch": 5.0262881177707674,
"grad_norm": 0.43000492514648264,
"learning_rate": 8.93933309398368e-06,
"loss": 0.0742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07440449297428131,
"step": 4780,
"valid_targets_mean": 2776.8,
"valid_targets_min": 637
},
{
"epoch": 5.031545741324921,
"grad_norm": 0.5773281092892758,
"learning_rate": 8.89568151832745e-06,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10673081129789352,
"step": 4785,
"valid_targets_mean": 2185.7,
"valid_targets_min": 598
},
{
"epoch": 5.036803364879074,
"grad_norm": 0.551538874932054,
"learning_rate": 8.852106279264643e-06,
"loss": 0.0811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08478675782680511,
"step": 4790,
"valid_targets_mean": 2123.6,
"valid_targets_min": 535
},
{
"epoch": 5.042060988433228,
"grad_norm": 0.4960007141639336,
"learning_rate": 8.808607676353074e-06,
"loss": 0.084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07749012857675552,
"step": 4795,
"valid_targets_mean": 2246.9,
"valid_targets_min": 569
},
{
"epoch": 5.047318611987381,
"grad_norm": 0.5653349333593447,
"learning_rate": 8.765186008623706e-06,
"loss": 0.0842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08439381420612335,
"step": 4800,
"valid_targets_mean": 2139.5,
"valid_targets_min": 727
},
{
"epoch": 5.052576235541535,
"grad_norm": 0.556138225843227,
"learning_rate": 8.721841574578617e-06,
"loss": 0.087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0761680155992508,
"step": 4805,
"valid_targets_mean": 2112.2,
"valid_targets_min": 634
},
{
"epoch": 5.057833859095688,
"grad_norm": 0.5133626158390642,
"learning_rate": 8.678574672188963e-06,
"loss": 0.0784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07579199969768524,
"step": 4810,
"valid_targets_mean": 2167.1,
"valid_targets_min": 784
},
{
"epoch": 5.063091482649842,
"grad_norm": 0.5646934953364373,
"learning_rate": 8.635385598892881e-06,
"loss": 0.0952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09673206508159637,
"step": 4815,
"valid_targets_mean": 2140.2,
"valid_targets_min": 608
},
{
"epoch": 5.068349106203995,
"grad_norm": 0.5772485641334589,
"learning_rate": 8.592274651593482e-06,
"loss": 0.09,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07193920016288757,
"step": 4820,
"valid_targets_mean": 2546.4,
"valid_targets_min": 744
},
{
"epoch": 5.07360672975815,
"grad_norm": 0.5777837302827505,
"learning_rate": 8.549242126656814e-06,
"loss": 0.0856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0906825140118599,
"step": 4825,
"valid_targets_mean": 2081.2,
"valid_targets_min": 691
},
{
"epoch": 5.078864353312303,
"grad_norm": 0.5233064547260131,
"learning_rate": 8.506288319909793e-06,
"loss": 0.0867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08560320734977722,
"step": 4830,
"valid_targets_mean": 2432.2,
"valid_targets_min": 641
},
{
"epoch": 5.084121976866457,
"grad_norm": 0.6101615167011463,
"learning_rate": 8.463413526638186e-06,
"loss": 0.0829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.096367746591568,
"step": 4835,
"valid_targets_mean": 1844.6,
"valid_targets_min": 834
},
{
"epoch": 5.08937960042061,
"grad_norm": 0.42631376037572355,
"learning_rate": 8.420618041584604e-06,
"loss": 0.0903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07750090956687927,
"step": 4840,
"valid_targets_mean": 3060.9,
"valid_targets_min": 1204
},
{
"epoch": 5.094637223974764,
"grad_norm": 0.608597401551527,
"learning_rate": 8.377902158946427e-06,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11112530529499054,
"step": 4845,
"valid_targets_mean": 2162.4,
"valid_targets_min": 485
},
{
"epoch": 5.099894847528917,
"grad_norm": 0.6140835434362498,
"learning_rate": 8.335266172373832e-06,
"loss": 0.0815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08970272541046143,
"step": 4850,
"valid_targets_mean": 1963.8,
"valid_targets_min": 591
},
{
"epoch": 5.105152471083071,
"grad_norm": 0.4863633229657105,
"learning_rate": 8.292710374967737e-06,
"loss": 0.0873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07550916820764542,
"step": 4855,
"valid_targets_mean": 2228.6,
"valid_targets_min": 722
},
{
"epoch": 5.110410094637224,
"grad_norm": 0.5739706485973418,
"learning_rate": 8.250235059277792e-06,
"loss": 0.0891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10407744348049164,
"step": 4860,
"valid_targets_mean": 2238.4,
"valid_targets_min": 790
},
{
"epoch": 5.115667718191378,
"grad_norm": 0.514139216010886,
"learning_rate": 8.207840517300398e-06,
"loss": 0.0884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08347027748823166,
"step": 4865,
"valid_targets_mean": 2555.4,
"valid_targets_min": 548
},
{
"epoch": 5.120925341745531,
"grad_norm": 0.6394788603902261,
"learning_rate": 8.165527040476666e-06,
"loss": 0.09,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09309305250644684,
"step": 4870,
"valid_targets_mean": 1850.6,
"valid_targets_min": 649
},
{
"epoch": 5.126182965299685,
"grad_norm": 0.5033017445925095,
"learning_rate": 8.123294919690413e-06,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08884253352880478,
"step": 4875,
"valid_targets_mean": 2351.9,
"valid_targets_min": 925
},
{
"epoch": 5.131440588853838,
"grad_norm": 0.6211269811198701,
"learning_rate": 8.081144445266201e-06,
"loss": 0.0871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10970626026391983,
"step": 4880,
"valid_targets_mean": 1906.9,
"valid_targets_min": 818
},
{
"epoch": 5.136698212407992,
"grad_norm": 0.4707250949700276,
"learning_rate": 8.039075906967293e-06,
"loss": 0.0956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07014121860265732,
"step": 4885,
"valid_targets_mean": 2335.6,
"valid_targets_min": 516
},
{
"epoch": 5.141955835962145,
"grad_norm": 0.4542172026051046,
"learning_rate": 7.99708959399368e-06,
"loss": 0.0818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08962544798851013,
"step": 4890,
"valid_targets_mean": 2735.6,
"valid_targets_min": 606
},
{
"epoch": 5.147213459516299,
"grad_norm": 0.4764289023428161,
"learning_rate": 7.955185794980117e-06,
"loss": 0.0893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08560174703598022,
"step": 4895,
"valid_targets_mean": 2765.1,
"valid_targets_min": 1052
},
{
"epoch": 5.152471083070452,
"grad_norm": 0.4838651174803042,
"learning_rate": 7.913364797994111e-06,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08318427205085754,
"step": 4900,
"valid_targets_mean": 2794.4,
"valid_targets_min": 933
},
{
"epoch": 5.157728706624606,
"grad_norm": 0.4892959953794859,
"learning_rate": 7.871626890533917e-06,
"loss": 0.0775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0772155225276947,
"step": 4905,
"valid_targets_mean": 2832.8,
"valid_targets_min": 638
},
{
"epoch": 5.162986330178759,
"grad_norm": 0.5676510237286844,
"learning_rate": 7.829972359526626e-06,
"loss": 0.092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09734560549259186,
"step": 4910,
"valid_targets_mean": 2242.8,
"valid_targets_min": 611
},
{
"epoch": 5.168243953732913,
"grad_norm": 0.625272606978109,
"learning_rate": 7.788401491326155e-06,
"loss": 0.0995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11970986425876617,
"step": 4915,
"valid_targets_mean": 1919.2,
"valid_targets_min": 712
},
{
"epoch": 5.173501577287066,
"grad_norm": 0.4197566624914115,
"learning_rate": 7.746914571711264e-06,
"loss": 0.0796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06784413009881973,
"step": 4920,
"valid_targets_mean": 3019.0,
"valid_targets_min": 542
},
{
"epoch": 5.1787592008412195,
"grad_norm": 0.5810050456122732,
"learning_rate": 7.705511885883612e-06,
"loss": 0.1083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09299144148826599,
"step": 4925,
"valid_targets_mean": 2198.4,
"valid_targets_min": 802
},
{
"epoch": 5.184016824395373,
"grad_norm": 0.4701281349667338,
"learning_rate": 7.664193718465814e-06,
"loss": 0.0826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0833558514714241,
"step": 4930,
"valid_targets_mean": 2734.9,
"valid_targets_min": 778
},
{
"epoch": 5.1892744479495265,
"grad_norm": 0.6087811947826366,
"learning_rate": 7.622960353499438e-06,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08990595489740372,
"step": 4935,
"valid_targets_mean": 2070.8,
"valid_targets_min": 647
},
{
"epoch": 5.19453207150368,
"grad_norm": 0.5095848176981579,
"learning_rate": 7.581812074443084e-06,
"loss": 0.0889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08168764412403107,
"step": 4940,
"valid_targets_mean": 2443.6,
"valid_targets_min": 1064
},
{
"epoch": 5.1997896950578335,
"grad_norm": 0.5287408674005241,
"learning_rate": 7.5407491641704464e-06,
"loss": 0.0966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1372952163219452,
"step": 4945,
"valid_targets_mean": 2538.5,
"valid_targets_min": 1242
},
{
"epoch": 5.205047318611987,
"grad_norm": 0.526923008558239,
"learning_rate": 7.499771904968332e-06,
"loss": 0.092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09596161544322968,
"step": 4950,
"valid_targets_mean": 2516.8,
"valid_targets_min": 530
},
{
"epoch": 5.2103049421661405,
"grad_norm": 0.5757081805714579,
"learning_rate": 7.45888057853474e-06,
"loss": 0.088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11269830912351608,
"step": 4955,
"valid_targets_mean": 2153.9,
"valid_targets_min": 727
},
{
"epoch": 5.215562565720294,
"grad_norm": 0.5195623013896692,
"learning_rate": 7.418075465976944e-06,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07585069537162781,
"step": 4960,
"valid_targets_mean": 2242.2,
"valid_targets_min": 766
},
{
"epoch": 5.220820189274448,
"grad_norm": 0.4750117808205412,
"learning_rate": 7.3773568478095184e-06,
"loss": 0.084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07411602884531021,
"step": 4965,
"valid_targets_mean": 2471.2,
"valid_targets_min": 816
},
{
"epoch": 5.226077812828602,
"grad_norm": 0.567042240599365,
"learning_rate": 7.336725003952456e-06,
"loss": 0.0909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0949440449476242,
"step": 4970,
"valid_targets_mean": 2255.4,
"valid_targets_min": 669
},
{
"epoch": 5.231335436382755,
"grad_norm": 0.5877466871826089,
"learning_rate": 7.296180213729196e-06,
"loss": 0.0943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08979032188653946,
"step": 4975,
"valid_targets_mean": 2317.8,
"valid_targets_min": 716
},
{
"epoch": 5.236593059936909,
"grad_norm": 0.7089572534362036,
"learning_rate": 7.255722755864734e-06,
"loss": 0.0917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10060486942529678,
"step": 4980,
"valid_targets_mean": 1797.9,
"valid_targets_min": 743
},
{
"epoch": 5.241850683491062,
"grad_norm": 0.5270847189384095,
"learning_rate": 7.21535290848372e-06,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09048455953598022,
"step": 4985,
"valid_targets_mean": 2466.2,
"valid_targets_min": 333
},
{
"epoch": 5.247108307045216,
"grad_norm": 0.6220379212563706,
"learning_rate": 7.175070949108496e-06,
"loss": 0.0843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09916834533214569,
"step": 4990,
"valid_targets_mean": 2074.2,
"valid_targets_min": 617
},
{
"epoch": 5.252365930599369,
"grad_norm": 0.4094425144504652,
"learning_rate": 7.1348771546572315e-06,
"loss": 0.0788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061037708073854446,
"step": 4995,
"valid_targets_mean": 2724.8,
"valid_targets_min": 570
},
{
"epoch": 5.257623554153523,
"grad_norm": 0.5255626983319233,
"learning_rate": 7.09477180144202e-06,
"loss": 0.0853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08301110565662384,
"step": 5000,
"valid_targets_mean": 2371.1,
"valid_targets_min": 800
},
{
"epoch": 5.262881177707676,
"grad_norm": 0.5317665547747095,
"learning_rate": 7.054755165166945e-06,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08194243907928467,
"step": 5005,
"valid_targets_mean": 2288.0,
"valid_targets_min": 591
},
{
"epoch": 5.26813880126183,
"grad_norm": 0.6110742880061574,
"learning_rate": 7.014827520926206e-06,
"loss": 0.0911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07745426893234253,
"step": 5010,
"valid_targets_mean": 1685.6,
"valid_targets_min": 536
},
{
"epoch": 5.273396424815983,
"grad_norm": 0.6185550001623864,
"learning_rate": 6.9749891432022505e-06,
"loss": 0.0934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0874614417552948,
"step": 5015,
"valid_targets_mean": 2362.5,
"valid_targets_min": 734
},
{
"epoch": 5.278654048370137,
"grad_norm": 0.6215121701984339,
"learning_rate": 6.935240305863844e-06,
"loss": 0.0905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10409186780452728,
"step": 5020,
"valid_targets_mean": 1938.4,
"valid_targets_min": 692
},
{
"epoch": 5.28391167192429,
"grad_norm": 0.5205161352159564,
"learning_rate": 6.895581282164201e-06,
"loss": 0.0832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08407530933618546,
"step": 5025,
"valid_targets_mean": 2421.5,
"valid_targets_min": 763
},
{
"epoch": 5.289169295478444,
"grad_norm": 0.4739553980784417,
"learning_rate": 6.856012344739138e-06,
"loss": 0.0834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07506439089775085,
"step": 5030,
"valid_targets_mean": 2647.1,
"valid_targets_min": 821
},
{
"epoch": 5.294426919032597,
"grad_norm": 0.6644721062928993,
"learning_rate": 6.816533765605144e-06,
"loss": 0.0886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11241534352302551,
"step": 5035,
"valid_targets_mean": 1938.0,
"valid_targets_min": 652
},
{
"epoch": 5.299684542586751,
"grad_norm": 0.468157087965398,
"learning_rate": 6.7771458161575685e-06,
"loss": 0.0825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07443106174468994,
"step": 5040,
"valid_targets_mean": 2810.1,
"valid_targets_min": 776
},
{
"epoch": 5.304942166140904,
"grad_norm": 0.506797870494024,
"learning_rate": 6.737848767168709e-06,
"loss": 0.0942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11336579918861389,
"step": 5045,
"valid_targets_mean": 2916.1,
"valid_targets_min": 195
},
{
"epoch": 5.310199789695058,
"grad_norm": 0.5948917224715727,
"learning_rate": 6.698642888785965e-06,
"loss": 0.0934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09943850338459015,
"step": 5050,
"valid_targets_mean": 2226.2,
"valid_targets_min": 736
},
{
"epoch": 5.315457413249211,
"grad_norm": 0.4570125709648298,
"learning_rate": 6.659528450530006e-06,
"loss": 0.081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07685257494449615,
"step": 5055,
"valid_targets_mean": 2539.8,
"valid_targets_min": 756
},
{
"epoch": 5.320715036803365,
"grad_norm": 0.4607678512776848,
"learning_rate": 6.6205057212928755e-06,
"loss": 0.0861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08634813129901886,
"step": 5060,
"valid_targets_mean": 2880.8,
"valid_targets_min": 739
},
{
"epoch": 5.325972660357518,
"grad_norm": 0.5933753963794773,
"learning_rate": 6.5815749693361645e-06,
"loss": 0.0861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08705602586269379,
"step": 5065,
"valid_targets_mean": 2286.2,
"valid_targets_min": 729
},
{
"epoch": 5.331230283911672,
"grad_norm": 0.5737142436331638,
"learning_rate": 6.542736462289188e-06,
"loss": 0.0939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08779951184988022,
"step": 5070,
"valid_targets_mean": 2010.6,
"valid_targets_min": 614
},
{
"epoch": 5.336487907465825,
"grad_norm": 0.4977445954434311,
"learning_rate": 6.503990467147101e-06,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0765611082315445,
"step": 5075,
"valid_targets_mean": 2795.3,
"valid_targets_min": 1059
},
{
"epoch": 5.341745531019979,
"grad_norm": 0.6259572327424517,
"learning_rate": 6.465337250269086e-06,
"loss": 0.0984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11080735176801682,
"step": 5080,
"valid_targets_mean": 1644.2,
"valid_targets_min": 635
},
{
"epoch": 5.347003154574132,
"grad_norm": 0.6285895537287443,
"learning_rate": 6.426777077376538e-06,
"loss": 0.0877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08999790251255035,
"step": 5085,
"valid_targets_mean": 1772.4,
"valid_targets_min": 753
},
{
"epoch": 5.352260778128286,
"grad_norm": 0.5977737148128844,
"learning_rate": 6.388310213551223e-06,
"loss": 0.0867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09891614317893982,
"step": 5090,
"valid_targets_mean": 2087.9,
"valid_targets_min": 531
},
{
"epoch": 5.357518401682439,
"grad_norm": 0.5508784320517726,
"learning_rate": 6.349936923233422e-06,
"loss": 0.0889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08124659210443497,
"step": 5095,
"valid_targets_mean": 2310.6,
"valid_targets_min": 649
},
{
"epoch": 5.3627760252365935,
"grad_norm": 0.5159614570586936,
"learning_rate": 6.311657470220178e-06,
"loss": 0.085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08114410191774368,
"step": 5100,
"valid_targets_mean": 2617.3,
"valid_targets_min": 665
},
{
"epoch": 5.368033648790747,
"grad_norm": 0.5704928497789014,
"learning_rate": 6.273472117663446e-06,
"loss": 0.0786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06149521842598915,
"step": 5105,
"valid_targets_mean": 2451.3,
"valid_targets_min": 684
},
{
"epoch": 5.3732912723449004,
"grad_norm": 0.653197074846383,
"learning_rate": 6.2353811280682715e-06,
"loss": 0.1034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10560913383960724,
"step": 5110,
"valid_targets_mean": 2101.6,
"valid_targets_min": 639
},
{
"epoch": 5.378548895899054,
"grad_norm": 0.5059796650282158,
"learning_rate": 6.19738476329101e-06,
"loss": 0.0823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08062926679849625,
"step": 5115,
"valid_targets_mean": 2766.2,
"valid_targets_min": 836
},
{
"epoch": 5.383806519453207,
"grad_norm": 0.6299208443881084,
"learning_rate": 6.159483284537533e-06,
"loss": 0.0857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1033320352435112,
"step": 5120,
"valid_targets_mean": 2004.7,
"valid_targets_min": 612
},
{
"epoch": 5.389064143007361,
"grad_norm": 0.4976447594636517,
"learning_rate": 6.121676952361395e-06,
"loss": 0.094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08027186989784241,
"step": 5125,
"valid_targets_mean": 2383.1,
"valid_targets_min": 672
},
{
"epoch": 5.394321766561514,
"grad_norm": 0.5162665920302016,
"learning_rate": 6.083966026662076e-06,
"loss": 0.0954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09540772438049316,
"step": 5130,
"valid_targets_mean": 2081.2,
"valid_targets_min": 647
},
{
"epoch": 5.399579390115668,
"grad_norm": 0.6755188681179325,
"learning_rate": 6.046350766683194e-06,
"loss": 0.0912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08836962282657623,
"step": 5135,
"valid_targets_mean": 1916.9,
"valid_targets_min": 486
},
{
"epoch": 5.404837013669821,
"grad_norm": 0.49184892305156813,
"learning_rate": 6.0088314310107e-06,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07478086650371552,
"step": 5140,
"valid_targets_mean": 2625.5,
"valid_targets_min": 557
},
{
"epoch": 5.410094637223975,
"grad_norm": 0.5427144533180108,
"learning_rate": 5.9714082775711115e-06,
"loss": 0.0896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08238373696804047,
"step": 5145,
"valid_targets_mean": 2412.2,
"valid_targets_min": 583
},
{
"epoch": 5.415352260778128,
"grad_norm": 0.56159728903901,
"learning_rate": 5.934081563629764e-06,
"loss": 0.0895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10774420201778412,
"step": 5150,
"valid_targets_mean": 2574.9,
"valid_targets_min": 1041
},
{
"epoch": 5.420609884332282,
"grad_norm": 0.684217672102224,
"learning_rate": 5.896851545788987e-06,
"loss": 0.0982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1068786159157753,
"step": 5155,
"valid_targets_mean": 1533.3,
"valid_targets_min": 722
},
{
"epoch": 5.425867507886435,
"grad_norm": 0.5129428811204777,
"learning_rate": 5.859718479986407e-06,
"loss": 0.0832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09402783215045929,
"step": 5160,
"valid_targets_mean": 2386.5,
"valid_targets_min": 739
},
{
"epoch": 5.431125131440589,
"grad_norm": 0.5329563235707115,
"learning_rate": 5.822682621493132e-06,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09016478806734085,
"step": 5165,
"valid_targets_mean": 2212.3,
"valid_targets_min": 661
},
{
"epoch": 5.436382754994742,
"grad_norm": 0.5258381654629917,
"learning_rate": 5.7857442249120155e-06,
"loss": 0.0823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09403106570243835,
"step": 5170,
"valid_targets_mean": 2156.6,
"valid_targets_min": 707
},
{
"epoch": 5.441640378548896,
"grad_norm": 0.5265139153110723,
"learning_rate": 5.748903544175934e-06,
"loss": 0.0865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07622712105512619,
"step": 5175,
"valid_targets_mean": 2318.4,
"valid_targets_min": 805
},
{
"epoch": 5.446898002103049,
"grad_norm": 0.47694438996139393,
"learning_rate": 5.712160832545992e-06,
"loss": 0.0886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0758940801024437,
"step": 5180,
"valid_targets_mean": 2229.1,
"valid_targets_min": 782
},
{
"epoch": 5.452155625657203,
"grad_norm": 0.5902731195372731,
"learning_rate": 5.675516342609811e-06,
"loss": 0.0953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09718483686447144,
"step": 5185,
"valid_targets_mean": 2076.9,
"valid_targets_min": 702
},
{
"epoch": 5.457413249211356,
"grad_norm": 0.4761587460632117,
"learning_rate": 5.638970326279802e-06,
"loss": 0.0995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07407154142856598,
"step": 5190,
"valid_targets_mean": 2687.7,
"valid_targets_min": 912
},
{
"epoch": 5.46267087276551,
"grad_norm": 0.535617634825431,
"learning_rate": 5.602523034791407e-06,
"loss": 0.1005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12189748138189316,
"step": 5195,
"valid_targets_mean": 2799.6,
"valid_targets_min": 952
},
{
"epoch": 5.467928496319663,
"grad_norm": 0.553037426047414,
"learning_rate": 5.566174718701378e-06,
"loss": 0.0886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07654684782028198,
"step": 5200,
"valid_targets_mean": 2550.1,
"valid_targets_min": 923
},
{
"epoch": 5.473186119873817,
"grad_norm": 0.6555197998919323,
"learning_rate": 5.529925627886079e-06,
"loss": 0.0871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09734015166759491,
"step": 5205,
"valid_targets_mean": 1867.9,
"valid_targets_min": 684
},
{
"epoch": 5.47844374342797,
"grad_norm": 0.49489188109177146,
"learning_rate": 5.493776011539749e-06,
"loss": 0.0767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07118456065654755,
"step": 5210,
"valid_targets_mean": 2581.7,
"valid_targets_min": 724
},
{
"epoch": 5.483701366982124,
"grad_norm": 0.6184209032961526,
"learning_rate": 5.457726118172761e-06,
"loss": 0.0861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09093640744686127,
"step": 5215,
"valid_targets_mean": 1897.7,
"valid_targets_min": 676
},
{
"epoch": 5.488958990536277,
"grad_norm": 0.5633129479934272,
"learning_rate": 5.421776195609982e-06,
"loss": 0.0873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08384709060192108,
"step": 5220,
"valid_targets_mean": 2077.4,
"valid_targets_min": 859
},
{
"epoch": 5.494216614090431,
"grad_norm": 0.48714039337173504,
"learning_rate": 5.385926490989e-06,
"loss": 0.0811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07210887968540192,
"step": 5225,
"valid_targets_mean": 2639.4,
"valid_targets_min": 574
},
{
"epoch": 5.499474237644584,
"grad_norm": 0.5602380111645523,
"learning_rate": 5.350177250758479e-06,
"loss": 0.1017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1105768233537674,
"step": 5230,
"valid_targets_mean": 2253.5,
"valid_targets_min": 875
},
{
"epoch": 5.504731861198739,
"grad_norm": 0.6155675377801821,
"learning_rate": 5.314528720676424e-06,
"loss": 0.0875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09778967499732971,
"step": 5235,
"valid_targets_mean": 2121.3,
"valid_targets_min": 730
},
{
"epoch": 5.509989484752892,
"grad_norm": 0.6079400830110482,
"learning_rate": 5.2789811458085085e-06,
"loss": 0.0893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09395016729831696,
"step": 5240,
"valid_targets_mean": 2127.2,
"valid_targets_min": 564
},
{
"epoch": 5.515247108307046,
"grad_norm": 0.5574338639075599,
"learning_rate": 5.243534770526404e-06,
"loss": 0.081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07216348499059677,
"step": 5245,
"valid_targets_mean": 2429.6,
"valid_targets_min": 596
},
{
"epoch": 5.520504731861199,
"grad_norm": 0.5442233836773664,
"learning_rate": 5.208189838506074e-06,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08539680391550064,
"step": 5250,
"valid_targets_mean": 2291.8,
"valid_targets_min": 655
},
{
"epoch": 5.5257623554153525,
"grad_norm": 0.6322818515182882,
"learning_rate": 5.172946592726109e-06,
"loss": 0.0945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08994129300117493,
"step": 5255,
"valid_targets_mean": 1991.9,
"valid_targets_min": 731
},
{
"epoch": 5.531019978969506,
"grad_norm": 0.5766441567429282,
"learning_rate": 5.137805275466072e-06,
"loss": 0.0817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08678489923477173,
"step": 5260,
"valid_targets_mean": 2474.0,
"valid_targets_min": 905
},
{
"epoch": 5.5362776025236595,
"grad_norm": 0.5912648441933985,
"learning_rate": 5.1027661283048036e-06,
"loss": 0.0901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10287672281265259,
"step": 5265,
"valid_targets_mean": 2525.1,
"valid_targets_min": 788
},
{
"epoch": 5.541535226077813,
"grad_norm": 0.5398208833982352,
"learning_rate": 5.067829392118775e-06,
"loss": 0.0817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08741910010576248,
"step": 5270,
"valid_targets_mean": 2423.4,
"valid_targets_min": 744
},
{
"epoch": 5.5467928496319665,
"grad_norm": 0.4153235041633056,
"learning_rate": 5.03299530708045e-06,
"loss": 0.0783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06753223389387131,
"step": 5275,
"valid_targets_mean": 2707.9,
"valid_targets_min": 570
},
{
"epoch": 5.55205047318612,
"grad_norm": 0.5993804049489362,
"learning_rate": 4.998264112656617e-06,
"loss": 0.0914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08266077935695648,
"step": 5280,
"valid_targets_mean": 2450.8,
"valid_targets_min": 632
},
{
"epoch": 5.5573080967402735,
"grad_norm": 0.49158789697485294,
"learning_rate": 4.963636047606712e-06,
"loss": 0.0824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09071182459592819,
"step": 5285,
"valid_targets_mean": 2366.0,
"valid_targets_min": 457
},
{
"epoch": 5.562565720294427,
"grad_norm": 0.5733751464405636,
"learning_rate": 4.929111349981244e-06,
"loss": 0.092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09665729105472565,
"step": 5290,
"valid_targets_mean": 2026.9,
"valid_targets_min": 647
},
{
"epoch": 5.5678233438485805,
"grad_norm": 0.6195412458721764,
"learning_rate": 4.894690257120114e-06,
"loss": 0.082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08800621330738068,
"step": 5295,
"valid_targets_mean": 1942.7,
"valid_targets_min": 697
},
{
"epoch": 5.573080967402734,
"grad_norm": 0.5032757942881321,
"learning_rate": 4.860373005650985e-06,
"loss": 0.0781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07049019634723663,
"step": 5300,
"valid_targets_mean": 2433.9,
"valid_targets_min": 800
},
{
"epoch": 5.578338590956887,
"grad_norm": 0.5865934894545591,
"learning_rate": 4.826159831487656e-06,
"loss": 0.0923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10396245121955872,
"step": 5305,
"valid_targets_mean": 2183.4,
"valid_targets_min": 636
},
{
"epoch": 5.583596214511041,
"grad_norm": 0.3948078988960736,
"learning_rate": 4.792050969828474e-06,
"loss": 0.0786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06265468895435333,
"step": 5310,
"valid_targets_mean": 3537.3,
"valid_targets_min": 807
},
{
"epoch": 5.588853838065194,
"grad_norm": 0.4595783336920087,
"learning_rate": 4.758046655154664e-06,
"loss": 0.0922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07591443508863449,
"step": 5315,
"valid_targets_mean": 2284.4,
"valid_targets_min": 526
},
{
"epoch": 5.594111461619348,
"grad_norm": 0.5303180029151328,
"learning_rate": 4.72414712122875e-06,
"loss": 0.0953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07905713468790054,
"step": 5320,
"valid_targets_mean": 2264.1,
"valid_targets_min": 526
},
{
"epoch": 5.599369085173501,
"grad_norm": 0.5163464637524532,
"learning_rate": 4.690352601092954e-06,
"loss": 0.0937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09070698916912079,
"step": 5325,
"valid_targets_mean": 2313.1,
"valid_targets_min": 936
},
{
"epoch": 5.604626708727655,
"grad_norm": 0.515625639071231,
"learning_rate": 4.656663327067563e-06,
"loss": 0.0868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08502315729856491,
"step": 5330,
"valid_targets_mean": 2410.4,
"valid_targets_min": 663
},
{
"epoch": 5.609884332281808,
"grad_norm": 0.5753128046467256,
"learning_rate": 4.623079530749355e-06,
"loss": 0.0882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09436322748661041,
"step": 5335,
"valid_targets_mean": 2534.8,
"valid_targets_min": 680
},
{
"epoch": 5.615141955835962,
"grad_norm": 0.553906598059246,
"learning_rate": 4.589601443010012e-06,
"loss": 0.0853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08646899461746216,
"step": 5340,
"valid_targets_mean": 2483.5,
"valid_targets_min": 666
},
{
"epoch": 5.620399579390115,
"grad_norm": 0.6681476043896348,
"learning_rate": 4.55622929399451e-06,
"loss": 0.0954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13314712047576904,
"step": 5345,
"valid_targets_mean": 1749.9,
"valid_targets_min": 703
},
{
"epoch": 5.625657202944269,
"grad_norm": 0.46089624700762366,
"learning_rate": 4.522963313119564e-06,
"loss": 0.0843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07705404609441757,
"step": 5350,
"valid_targets_mean": 2723.7,
"valid_targets_min": 447
},
{
"epoch": 5.630914826498422,
"grad_norm": 0.444664454552104,
"learning_rate": 4.48980372907202e-06,
"loss": 0.0958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0913049578666687,
"step": 5355,
"valid_targets_mean": 3072.8,
"valid_targets_min": 1289
},
{
"epoch": 5.636172450052577,
"grad_norm": 0.4311136895308548,
"learning_rate": 4.456750769807303e-06,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07031607627868652,
"step": 5360,
"valid_targets_mean": 2942.3,
"valid_targets_min": 459
},
{
"epoch": 5.641430073606729,
"grad_norm": 0.6500569130936695,
"learning_rate": 4.4238046625478635e-06,
"loss": 0.084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08337889611721039,
"step": 5365,
"valid_targets_mean": 2212.2,
"valid_targets_min": 545
},
{
"epoch": 5.646687697160884,
"grad_norm": 0.5728413530834037,
"learning_rate": 4.390965633781579e-06,
"loss": 0.0922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0895937830209732,
"step": 5370,
"valid_targets_mean": 2505.4,
"valid_targets_min": 841
},
{
"epoch": 5.651945320715037,
"grad_norm": 0.4483705223835473,
"learning_rate": 4.358233909260215e-06,
"loss": 0.0964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08544885367155075,
"step": 5375,
"valid_targets_mean": 2688.9,
"valid_targets_min": 818
},
{
"epoch": 5.657202944269191,
"grad_norm": 0.4198114609978518,
"learning_rate": 4.3256097139978934e-06,
"loss": 0.0832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08224814385175705,
"step": 5380,
"valid_targets_mean": 3323.7,
"valid_targets_min": 1275
},
{
"epoch": 5.662460567823344,
"grad_norm": 0.48101414070495335,
"learning_rate": 4.293093272269513e-06,
"loss": 0.0747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07239574939012527,
"step": 5385,
"valid_targets_mean": 2499.7,
"valid_targets_min": 663
},
{
"epoch": 5.667718191377498,
"grad_norm": 0.5646795103123908,
"learning_rate": 4.260684807609217e-06,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08617733418941498,
"step": 5390,
"valid_targets_mean": 2204.4,
"valid_targets_min": 676
},
{
"epoch": 5.672975814931651,
"grad_norm": 0.5210357234668013,
"learning_rate": 4.22838454280887e-06,
"loss": 0.0881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08218752592802048,
"step": 5395,
"valid_targets_mean": 2285.6,
"valid_targets_min": 840
},
{
"epoch": 5.678233438485805,
"grad_norm": 0.6531544978424684,
"learning_rate": 4.196192699916528e-06,
"loss": 0.0927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09651017189025879,
"step": 5400,
"valid_targets_mean": 2171.2,
"valid_targets_min": 687
},
{
"epoch": 5.683491062039958,
"grad_norm": 0.5774453303522198,
"learning_rate": 4.164109500234865e-06,
"loss": 0.096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10746052861213684,
"step": 5405,
"valid_targets_mean": 2573.3,
"valid_targets_min": 719
},
{
"epoch": 5.688748685594112,
"grad_norm": 0.6424409067962772,
"learning_rate": 4.1321351643197235e-06,
"loss": 0.1026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14832936227321625,
"step": 5410,
"valid_targets_mean": 2176.1,
"valid_targets_min": 919
},
{
"epoch": 5.694006309148265,
"grad_norm": 0.6277268282338863,
"learning_rate": 4.100269911978549e-06,
"loss": 0.0828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07900786399841309,
"step": 5415,
"valid_targets_mean": 2172.5,
"valid_targets_min": 665
},
{
"epoch": 5.699263932702419,
"grad_norm": 0.4817563483663239,
"learning_rate": 4.068513962268892e-06,
"loss": 0.0869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07632628083229065,
"step": 5420,
"valid_targets_mean": 2947.7,
"valid_targets_min": 730
},
{
"epoch": 5.704521556256572,
"grad_norm": 0.5004479213669947,
"learning_rate": 4.036867533496895e-06,
"loss": 0.0861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09631700813770294,
"step": 5425,
"valid_targets_mean": 2772.9,
"valid_targets_min": 768
},
{
"epoch": 5.709779179810726,
"grad_norm": 0.6530074009531026,
"learning_rate": 4.00533084321582e-06,
"loss": 0.088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10301493108272552,
"step": 5430,
"valid_targets_mean": 1791.8,
"valid_targets_min": 759
},
{
"epoch": 5.715036803364879,
"grad_norm": 0.524610129797814,
"learning_rate": 3.9739041082245114e-06,
"loss": 0.0924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08901625871658325,
"step": 5435,
"valid_targets_mean": 2381.7,
"valid_targets_min": 713
},
{
"epoch": 5.720294426919033,
"grad_norm": 0.5590991950288964,
"learning_rate": 3.942587544565932e-06,
"loss": 0.0908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09176189452409744,
"step": 5440,
"valid_targets_mean": 2532.6,
"valid_targets_min": 605
},
{
"epoch": 5.725552050473186,
"grad_norm": 0.47196418919574834,
"learning_rate": 3.9113813675256816e-06,
"loss": 0.0824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06913070380687714,
"step": 5445,
"valid_targets_mean": 2493.3,
"valid_targets_min": 557
},
{
"epoch": 5.7308096740273395,
"grad_norm": 0.4397388736856478,
"learning_rate": 3.8802857916305006e-06,
"loss": 0.0947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06952081620693207,
"step": 5450,
"valid_targets_mean": 2595.3,
"valid_targets_min": 663
},
{
"epoch": 5.736067297581493,
"grad_norm": 0.45140113372622415,
"learning_rate": 3.849301030646797e-06,
"loss": 0.085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0651782900094986,
"step": 5455,
"valid_targets_mean": 2937.3,
"valid_targets_min": 857
},
{
"epoch": 5.7413249211356465,
"grad_norm": 0.548536146314351,
"learning_rate": 3.818427297579186e-06,
"loss": 0.0867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08253629505634308,
"step": 5460,
"valid_targets_mean": 2287.4,
"valid_targets_min": 597
},
{
"epoch": 5.7465825446898,
"grad_norm": 0.7331227478959966,
"learning_rate": 3.787664804669027e-06,
"loss": 0.1032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13046732544898987,
"step": 5465,
"valid_targets_mean": 1947.7,
"valid_targets_min": 660
},
{
"epoch": 5.7518401682439535,
"grad_norm": 0.5710492123285679,
"learning_rate": 3.7570137633929647e-06,
"loss": 0.0872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12107446789741516,
"step": 5470,
"valid_targets_mean": 2234.6,
"valid_targets_min": 826
},
{
"epoch": 5.757097791798107,
"grad_norm": 0.45114348672813753,
"learning_rate": 3.7264743844614424e-06,
"loss": 0.0824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06874774396419525,
"step": 5475,
"valid_targets_mean": 2493.6,
"valid_targets_min": 692
},
{
"epoch": 5.7623554153522605,
"grad_norm": 0.7662737736843699,
"learning_rate": 3.6960468778173097e-06,
"loss": 0.09,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07488881796598434,
"step": 5480,
"valid_targets_mean": 1951.9,
"valid_targets_min": 582
},
{
"epoch": 5.767613038906414,
"grad_norm": 0.44970734616562896,
"learning_rate": 3.665731452634347e-06,
"loss": 0.0776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07213976979255676,
"step": 5485,
"valid_targets_mean": 2931.3,
"valid_targets_min": 951
},
{
"epoch": 5.7728706624605675,
"grad_norm": 0.4984338259217311,
"learning_rate": 3.6355283173158153e-06,
"loss": 0.0939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10505960881710052,
"step": 5490,
"valid_targets_mean": 2391.6,
"valid_targets_min": 679
},
{
"epoch": 5.778128286014722,
"grad_norm": 0.5402497583721152,
"learning_rate": 3.6054376794930467e-06,
"loss": 0.0864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1041635200381279,
"step": 5495,
"valid_targets_mean": 2059.9,
"valid_targets_min": 664
},
{
"epoch": 5.783385909568874,
"grad_norm": 0.6305453990943386,
"learning_rate": 3.5754597460240216e-06,
"loss": 0.0857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09370997548103333,
"step": 5500,
"valid_targets_mean": 2417.4,
"valid_targets_min": 568
},
{
"epoch": 5.788643533123029,
"grad_norm": 0.4678951652643369,
"learning_rate": 3.5455947229919185e-06,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08178877830505371,
"step": 5505,
"valid_targets_mean": 2901.9,
"valid_targets_min": 958
},
{
"epoch": 5.793901156677181,
"grad_norm": 0.5906023556607463,
"learning_rate": 3.515842815703716e-06,
"loss": 0.0781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0749162882566452,
"step": 5510,
"valid_targets_mean": 2771.2,
"valid_targets_min": 1008
},
{
"epoch": 5.799158780231336,
"grad_norm": 0.5957726744354533,
"learning_rate": 3.4862042286887943e-06,
"loss": 0.0793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07660531997680664,
"step": 5515,
"valid_targets_mean": 2089.9,
"valid_targets_min": 616
},
{
"epoch": 5.804416403785489,
"grad_norm": 0.4958844336200409,
"learning_rate": 3.456679165697494e-06,
"loss": 0.0949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08415857702493668,
"step": 5520,
"valid_targets_mean": 2608.9,
"valid_targets_min": 749
},
{
"epoch": 5.809674027339643,
"grad_norm": 0.5659252836064446,
"learning_rate": 3.427267829699741e-06,
"loss": 0.0907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08828768134117126,
"step": 5525,
"valid_targets_mean": 2554.5,
"valid_targets_min": 1005
},
{
"epoch": 5.814931650893796,
"grad_norm": 0.528723705289167,
"learning_rate": 3.3979704228836586e-06,
"loss": 0.0917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10861288011074066,
"step": 5530,
"valid_targets_mean": 2562.7,
"valid_targets_min": 699
},
{
"epoch": 5.82018927444795,
"grad_norm": 0.5146879599510277,
"learning_rate": 3.3687871466541424e-06,
"loss": 0.0859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07991898059844971,
"step": 5535,
"valid_targets_mean": 2441.8,
"valid_targets_min": 776
},
{
"epoch": 5.825446898002103,
"grad_norm": 0.5292565366075449,
"learning_rate": 3.339718201631521e-06,
"loss": 0.0827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09508883953094482,
"step": 5540,
"valid_targets_mean": 2610.1,
"valid_targets_min": 970
},
{
"epoch": 5.830704521556257,
"grad_norm": 0.47962227609708746,
"learning_rate": 3.3107637876501352e-06,
"loss": 0.097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07185357809066772,
"step": 5545,
"valid_targets_mean": 2593.1,
"valid_targets_min": 685
},
{
"epoch": 5.83596214511041,
"grad_norm": 0.5548732898629763,
"learning_rate": 3.2819241037569838e-06,
"loss": 0.0831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08948536217212677,
"step": 5550,
"valid_targets_mean": 2108.5,
"valid_targets_min": 659
},
{
"epoch": 5.841219768664564,
"grad_norm": 0.5645995988238837,
"learning_rate": 3.253199348210372e-06,
"loss": 0.0983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0948578268289566,
"step": 5555,
"valid_targets_mean": 1972.9,
"valid_targets_min": 754
},
{
"epoch": 5.846477392218717,
"grad_norm": 0.5996572112895203,
"learning_rate": 3.2245897184785103e-06,
"loss": 0.0857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09942987561225891,
"step": 5560,
"valid_targets_mean": 2082.2,
"valid_targets_min": 507
},
{
"epoch": 5.851735015772871,
"grad_norm": 0.4704668960159087,
"learning_rate": 3.1960954112381825e-06,
"loss": 0.0877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07045850902795792,
"step": 5565,
"valid_targets_mean": 2615.1,
"valid_targets_min": 768
},
{
"epoch": 5.856992639327024,
"grad_norm": 0.6221105353509334,
"learning_rate": 3.1677166223733934e-06,
"loss": 0.0886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08988603204488754,
"step": 5570,
"valid_targets_mean": 1817.7,
"valid_targets_min": 507
},
{
"epoch": 5.862250262881178,
"grad_norm": 0.4881413001729917,
"learning_rate": 3.1394535469740273e-06,
"loss": 0.0844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07280032336711884,
"step": 5575,
"valid_targets_mean": 2507.2,
"valid_targets_min": 716
},
{
"epoch": 5.867507886435331,
"grad_norm": 0.4891925276738254,
"learning_rate": 3.111306379334462e-06,
"loss": 0.0849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08489258587360382,
"step": 5580,
"valid_targets_mean": 2766.6,
"valid_targets_min": 765
},
{
"epoch": 5.872765509989485,
"grad_norm": 0.5362053437582399,
"learning_rate": 3.083275312952301e-06,
"loss": 0.0848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08721506595611572,
"step": 5585,
"valid_targets_mean": 2344.8,
"valid_targets_min": 577
},
{
"epoch": 5.878023133543638,
"grad_norm": 0.434492361782878,
"learning_rate": 3.055360540527006e-06,
"loss": 0.0824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06373853981494904,
"step": 5590,
"valid_targets_mean": 2705.3,
"valid_targets_min": 530
},
{
"epoch": 5.883280757097792,
"grad_norm": 0.5858458093131826,
"learning_rate": 3.0275622539585556e-06,
"loss": 0.0968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09622153639793396,
"step": 5595,
"valid_targets_mean": 2104.0,
"valid_targets_min": 724
},
{
"epoch": 5.888538380651945,
"grad_norm": 0.45417862459823877,
"learning_rate": 2.999880644346165e-06,
"loss": 0.0839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07301604002714157,
"step": 5600,
"valid_targets_mean": 2815.8,
"valid_targets_min": 616
},
{
"epoch": 5.893796004206099,
"grad_norm": 0.5127927963734046,
"learning_rate": 2.9723159019869597e-06,
"loss": 0.0858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07359402626752853,
"step": 5605,
"valid_targets_mean": 2428.5,
"valid_targets_min": 740
},
{
"epoch": 5.899053627760252,
"grad_norm": 0.64273765132575,
"learning_rate": 2.9448682163746413e-06,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09796072542667389,
"step": 5610,
"valid_targets_mean": 1890.1,
"valid_targets_min": 734
},
{
"epoch": 5.904311251314406,
"grad_norm": 0.5802948362858069,
"learning_rate": 2.917537776198216e-06,
"loss": 0.0917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09772264957427979,
"step": 5615,
"valid_targets_mean": 2369.3,
"valid_targets_min": 605
},
{
"epoch": 5.909568874868559,
"grad_norm": 0.47503663884897634,
"learning_rate": 2.8903247693406932e-06,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08762972056865692,
"step": 5620,
"valid_targets_mean": 2411.2,
"valid_targets_min": 618
},
{
"epoch": 5.914826498422713,
"grad_norm": 0.4533706973115579,
"learning_rate": 2.863229382877777e-06,
"loss": 0.0884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06960652023553848,
"step": 5625,
"valid_targets_mean": 2516.8,
"valid_targets_min": 610
},
{
"epoch": 5.920084121976867,
"grad_norm": 0.5992984312981956,
"learning_rate": 2.8362518030765904e-06,
"loss": 0.0874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08197487890720367,
"step": 5630,
"valid_targets_mean": 1861.7,
"valid_targets_min": 633
},
{
"epoch": 5.9253417455310196,
"grad_norm": 0.5456357448566179,
"learning_rate": 2.8093922153944065e-06,
"loss": 0.0984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08513805270195007,
"step": 5635,
"valid_targets_mean": 2709.4,
"valid_targets_min": 807
},
{
"epoch": 5.930599369085174,
"grad_norm": 0.6490203054458612,
"learning_rate": 2.782650804477347e-06,
"loss": 0.0899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10770347714424133,
"step": 5640,
"valid_targets_mean": 1824.4,
"valid_targets_min": 895
},
{
"epoch": 5.9358569926393265,
"grad_norm": 0.49867988696714866,
"learning_rate": 2.7560277541591427e-06,
"loss": 0.0865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08890093863010406,
"step": 5645,
"valid_targets_mean": 2237.4,
"valid_targets_min": 1015
},
{
"epoch": 5.941114616193481,
"grad_norm": 0.6082667419874155,
"learning_rate": 2.7295232474598445e-06,
"loss": 0.0975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09509513527154922,
"step": 5650,
"valid_targets_mean": 1942.3,
"valid_targets_min": 337
},
{
"epoch": 5.946372239747634,
"grad_norm": 0.496042340568446,
"learning_rate": 2.703137466584571e-06,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07633326947689056,
"step": 5655,
"valid_targets_mean": 2645.0,
"valid_targets_min": 721
},
{
"epoch": 5.951629863301788,
"grad_norm": 0.5897513325385411,
"learning_rate": 2.6768705929222827e-06,
"loss": 0.0786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08483654260635376,
"step": 5660,
"valid_targets_mean": 2241.8,
"valid_targets_min": 680
},
{
"epoch": 5.956887486855941,
"grad_norm": 0.6370513621413806,
"learning_rate": 2.6507228070444922e-06,
"loss": 0.0917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11121095716953278,
"step": 5665,
"valid_targets_mean": 2336.7,
"valid_targets_min": 705
},
{
"epoch": 5.962145110410095,
"grad_norm": 0.4507262999169322,
"learning_rate": 2.6246942887040416e-06,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.073326975107193,
"step": 5670,
"valid_targets_mean": 3020.1,
"valid_targets_min": 847
},
{
"epoch": 5.967402733964248,
"grad_norm": 0.5723282245002131,
"learning_rate": 2.5987852168338922e-06,
"loss": 0.0786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08216974139213562,
"step": 5675,
"valid_targets_mean": 2300.0,
"valid_targets_min": 647
},
{
"epoch": 5.972660357518402,
"grad_norm": 0.4952944807697732,
"learning_rate": 2.5729957695458454e-06,
"loss": 0.0855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08002395182847977,
"step": 5680,
"valid_targets_mean": 2569.4,
"valid_targets_min": 732
},
{
"epoch": 5.977917981072555,
"grad_norm": 0.5812148747322718,
"learning_rate": 2.5473261241293547e-06,
"loss": 0.0896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08404475450515747,
"step": 5685,
"valid_targets_mean": 2359.4,
"valid_targets_min": 584
},
{
"epoch": 5.983175604626709,
"grad_norm": 0.7609849333124278,
"learning_rate": 2.521776457050302e-06,
"loss": 0.0855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0982176810503006,
"step": 5690,
"valid_targets_mean": 1734.2,
"valid_targets_min": 714
},
{
"epoch": 5.988433228180862,
"grad_norm": 0.6982768349055034,
"learning_rate": 2.4963469439497703e-06,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09887810051441193,
"step": 5695,
"valid_targets_mean": 1699.8,
"valid_targets_min": 647
},
{
"epoch": 5.993690851735016,
"grad_norm": 0.6758395777894055,
"learning_rate": 2.4710377596428404e-06,
"loss": 0.0878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09870202094316483,
"step": 5700,
"valid_targets_mean": 1829.5,
"valid_targets_min": 697
},
{
"epoch": 5.998948475289169,
"grad_norm": 0.4557440930637309,
"learning_rate": 2.4458490781174084e-06,
"loss": 0.0888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07640472054481506,
"step": 5705,
"valid_targets_mean": 3156.1,
"valid_targets_min": 815
},
{
"epoch": 6.004206098843323,
"grad_norm": 0.6311486181160924,
"learning_rate": 2.4207810725329583e-06,
"loss": 0.0917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11960560083389282,
"step": 5710,
"valid_targets_mean": 2027.1,
"valid_targets_min": 720
},
{
"epoch": 6.009463722397476,
"grad_norm": 0.4301873346168057,
"learning_rate": 2.395833915219401e-06,
"loss": 0.0801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06634050607681274,
"step": 5715,
"valid_targets_mean": 2516.6,
"valid_targets_min": 826
},
{
"epoch": 6.01472134595163,
"grad_norm": 0.4602129645627361,
"learning_rate": 2.3710077776758713e-06,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07114356011152267,
"step": 5720,
"valid_targets_mean": 2623.8,
"valid_targets_min": 740
},
{
"epoch": 6.019978969505783,
"grad_norm": 0.4678338969468432,
"learning_rate": 2.3463028305695447e-06,
"loss": 0.0757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06978046149015427,
"step": 5725,
"valid_targets_mean": 2589.9,
"valid_targets_min": 919
},
{
"epoch": 6.025236593059937,
"grad_norm": 0.5537062921815175,
"learning_rate": 2.3217192437344925e-06,
"loss": 0.0851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08498544991016388,
"step": 5730,
"valid_targets_mean": 2447.1,
"valid_targets_min": 853
},
{
"epoch": 6.03049421661409,
"grad_norm": 0.5998614066943314,
"learning_rate": 2.2972571861704784e-06,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07053668051958084,
"step": 5735,
"valid_targets_mean": 2536.7,
"valid_targets_min": 539
},
{
"epoch": 6.035751840168244,
"grad_norm": 0.4943978335545759,
"learning_rate": 2.2729168260418224e-06,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0674082338809967,
"step": 5740,
"valid_targets_mean": 2453.1,
"valid_targets_min": 912
},
{
"epoch": 6.041009463722397,
"grad_norm": 0.6658790399701576,
"learning_rate": 2.2486983306762332e-06,
"loss": 0.0867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0960560292005539,
"step": 5745,
"valid_targets_mean": 1916.3,
"valid_targets_min": 774
},
{
"epoch": 6.046267087276551,
"grad_norm": 0.5097721105025195,
"learning_rate": 2.224601866563665e-06,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06594580411911011,
"step": 5750,
"valid_targets_mean": 2288.9,
"valid_targets_min": 605
},
{
"epoch": 6.051524710830704,
"grad_norm": 0.44053964580255667,
"learning_rate": 2.2006275993551563e-06,
"loss": 0.0832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07779178768396378,
"step": 5755,
"valid_targets_mean": 2928.6,
"valid_targets_min": 1062
},
{
"epoch": 6.056782334384858,
"grad_norm": 0.5286826672086139,
"learning_rate": 2.176775693861719e-06,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10188593715429306,
"step": 5760,
"valid_targets_mean": 2638.4,
"valid_targets_min": 692
},
{
"epoch": 6.062039957939011,
"grad_norm": 0.5902172679053457,
"learning_rate": 2.1530463140531886e-06,
"loss": 0.0759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07679794728755951,
"step": 5765,
"valid_targets_mean": 2029.1,
"valid_targets_min": 580
},
{
"epoch": 6.067297581493165,
"grad_norm": 0.5904499596922234,
"learning_rate": 2.129439623057077e-06,
"loss": 0.0795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08259987086057663,
"step": 5770,
"valid_targets_mean": 1961.1,
"valid_targets_min": 641
},
{
"epoch": 6.072555205047319,
"grad_norm": 0.5773865011711439,
"learning_rate": 2.105955783157498e-06,
"loss": 0.0744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08179889619350433,
"step": 5775,
"valid_targets_mean": 2238.8,
"valid_targets_min": 635
},
{
"epoch": 6.0778128286014725,
"grad_norm": 0.698689796019584,
"learning_rate": 2.0825949557940174e-06,
"loss": 0.0734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0948541909456253,
"step": 5780,
"valid_targets_mean": 1778.4,
"valid_targets_min": 669
},
{
"epoch": 6.083070452155626,
"grad_norm": 0.5162464182641611,
"learning_rate": 2.059357301560547e-06,
"loss": 0.0713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08193211257457733,
"step": 5785,
"valid_targets_mean": 2498.9,
"valid_targets_min": 523
},
{
"epoch": 6.0883280757097795,
"grad_norm": 0.5331890474579141,
"learning_rate": 2.036242980204244e-06,
"loss": 0.0856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06974825263023376,
"step": 5790,
"valid_targets_mean": 2300.2,
"valid_targets_min": 797
},
{
"epoch": 6.093585699263933,
"grad_norm": 0.5139405965645236,
"learning_rate": 2.0132521506244294e-06,
"loss": 0.0799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07520533353090286,
"step": 5795,
"valid_targets_mean": 2326.1,
"valid_targets_min": 931
},
{
"epoch": 6.0988433228180865,
"grad_norm": 0.5679383487761702,
"learning_rate": 1.9903849708714664e-06,
"loss": 0.0877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09307673573493958,
"step": 5800,
"valid_targets_mean": 2668.4,
"valid_targets_min": 1101
},
{
"epoch": 6.10410094637224,
"grad_norm": 0.5893786641548519,
"learning_rate": 1.967641598145684e-06,
"loss": 0.0845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11470180749893188,
"step": 5805,
"valid_targets_mean": 2223.9,
"valid_targets_min": 848
},
{
"epoch": 6.1093585699263935,
"grad_norm": 0.6749860961486656,
"learning_rate": 1.9450221887963194e-06,
"loss": 0.0911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09860561043024063,
"step": 5810,
"valid_targets_mean": 2228.6,
"valid_targets_min": 740
},
{
"epoch": 6.114616193480547,
"grad_norm": 0.5461422699973559,
"learning_rate": 1.922526898320407e-06,
"loss": 0.0818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07981450855731964,
"step": 5815,
"valid_targets_mean": 1969.8,
"valid_targets_min": 711
},
{
"epoch": 6.1198738170347005,
"grad_norm": 0.48062831708279297,
"learning_rate": 1.900155881361727e-06,
"loss": 0.0895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07658898830413818,
"step": 5820,
"valid_targets_mean": 2999.1,
"valid_targets_min": 1327
},
{
"epoch": 6.125131440588854,
"grad_norm": 0.6836225155472394,
"learning_rate": 1.8779092917097564e-06,
"loss": 0.0833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08772972226142883,
"step": 5825,
"valid_targets_mean": 1539.4,
"valid_targets_min": 661
},
{
"epoch": 6.130389064143007,
"grad_norm": 0.5333913803219947,
"learning_rate": 1.85578728229858e-06,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06963882595300674,
"step": 5830,
"valid_targets_mean": 2270.5,
"valid_targets_min": 527
},
{
"epoch": 6.135646687697161,
"grad_norm": 0.41092806355355926,
"learning_rate": 1.8337900052058732e-06,
"loss": 0.084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0618227943778038,
"step": 5835,
"valid_targets_mean": 3200.2,
"valid_targets_min": 1396
},
{
"epoch": 6.140904311251314,
"grad_norm": 0.5353628490169989,
"learning_rate": 1.811917611651821e-06,
"loss": 0.0898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08164452761411667,
"step": 5840,
"valid_targets_mean": 2353.9,
"valid_targets_min": 635
},
{
"epoch": 6.146161934805468,
"grad_norm": 0.4547484195439129,
"learning_rate": 1.7901702519981068e-06,
"loss": 0.0759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07978129386901855,
"step": 5845,
"valid_targets_mean": 2846.4,
"valid_targets_min": 774
},
{
"epoch": 6.151419558359621,
"grad_norm": 0.6360039238386269,
"learning_rate": 1.7685480757468765e-06,
"loss": 0.0756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09062075614929199,
"step": 5850,
"valid_targets_mean": 2170.2,
"valid_targets_min": 730
},
{
"epoch": 6.156677181913775,
"grad_norm": 0.570311220403222,
"learning_rate": 1.7470512315396894e-06,
"loss": 0.079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0884757786989212,
"step": 5855,
"valid_targets_mean": 2211.8,
"valid_targets_min": 764
},
{
"epoch": 6.161934805467928,
"grad_norm": 0.5645789911037258,
"learning_rate": 1.7256798671565111e-06,
"loss": 0.0869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08335705101490021,
"step": 5860,
"valid_targets_mean": 2381.9,
"valid_targets_min": 602
},
{
"epoch": 6.167192429022082,
"grad_norm": 0.486639090978762,
"learning_rate": 1.7044341295147116e-06,
"loss": 0.0748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06472732871770859,
"step": 5865,
"valid_targets_mean": 2881.5,
"valid_targets_min": 797
},
{
"epoch": 6.172450052576235,
"grad_norm": 0.6019317506830465,
"learning_rate": 1.683314164668024e-06,
"loss": 0.0769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07349525392055511,
"step": 5870,
"valid_targets_mean": 1929.8,
"valid_targets_min": 742
},
{
"epoch": 6.177707676130389,
"grad_norm": 0.5556573521483458,
"learning_rate": 1.6623201178055603e-06,
"loss": 0.0811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07919690012931824,
"step": 5875,
"valid_targets_mean": 2386.4,
"valid_targets_min": 607
},
{
"epoch": 6.182965299684542,
"grad_norm": 0.5747006002411422,
"learning_rate": 1.6414521332508183e-06,
"loss": 0.0843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0947389081120491,
"step": 5880,
"valid_targets_mean": 2145.9,
"valid_targets_min": 350
},
{
"epoch": 6.188222923238696,
"grad_norm": 0.59557809966825,
"learning_rate": 1.6207103544606795e-06,
"loss": 0.0791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08798443526029587,
"step": 5885,
"valid_targets_mean": 1905.6,
"valid_targets_min": 726
},
{
"epoch": 6.193480546792849,
"grad_norm": 0.672818039827917,
"learning_rate": 1.6000949240244047e-06,
"loss": 0.085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08742979168891907,
"step": 5890,
"valid_targets_mean": 1696.6,
"valid_targets_min": 726
},
{
"epoch": 6.198738170347003,
"grad_norm": 0.5764204219071091,
"learning_rate": 1.5796059836626998e-06,
"loss": 0.087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0877244770526886,
"step": 5895,
"valid_targets_mean": 2382.4,
"valid_targets_min": 884
},
{
"epoch": 6.203995793901156,
"grad_norm": 0.4665849612615211,
"learning_rate": 1.5592436742267048e-06,
"loss": 0.0704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0696813240647316,
"step": 5900,
"valid_targets_mean": 2860.2,
"valid_targets_min": 790
},
{
"epoch": 6.20925341745531,
"grad_norm": 0.5700320665439652,
"learning_rate": 1.5390081356970331e-06,
"loss": 0.0788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08158508688211441,
"step": 5905,
"valid_targets_mean": 2091.7,
"valid_targets_min": 704
},
{
"epoch": 6.214511041009464,
"grad_norm": 0.6352796922081088,
"learning_rate": 1.5188995071828117e-06,
"loss": 0.0853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08770360797643661,
"step": 5910,
"valid_targets_mean": 2132.7,
"valid_targets_min": 767
},
{
"epoch": 6.219768664563618,
"grad_norm": 0.5309122306086711,
"learning_rate": 1.498917926920731e-06,
"loss": 0.0745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07387938350439072,
"step": 5915,
"valid_targets_mean": 2518.3,
"valid_targets_min": 699
},
{
"epoch": 6.225026288117771,
"grad_norm": 0.46769653644810577,
"learning_rate": 1.4790635322740855e-06,
"loss": 0.0785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06388302147388458,
"step": 5920,
"valid_targets_mean": 2821.1,
"valid_targets_min": 959
},
{
"epoch": 6.230283911671925,
"grad_norm": 0.5717791177010827,
"learning_rate": 1.4593364597318305e-06,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07935073971748352,
"step": 5925,
"valid_targets_mean": 2100.4,
"valid_targets_min": 693
},
{
"epoch": 6.235541535226078,
"grad_norm": 0.688283660293618,
"learning_rate": 1.4397368449076443e-06,
"loss": 0.0806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08895394206047058,
"step": 5930,
"valid_targets_mean": 2100.2,
"valid_targets_min": 484
},
{
"epoch": 6.240799158780232,
"grad_norm": 0.3864338862766506,
"learning_rate": 1.4202648225390103e-06,
"loss": 0.0759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05905337631702423,
"step": 5935,
"valid_targets_mean": 3502.8,
"valid_targets_min": 559
},
{
"epoch": 6.246056782334385,
"grad_norm": 0.5867996213511845,
"learning_rate": 1.4009205264862646e-06,
"loss": 0.0878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08197467029094696,
"step": 5940,
"valid_targets_mean": 2281.4,
"valid_targets_min": 597
},
{
"epoch": 6.251314405888539,
"grad_norm": 0.7681107562041767,
"learning_rate": 1.3817040897316903e-06,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10609617829322815,
"step": 5945,
"valid_targets_mean": 1774.8,
"valid_targets_min": 393
},
{
"epoch": 6.256572029442692,
"grad_norm": 0.5882457221242022,
"learning_rate": 1.362615644378611e-06,
"loss": 0.0704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07970559597015381,
"step": 5950,
"valid_targets_mean": 1882.4,
"valid_targets_min": 494
},
{
"epoch": 6.261829652996846,
"grad_norm": 0.5446473062867583,
"learning_rate": 1.3436553216504721e-06,
"loss": 0.0725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06973997503519058,
"step": 5955,
"valid_targets_mean": 2178.6,
"valid_targets_min": 827
},
{
"epoch": 6.267087276550999,
"grad_norm": 0.5430430157157021,
"learning_rate": 1.324823251889924e-06,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06701123714447021,
"step": 5960,
"valid_targets_mean": 2009.4,
"valid_targets_min": 741
},
{
"epoch": 6.2723449001051526,
"grad_norm": 0.5966724311585041,
"learning_rate": 1.3061195645579661e-06,
"loss": 0.0861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08821358531713486,
"step": 5965,
"valid_targets_mean": 2258.1,
"valid_targets_min": 650
},
{
"epoch": 6.277602523659306,
"grad_norm": 0.5595837800247703,
"learning_rate": 1.2875443882330218e-06,
"loss": 0.0812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0767974704504013,
"step": 5970,
"valid_targets_mean": 2147.6,
"valid_targets_min": 682
},
{
"epoch": 6.2828601472134595,
"grad_norm": 0.6024425827163108,
"learning_rate": 1.269097850610066e-06,
"loss": 0.0756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07450282573699951,
"step": 5975,
"valid_targets_mean": 2046.2,
"valid_targets_min": 625
},
{
"epoch": 6.288117770767613,
"grad_norm": 0.5082908028436955,
"learning_rate": 1.250780078499747e-06,
"loss": 0.0787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07629716396331787,
"step": 5980,
"valid_targets_mean": 2939.5,
"valid_targets_min": 792
},
{
"epoch": 6.2933753943217665,
"grad_norm": 0.5530591409149812,
"learning_rate": 1.2325911978275196e-06,
"loss": 0.0851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08858577907085419,
"step": 5985,
"valid_targets_mean": 2107.3,
"valid_targets_min": 737
},
{
"epoch": 6.29863301787592,
"grad_norm": 0.42155331558211045,
"learning_rate": 1.214531333632769e-06,
"loss": 0.0708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06619024276733398,
"step": 5990,
"valid_targets_mean": 3019.6,
"valid_targets_min": 780
},
{
"epoch": 6.3038906414300735,
"grad_norm": 0.579312455259237,
"learning_rate": 1.1966006100679596e-06,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07520725578069687,
"step": 5995,
"valid_targets_mean": 2269.9,
"valid_targets_min": 885
},
{
"epoch": 6.309148264984227,
"grad_norm": 0.5916456338865763,
"learning_rate": 1.1787991503977846e-06,
"loss": 0.0843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08871051669120789,
"step": 6000,
"valid_targets_mean": 2106.0,
"valid_targets_min": 699
},
{
"epoch": 6.3144058885383805,
"grad_norm": 0.6418660695053835,
"learning_rate": 1.1611270769983051e-06,
"loss": 0.0878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10253676772117615,
"step": 6005,
"valid_targets_mean": 1845.0,
"valid_targets_min": 858
},
{
"epoch": 6.319663512092534,
"grad_norm": 0.4930153985822729,
"learning_rate": 1.143584511356115e-06,
"loss": 0.0769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06924517452716827,
"step": 6010,
"valid_targets_mean": 2813.2,
"valid_targets_min": 660
},
{
"epoch": 6.3249211356466875,
"grad_norm": 0.7730944577417425,
"learning_rate": 1.1261715740675205e-06,
"loss": 0.0964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10961425304412842,
"step": 6015,
"valid_targets_mean": 1668.3,
"valid_targets_min": 856
},
{
"epoch": 6.330178759200841,
"grad_norm": 0.5569057386584306,
"learning_rate": 1.108888384837683e-06,
"loss": 0.0831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07794185727834702,
"step": 6020,
"valid_targets_mean": 2372.7,
"valid_targets_min": 633
},
{
"epoch": 6.335436382754994,
"grad_norm": 0.6341954198977304,
"learning_rate": 1.0917350624798262e-06,
"loss": 0.0915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0955299586057663,
"step": 6025,
"valid_targets_mean": 1871.8,
"valid_targets_min": 801
},
{
"epoch": 6.340694006309148,
"grad_norm": 0.7459273664348837,
"learning_rate": 1.07471172491439e-06,
"loss": 0.0857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09329669177532196,
"step": 6030,
"valid_targets_mean": 2203.2,
"valid_targets_min": 658
},
{
"epoch": 6.345951629863301,
"grad_norm": 0.6236134660278216,
"learning_rate": 1.0578184891682408e-06,
"loss": 0.0834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0735333263874054,
"step": 6035,
"valid_targets_mean": 1820.4,
"valid_targets_min": 666
},
{
"epoch": 6.351209253417455,
"grad_norm": 0.4539557672064203,
"learning_rate": 1.041055471373864e-06,
"loss": 0.0691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06271669268608093,
"step": 6040,
"valid_targets_mean": 3111.9,
"valid_targets_min": 695
},
{
"epoch": 6.356466876971609,
"grad_norm": 0.5303228163353034,
"learning_rate": 1.0244227867685597e-06,
"loss": 0.0817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07431896030902863,
"step": 6045,
"valid_targets_mean": 2555.9,
"valid_targets_min": 920
},
{
"epoch": 6.361724500525763,
"grad_norm": 0.6317922633406078,
"learning_rate": 1.0079205496936484e-06,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09275339543819427,
"step": 6050,
"valid_targets_mean": 2014.0,
"valid_targets_min": 657
},
{
"epoch": 6.366982124079916,
"grad_norm": 0.5400098594514727,
"learning_rate": 9.915488735936995e-07,
"loss": 0.0878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07970055937767029,
"step": 6055,
"valid_targets_mean": 2397.6,
"valid_targets_min": 799
},
{
"epoch": 6.37223974763407,
"grad_norm": 0.5445260585602347,
"learning_rate": 9.753078710157316e-07,
"loss": 0.0803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08175334334373474,
"step": 6060,
"valid_targets_mean": 2710.8,
"valid_targets_min": 588
},
{
"epoch": 6.377497371188223,
"grad_norm": 0.5493161794666009,
"learning_rate": 9.59197653608448e-07,
"loss": 0.0901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08461320400238037,
"step": 6065,
"valid_targets_mean": 2250.4,
"valid_targets_min": 733
},
{
"epoch": 6.382754994742377,
"grad_norm": 0.6039116683957063,
"learning_rate": 9.432183321214805e-07,
"loss": 0.0809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08243244886398315,
"step": 6070,
"valid_targets_mean": 2346.0,
"valid_targets_min": 708
},
{
"epoch": 6.38801261829653,
"grad_norm": 0.6290483447472189,
"learning_rate": 9.273700164046162e-07,
"loss": 0.0857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0974254161119461,
"step": 6075,
"valid_targets_mean": 1893.2,
"valid_targets_min": 808
},
{
"epoch": 6.393270241850684,
"grad_norm": 0.5463570769017867,
"learning_rate": 9.11652815407027e-07,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07830381393432617,
"step": 6080,
"valid_targets_mean": 2322.2,
"valid_targets_min": 824
},
{
"epoch": 6.398527865404837,
"grad_norm": 0.5368764660983166,
"learning_rate": 8.960668371765569e-07,
"loss": 0.078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07296697795391083,
"step": 6085,
"valid_targets_mean": 2090.9,
"valid_targets_min": 634
},
{
"epoch": 6.403785488958991,
"grad_norm": 0.6707918783592765,
"learning_rate": 8.806121888589492e-07,
"loss": 0.0835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09032337367534637,
"step": 6090,
"valid_targets_mean": 1574.7,
"valid_targets_min": 693
},
{
"epoch": 6.409043112513144,
"grad_norm": 0.5741397453146982,
"learning_rate": 8.652889766971229e-07,
"loss": 0.0959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07402016967535019,
"step": 6095,
"valid_targets_mean": 2014.1,
"valid_targets_min": 714
},
{
"epoch": 6.414300736067298,
"grad_norm": 0.4317367622445938,
"learning_rate": 8.500973060304374e-07,
"loss": 0.0795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07480774074792862,
"step": 6100,
"valid_targets_mean": 2856.8,
"valid_targets_min": 746
},
{
"epoch": 6.419558359621451,
"grad_norm": 0.5434627700414081,
"learning_rate": 8.350372812939778e-07,
"loss": 0.0781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07698965072631836,
"step": 6105,
"valid_targets_mean": 2252.5,
"valid_targets_min": 472
},
{
"epoch": 6.424815983175605,
"grad_norm": 0.48770613140521873,
"learning_rate": 8.201090060178174e-07,
"loss": 0.0831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07912035286426544,
"step": 6110,
"valid_targets_mean": 2754.8,
"valid_targets_min": 721
},
{
"epoch": 6.430073606729758,
"grad_norm": 0.4021173515623404,
"learning_rate": 8.053125828263297e-07,
"loss": 0.0752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06188628077507019,
"step": 6115,
"valid_targets_mean": 3266.8,
"valid_targets_min": 935
},
{
"epoch": 6.435331230283912,
"grad_norm": 0.6271981219314893,
"learning_rate": 7.906481134374688e-07,
"loss": 0.0765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08953511714935303,
"step": 6120,
"valid_targets_mean": 2653.8,
"valid_targets_min": 764
},
{
"epoch": 6.440588853838065,
"grad_norm": 0.49154771586648777,
"learning_rate": 7.761156986620677e-07,
"loss": 0.083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06230591982603073,
"step": 6125,
"valid_targets_mean": 2427.1,
"valid_targets_min": 572
},
{
"epoch": 6.445846477392219,
"grad_norm": 0.5658997963287195,
"learning_rate": 7.617154384031545e-07,
"loss": 0.081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08193057775497437,
"step": 6130,
"valid_targets_mean": 2087.7,
"valid_targets_min": 819
},
{
"epoch": 6.451104100946372,
"grad_norm": 0.5422618785120368,
"learning_rate": 7.474474316552638e-07,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09044471383094788,
"step": 6135,
"valid_targets_mean": 2267.8,
"valid_targets_min": 629
},
{
"epoch": 6.456361724500526,
"grad_norm": 0.4949849706601599,
"learning_rate": 7.33311776503749e-07,
"loss": 0.0779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07225309312343597,
"step": 6140,
"valid_targets_mean": 2734.7,
"valid_targets_min": 685
},
{
"epoch": 6.461619348054679,
"grad_norm": 0.7331318946935437,
"learning_rate": 7.193085701241175e-07,
"loss": 0.0828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08906973898410797,
"step": 6145,
"valid_targets_mean": 1425.6,
"valid_targets_min": 676
},
{
"epoch": 6.466876971608833,
"grad_norm": 0.6736935827439013,
"learning_rate": 7.054379087813568e-07,
"loss": 0.0786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08986799418926239,
"step": 6150,
"valid_targets_mean": 1876.6,
"valid_targets_min": 614
},
{
"epoch": 6.472134595162986,
"grad_norm": 0.5008524689755908,
"learning_rate": 6.916998878292691e-07,
"loss": 0.0755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06841963529586792,
"step": 6155,
"valid_targets_mean": 2242.1,
"valid_targets_min": 697
},
{
"epoch": 6.4773922187171395,
"grad_norm": 0.4918950725934552,
"learning_rate": 6.780946017098289e-07,
"loss": 0.0817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07490278780460358,
"step": 6160,
"valid_targets_mean": 2857.0,
"valid_targets_min": 848
},
{
"epoch": 6.482649842271293,
"grad_norm": 0.49546769919969147,
"learning_rate": 6.646221439525225e-07,
"loss": 0.0842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06905891001224518,
"step": 6165,
"valid_targets_mean": 2577.3,
"valid_targets_min": 702
},
{
"epoch": 6.4879074658254465,
"grad_norm": 0.5555565151909756,
"learning_rate": 6.512826071737021e-07,
"loss": 0.0812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12128590047359467,
"step": 6170,
"valid_targets_mean": 2214.1,
"valid_targets_min": 478
},
{
"epoch": 6.4931650893796,
"grad_norm": 0.5370080914337216,
"learning_rate": 6.380760830759669e-07,
"loss": 0.0826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0735749676823616,
"step": 6175,
"valid_targets_mean": 2156.8,
"valid_targets_min": 531
},
{
"epoch": 6.498422712933754,
"grad_norm": 0.5117520718386905,
"learning_rate": 6.250026624475092e-07,
"loss": 0.0759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07520468533039093,
"step": 6180,
"valid_targets_mean": 2463.1,
"valid_targets_min": 765
},
{
"epoch": 6.503680336487907,
"grad_norm": 0.5669605157655614,
"learning_rate": 6.12062435161509e-07,
"loss": 0.0851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0995398461818695,
"step": 6185,
"valid_targets_mean": 2554.8,
"valid_targets_min": 826
},
{
"epoch": 6.508937960042061,
"grad_norm": 0.5853351573738615,
"learning_rate": 5.992554901755121e-07,
"loss": 0.0913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09550810605287552,
"step": 6190,
"valid_targets_mean": 2431.9,
"valid_targets_min": 717
},
{
"epoch": 6.514195583596215,
"grad_norm": 0.4802008536339129,
"learning_rate": 5.865819155308039e-07,
"loss": 0.0806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06486310809850693,
"step": 6195,
"valid_targets_mean": 2594.8,
"valid_targets_min": 880
},
{
"epoch": 6.519453207150368,
"grad_norm": 0.504005501037842,
"learning_rate": 5.740417983518253e-07,
"loss": 0.0825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.068062424659729,
"step": 6200,
"valid_targets_mean": 2458.5,
"valid_targets_min": 793
},
{
"epoch": 6.524710830704522,
"grad_norm": 0.6026058547119624,
"learning_rate": 5.61635224845567e-07,
"loss": 0.0794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10778342187404633,
"step": 6205,
"valid_targets_mean": 2191.8,
"valid_targets_min": 720
},
{
"epoch": 6.529968454258675,
"grad_norm": 0.6244835175660529,
"learning_rate": 5.493622803009602e-07,
"loss": 0.0812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08120977878570557,
"step": 6210,
"valid_targets_mean": 2157.4,
"valid_targets_min": 621
},
{
"epoch": 6.535226077812829,
"grad_norm": 0.6068652413994866,
"learning_rate": 5.372230490883246e-07,
"loss": 0.0783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10791747272014618,
"step": 6215,
"valid_targets_mean": 2231.4,
"valid_targets_min": 641
},
{
"epoch": 6.540483701366982,
"grad_norm": 0.6518432249319286,
"learning_rate": 5.252176146587484e-07,
"loss": 0.0868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08978095650672913,
"step": 6220,
"valid_targets_mean": 1999.6,
"valid_targets_min": 520
},
{
"epoch": 6.545741324921136,
"grad_norm": 0.5322523075185667,
"learning_rate": 5.133460595435447e-07,
"loss": 0.0879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08263758569955826,
"step": 6225,
"valid_targets_mean": 2624.8,
"valid_targets_min": 951
},
{
"epoch": 6.550998948475289,
"grad_norm": 0.5491804314149535,
"learning_rate": 5.016084653536756e-07,
"loss": 0.0864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07608095556497574,
"step": 6230,
"valid_targets_mean": 2382.8,
"valid_targets_min": 635
},
{
"epoch": 6.556256572029443,
"grad_norm": 0.6191162630290431,
"learning_rate": 4.900049127791851e-07,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0798032358288765,
"step": 6235,
"valid_targets_mean": 1820.6,
"valid_targets_min": 580
},
{
"epoch": 6.561514195583596,
"grad_norm": 0.41142023652597154,
"learning_rate": 4.785354815886445e-07,
"loss": 0.082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07865408062934875,
"step": 6240,
"valid_targets_mean": 3497.9,
"valid_targets_min": 1058
},
{
"epoch": 6.56677181913775,
"grad_norm": 0.4620355977287411,
"learning_rate": 4.6720025062862106e-07,
"loss": 0.0859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06432715803384781,
"step": 6245,
"valid_targets_mean": 2800.7,
"valid_targets_min": 535
},
{
"epoch": 6.572029442691903,
"grad_norm": 0.6379109945418963,
"learning_rate": 4.559992978231087e-07,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08400370180606842,
"step": 6250,
"valid_targets_mean": 1952.3,
"valid_targets_min": 664
},
{
"epoch": 6.577287066246057,
"grad_norm": 0.6716197205135126,
"learning_rate": 4.4493270017301305e-07,
"loss": 0.0792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08722291886806488,
"step": 6255,
"valid_targets_mean": 1848.4,
"valid_targets_min": 542
},
{
"epoch": 6.58254468980021,
"grad_norm": 0.45964959162742225,
"learning_rate": 4.340005337556186e-07,
"loss": 0.0788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06998851895332336,
"step": 6260,
"valid_targets_mean": 2483.1,
"valid_targets_min": 682
},
{
"epoch": 6.587802313354364,
"grad_norm": 0.46996990274006156,
"learning_rate": 4.232028737240623e-07,
"loss": 0.0786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06872901320457458,
"step": 6265,
"valid_targets_mean": 2698.6,
"valid_targets_min": 788
},
{
"epoch": 6.593059936908517,
"grad_norm": 0.5727096460977925,
"learning_rate": 4.125397943068099e-07,
"loss": 0.0857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07843247801065445,
"step": 6270,
"valid_targets_mean": 2486.0,
"valid_targets_min": 611
},
{
"epoch": 6.598317560462671,
"grad_norm": 0.48763409327222446,
"learning_rate": 4.0201136880716027e-07,
"loss": 0.083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07651547342538834,
"step": 6275,
"valid_targets_mean": 2702.9,
"valid_targets_min": 324
},
{
"epoch": 6.603575184016824,
"grad_norm": 0.533280459278677,
"learning_rate": 3.9161766960273517e-07,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07566278427839279,
"step": 6280,
"valid_targets_mean": 2462.0,
"valid_targets_min": 901
},
{
"epoch": 6.608832807570978,
"grad_norm": 0.5432365352962231,
"learning_rate": 3.8135876814497927e-07,
"loss": 0.0805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07376210391521454,
"step": 6285,
"valid_targets_mean": 2129.5,
"valid_targets_min": 697
},
{
"epoch": 6.614090431125131,
"grad_norm": 0.6261963575928159,
"learning_rate": 3.7123473495866314e-07,
"loss": 0.0749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08720436692237854,
"step": 6290,
"valid_targets_mean": 2554.2,
"valid_targets_min": 837
},
{
"epoch": 6.619348054679285,
"grad_norm": 0.5487338252275524,
"learning_rate": 3.61245639641421e-07,
"loss": 0.0832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07632743567228317,
"step": 6295,
"valid_targets_mean": 2285.2,
"valid_targets_min": 709
},
{
"epoch": 6.624605678233438,
"grad_norm": 0.5354842406307797,
"learning_rate": 3.513915508632448e-07,
"loss": 0.0788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06830295920372009,
"step": 6300,
"valid_targets_mean": 2155.7,
"valid_targets_min": 596
},
{
"epoch": 6.629863301787592,
"grad_norm": 0.6865677382003469,
"learning_rate": 3.4167253636602893e-07,
"loss": 0.1042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13126109540462494,
"step": 6305,
"valid_targets_mean": 2041.0,
"valid_targets_min": 801
},
{
"epoch": 6.635120925341745,
"grad_norm": 1.141326469895751,
"learning_rate": 3.3208866296310147e-07,
"loss": 0.0822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.080931656062603,
"step": 6310,
"valid_targets_mean": 1350.2,
"valid_targets_min": 577
},
{
"epoch": 6.6403785488958995,
"grad_norm": 0.5956020995829401,
"learning_rate": 3.2263999653876057e-07,
"loss": 0.0824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08234746754169464,
"step": 6315,
"valid_targets_mean": 1965.1,
"valid_targets_min": 516
},
{
"epoch": 6.645636172450052,
"grad_norm": 0.5571185608973166,
"learning_rate": 3.133266020478254e-07,
"loss": 0.0769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08819910138845444,
"step": 6320,
"valid_targets_mean": 2504.0,
"valid_targets_min": 714
},
{
"epoch": 6.6508937960042065,
"grad_norm": 0.6266443138131848,
"learning_rate": 3.0414854351519476e-07,
"loss": 0.0809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07300835847854614,
"step": 6325,
"valid_targets_mean": 2504.6,
"valid_targets_min": 923
},
{
"epoch": 6.65615141955836,
"grad_norm": 0.5920382865400394,
"learning_rate": 2.951058840353893e-07,
"loss": 0.0818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07816168665885925,
"step": 6330,
"valid_targets_mean": 2009.1,
"valid_targets_min": 611
},
{
"epoch": 6.6614090431125135,
"grad_norm": 0.46086708222512274,
"learning_rate": 2.861986857721388e-07,
"loss": 0.0784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08219857513904572,
"step": 6335,
"valid_targets_mean": 2743.7,
"valid_targets_min": 681
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.6042618093428848,
"learning_rate": 2.7742700995794457e-07,
"loss": 0.08,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08346769213676453,
"step": 6340,
"valid_targets_mean": 1825.4,
"valid_targets_min": 594
},
{
"epoch": 6.6719242902208205,
"grad_norm": 0.5632200603410698,
"learning_rate": 2.687909168936509e-07,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0770227462053299,
"step": 6345,
"valid_targets_mean": 2225.6,
"valid_targets_min": 663
},
{
"epoch": 6.677181913774974,
"grad_norm": 0.44172182563771206,
"learning_rate": 2.6029046594805206e-07,
"loss": 0.0743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06683406233787537,
"step": 6350,
"valid_targets_mean": 3205.3,
"valid_targets_min": 575
},
{
"epoch": 6.682439537329127,
"grad_norm": 0.47937200700051824,
"learning_rate": 2.519257155574617e-07,
"loss": 0.0769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06627700477838516,
"step": 6355,
"valid_targets_mean": 2196.9,
"valid_targets_min": 618
},
{
"epoch": 6.687697160883281,
"grad_norm": 0.5786591175133745,
"learning_rate": 2.436967232253218e-07,
"loss": 0.0775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07670648396015167,
"step": 6360,
"valid_targets_mean": 2454.1,
"valid_targets_min": 773
},
{
"epoch": 6.692954784437434,
"grad_norm": 0.5522841183832378,
"learning_rate": 2.3560354552180976e-07,
"loss": 0.087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1030472069978714,
"step": 6365,
"valid_targets_mean": 2364.6,
"valid_targets_min": 795
},
{
"epoch": 6.698212407991588,
"grad_norm": 0.7246510988177797,
"learning_rate": 2.27646238083441e-07,
"loss": 0.0827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10080615431070328,
"step": 6370,
"valid_targets_mean": 1538.2,
"valid_targets_min": 731
},
{
"epoch": 6.703470031545741,
"grad_norm": 0.5112433586782476,
"learning_rate": 2.1982485561269805e-07,
"loss": 0.0817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08447860926389694,
"step": 6375,
"valid_targets_mean": 2548.8,
"valid_targets_min": 823
},
{
"epoch": 6.708727655099895,
"grad_norm": 0.4752830603680117,
"learning_rate": 2.1213945187763764e-07,
"loss": 0.078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06532780826091766,
"step": 6380,
"valid_targets_mean": 2738.0,
"valid_targets_min": 744
},
{
"epoch": 6.713985278654048,
"grad_norm": 0.5097184369542547,
"learning_rate": 2.0459007971154632e-07,
"loss": 0.0815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08999559283256531,
"step": 6385,
"valid_targets_mean": 2560.6,
"valid_targets_min": 792
},
{
"epoch": 6.719242902208202,
"grad_norm": 0.5141735072926472,
"learning_rate": 1.9717679101254549e-07,
"loss": 0.0866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07460691034793854,
"step": 6390,
"valid_targets_mean": 2553.9,
"valid_targets_min": 661
},
{
"epoch": 6.724500525762355,
"grad_norm": 0.42662656259592047,
"learning_rate": 1.898996367432604e-07,
"loss": 0.0833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06775867938995361,
"step": 6395,
"valid_targets_mean": 3185.2,
"valid_targets_min": 886
},
{
"epoch": 6.729758149316509,
"grad_norm": 0.5815415443046982,
"learning_rate": 1.8275866693046263e-07,
"loss": 0.0793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07805125415325165,
"step": 6400,
"valid_targets_mean": 2401.2,
"valid_targets_min": 667
},
{
"epoch": 6.735015772870662,
"grad_norm": 0.6809583789098095,
"learning_rate": 1.7575393066471714e-07,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09543434530496597,
"step": 6405,
"valid_targets_mean": 2051.9,
"valid_targets_min": 685
},
{
"epoch": 6.740273396424816,
"grad_norm": 0.6074377015682235,
"learning_rate": 1.6888547610005802e-07,
"loss": 0.0789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0802602767944336,
"step": 6410,
"valid_targets_mean": 1878.8,
"valid_targets_min": 593
},
{
"epoch": 6.745531019978969,
"grad_norm": 0.6099932212135954,
"learning_rate": 1.6215335045364656e-07,
"loss": 0.0819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08950551599264145,
"step": 6415,
"valid_targets_mean": 2048.2,
"valid_targets_min": 526
},
{
"epoch": 6.750788643533123,
"grad_norm": 0.5855761199733788,
"learning_rate": 1.5555760000545595e-07,
"loss": 0.0856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08389267325401306,
"step": 6420,
"valid_targets_mean": 1949.8,
"valid_targets_min": 595
},
{
"epoch": 6.756046267087276,
"grad_norm": 0.581674804723855,
"learning_rate": 1.4909827009794486e-07,
"loss": 0.0848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08347044885158539,
"step": 6425,
"valid_targets_mean": 2073.5,
"valid_targets_min": 595
},
{
"epoch": 6.76130389064143,
"grad_norm": 0.5535352821726502,
"learning_rate": 1.4277540513575328e-07,
"loss": 0.0743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06882120668888092,
"step": 6430,
"valid_targets_mean": 2613.6,
"valid_targets_min": 739
},
{
"epoch": 6.766561514195583,
"grad_norm": 0.45591930105334755,
"learning_rate": 1.3658904858538936e-07,
"loss": 0.0812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.074724942445755,
"step": 6435,
"valid_targets_mean": 3086.1,
"valid_targets_min": 1015
},
{
"epoch": 6.771819137749737,
"grad_norm": 0.7477860815286947,
"learning_rate": 1.3053924297493858e-07,
"loss": 0.0853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.106345035135746,
"step": 6440,
"valid_targets_mean": 1640.8,
"valid_targets_min": 817
},
{
"epoch": 6.77707676130389,
"grad_norm": 0.5069610013245355,
"learning_rate": 1.2462602989376404e-07,
"loss": 0.081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07082130014896393,
"step": 6445,
"valid_targets_mean": 2335.3,
"valid_targets_min": 543
},
{
"epoch": 6.782334384858045,
"grad_norm": 0.5347968910010757,
"learning_rate": 1.1884944999222658e-07,
"loss": 0.0897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07372461259365082,
"step": 6450,
"valid_targets_mean": 2553.9,
"valid_targets_min": 619
},
{
"epoch": 6.787592008412197,
"grad_norm": 0.4738534221180958,
"learning_rate": 1.1320954298140063e-07,
"loss": 0.0739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06634832173585892,
"step": 6455,
"valid_targets_mean": 2835.3,
"valid_targets_min": 826
},
{
"epoch": 6.792849631966352,
"grad_norm": 0.41603099555601125,
"learning_rate": 1.0770634763280552e-07,
"loss": 0.0736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0566122904419899,
"step": 6460,
"valid_targets_mean": 2864.8,
"valid_targets_min": 605
},
{
"epoch": 6.798107255520505,
"grad_norm": 0.5303244633135924,
"learning_rate": 1.023399017781368e-07,
"loss": 0.0817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09245777875185013,
"step": 6465,
"valid_targets_mean": 2603.1,
"valid_targets_min": 645
},
{
"epoch": 6.803364879074659,
"grad_norm": 0.4861274680792788,
"learning_rate": 9.711024230900423e-08,
"loss": 0.0787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07168373465538025,
"step": 6470,
"valid_targets_mean": 2689.0,
"valid_targets_min": 570
},
{
"epoch": 6.808622502628812,
"grad_norm": 0.5860357938410719,
"learning_rate": 9.201740517668089e-08,
"loss": 0.0881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09011109173297882,
"step": 6475,
"valid_targets_mean": 2369.3,
"valid_targets_min": 545
},
{
"epoch": 6.813880126182966,
"grad_norm": 0.4372969003909345,
"learning_rate": 8.706142539185447e-08,
"loss": 0.0678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05839034542441368,
"step": 6480,
"valid_targets_mean": 2381.8,
"valid_targets_min": 540
},
{
"epoch": 6.819137749737119,
"grad_norm": 0.5832180780388873,
"learning_rate": 8.224233702438966e-08,
"loss": 0.0803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0864538848400116,
"step": 6485,
"valid_targets_mean": 2176.7,
"valid_targets_min": 852
},
{
"epoch": 6.8243953732912725,
"grad_norm": 0.5660249394018138,
"learning_rate": 7.756017320309283e-08,
"loss": 0.0763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07787185162305832,
"step": 6490,
"valid_targets_mean": 1994.6,
"valid_targets_min": 830
},
{
"epoch": 6.829652996845426,
"grad_norm": 0.514128307764356,
"learning_rate": 7.301496611547665e-08,
"loss": 0.082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07752392441034317,
"step": 6495,
"valid_targets_mean": 2736.7,
"valid_targets_min": 758
},
{
"epoch": 6.8349106203995795,
"grad_norm": 0.6144942092654951,
"learning_rate": 6.86067470075491e-08,
"loss": 0.0815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08299332857131958,
"step": 6500,
"valid_targets_mean": 1566.8,
"valid_targets_min": 589
},
{
"epoch": 6.840168243953733,
"grad_norm": 0.5040161968586385,
"learning_rate": 6.433554618359816e-08,
"loss": 0.0812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06926639378070831,
"step": 6505,
"valid_targets_mean": 2173.9,
"valid_targets_min": 722
},
{
"epoch": 6.8454258675078865,
"grad_norm": 0.6768579508213621,
"learning_rate": 6.020139300597638e-08,
"loss": 0.0945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10462668538093567,
"step": 6510,
"valid_targets_mean": 1910.5,
"valid_targets_min": 646
},
{
"epoch": 6.85068349106204,
"grad_norm": 0.48428870253124023,
"learning_rate": 5.620431589490105e-08,
"loss": 0.0862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06444454193115234,
"step": 6515,
"valid_targets_mean": 2744.2,
"valid_targets_min": 888
},
{
"epoch": 6.8559411146161935,
"grad_norm": 0.6288267093245004,
"learning_rate": 5.234434232826324e-08,
"loss": 0.0849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09103910624980927,
"step": 6520,
"valid_targets_mean": 2009.6,
"valid_targets_min": 323
},
{
"epoch": 6.861198738170347,
"grad_norm": 0.7407904498846085,
"learning_rate": 4.862149884143907e-08,
"loss": 0.0917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0877629965543747,
"step": 6525,
"valid_targets_mean": 1637.1,
"valid_targets_min": 656
},
{
"epoch": 6.8664563617245005,
"grad_norm": 0.6546131880366078,
"learning_rate": 4.503581102709875e-08,
"loss": 0.0793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08757936954498291,
"step": 6530,
"valid_targets_mean": 1721.7,
"valid_targets_min": 593
},
{
"epoch": 6.871713985278654,
"grad_norm": 0.6631749432299133,
"learning_rate": 4.1587303535040035e-08,
"loss": 0.0798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08749720454216003,
"step": 6535,
"valid_targets_mean": 2121.8,
"valid_targets_min": 810
},
{
"epoch": 6.8769716088328074,
"grad_norm": 0.6263469103280397,
"learning_rate": 3.827600007201282e-08,
"loss": 0.0815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08659907430410385,
"step": 6540,
"valid_targets_mean": 2460.6,
"valid_targets_min": 688
},
{
"epoch": 6.882229232386961,
"grad_norm": 0.4964990109626726,
"learning_rate": 3.510192340156149e-08,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06929381191730499,
"step": 6545,
"valid_targets_mean": 2670.8,
"valid_targets_min": 827
},
{
"epoch": 6.887486855941114,
"grad_norm": 0.6388431749211498,
"learning_rate": 3.20650953438606e-08,
"loss": 0.0797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0863485112786293,
"step": 6550,
"valid_targets_mean": 1925.8,
"valid_targets_min": 662
},
{
"epoch": 6.892744479495268,
"grad_norm": 0.6111429694117104,
"learning_rate": 2.9165536775574987e-08,
"loss": 0.0843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08870579302310944,
"step": 6555,
"valid_targets_mean": 2264.5,
"valid_targets_min": 637
},
{
"epoch": 6.898002103049421,
"grad_norm": 0.6876725377629237,
"learning_rate": 2.6403267629706575e-08,
"loss": 0.0798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09392409026622772,
"step": 6560,
"valid_targets_mean": 1824.2,
"valid_targets_min": 515
},
{
"epoch": 6.903259726603575,
"grad_norm": 0.5425245448421149,
"learning_rate": 2.3778306895467785e-08,
"loss": 0.0924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07857099175453186,
"step": 6565,
"valid_targets_mean": 2822.9,
"valid_targets_min": 507
},
{
"epoch": 6.908517350157728,
"grad_norm": 0.5963557164127626,
"learning_rate": 2.1290672618135e-08,
"loss": 0.0805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07683561742305756,
"step": 6570,
"valid_targets_mean": 1971.9,
"valid_targets_min": 809
},
{
"epoch": 6.913774973711882,
"grad_norm": 0.510152007810794,
"learning_rate": 1.8940381898946424e-08,
"loss": 0.0717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06886039674282074,
"step": 6575,
"valid_targets_mean": 2683.1,
"valid_targets_min": 810
},
{
"epoch": 6.919032597266035,
"grad_norm": 0.5956362659114911,
"learning_rate": 1.6727450894959973e-08,
"loss": 0.0818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0822213888168335,
"step": 6580,
"valid_targets_mean": 2070.6,
"valid_targets_min": 604
},
{
"epoch": 6.92429022082019,
"grad_norm": 0.5690839230902637,
"learning_rate": 1.4651894818966671e-08,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08221758157014847,
"step": 6585,
"valid_targets_mean": 2298.4,
"valid_targets_min": 549
},
{
"epoch": 6.929547844374342,
"grad_norm": 0.62480736797892,
"learning_rate": 1.2713727939364096e-08,
"loss": 0.0973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08547095209360123,
"step": 6590,
"valid_targets_mean": 1900.0,
"valid_targets_min": 684
},
{
"epoch": 6.934805467928497,
"grad_norm": 0.7266004835873926,
"learning_rate": 1.091296358007643e-08,
"loss": 0.0834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0911824107170105,
"step": 6595,
"valid_targets_mean": 1658.3,
"valid_targets_min": 665
},
{
"epoch": 6.94006309148265,
"grad_norm": 0.6420014219853515,
"learning_rate": 9.249614120450113e-09,
"loss": 0.0838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08862049132585526,
"step": 6600,
"valid_targets_mean": 1993.0,
"valid_targets_min": 781
},
{
"epoch": 6.945320715036804,
"grad_norm": 0.5605123593848899,
"learning_rate": 7.723690995171673e-09,
"loss": 0.0923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07938556373119354,
"step": 6605,
"valid_targets_mean": 1996.4,
"valid_targets_min": 559
},
{
"epoch": 6.950578338590957,
"grad_norm": 0.6261934252171842,
"learning_rate": 6.335204694196684e-09,
"loss": 0.0805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0783381536602974,
"step": 6610,
"valid_targets_mean": 1721.9,
"valid_targets_min": 723
},
{
"epoch": 6.955835962145111,
"grad_norm": 0.5219456433674271,
"learning_rate": 5.084164762667598e-09,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06869587302207947,
"step": 6615,
"valid_targets_mean": 2252.4,
"valid_targets_min": 790
},
{
"epoch": 6.961093585699264,
"grad_norm": 0.5078327776482854,
"learning_rate": 3.970579800853802e-09,
"loss": 0.0939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10540289431810379,
"step": 6620,
"valid_targets_mean": 2315.0,
"valid_targets_min": 738
},
{
"epoch": 6.966351209253418,
"grad_norm": 0.5599403594131802,
"learning_rate": 2.9944574640894398e-09,
"loss": 0.0807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07712725549936295,
"step": 6625,
"valid_targets_mean": 2107.6,
"valid_targets_min": 700
},
{
"epoch": 6.971608832807571,
"grad_norm": 0.5799823765268213,
"learning_rate": 2.1558044627267847e-09,
"loss": 0.0779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07924142479896545,
"step": 6630,
"valid_targets_mean": 2008.0,
"valid_targets_min": 810
},
{
"epoch": 6.976866456361725,
"grad_norm": 0.5968465080497266,
"learning_rate": 1.4546265620785094e-09,
"loss": 0.1095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12107521295547485,
"step": 6635,
"valid_targets_mean": 2159.6,
"valid_targets_min": 806
},
{
"epoch": 6.982124079915878,
"grad_norm": 0.5415805272676822,
"learning_rate": 8.909285823910374e-10,
"loss": 0.0748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07664281874895096,
"step": 6640,
"valid_targets_mean": 2211.8,
"valid_targets_min": 598
},
{
"epoch": 6.987381703470032,
"grad_norm": 0.7172005397351996,
"learning_rate": 4.647143988067981e-10,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09677685797214508,
"step": 6645,
"valid_targets_mean": 1728.0,
"valid_targets_min": 703
},
{
"epoch": 6.992639327024185,
"grad_norm": 0.6204649705614377,
"learning_rate": 1.7598694132869853e-10,
"loss": 0.0798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08412232249975204,
"step": 6650,
"valid_targets_mean": 1963.6,
"valid_targets_min": 739
},
{
"epoch": 6.997896950578339,
"grad_norm": 0.5175219860773291,
"learning_rate": 2.474819481568247e-11,
"loss": 0.0838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07761639356613159,
"step": 6655,
"valid_targets_mean": 2373.6,
"valid_targets_min": 647
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10391900688409805,
"step": 6657,
"total_flos": 1429562854998016.0,
"train_loss": 0.12602117706011307,
"train_runtime": 32355.6398,
"train_samples_per_second": 3.29,
"train_steps_per_second": 0.206,
"valid_targets_mean": 2165.2,
"valid_targets_min": 936
}
],
"logging_steps": 5,
"max_steps": 6657,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1429562854998016.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}