a1-stack_cpp / trainer_state.json
EtashGuha's picture
Upload folder using huggingface_hub
25153a5 verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4410,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.007936507936507936,
"grad_norm": 13.936445999727159,
"learning_rate": 3.6281179138322e-07,
"loss": 0.5831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5446114540100098,
"step": 5,
"valid_targets_mean": 5181.8,
"valid_targets_min": 1333
},
{
"epoch": 0.015873015873015872,
"grad_norm": 14.14405406674101,
"learning_rate": 8.163265306122449e-07,
"loss": 0.6026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6077768802642822,
"step": 10,
"valid_targets_mean": 5303.6,
"valid_targets_min": 948
},
{
"epoch": 0.023809523809523808,
"grad_norm": 13.385853949153486,
"learning_rate": 1.26984126984127e-06,
"loss": 0.5824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5799890160560608,
"step": 15,
"valid_targets_mean": 5301.1,
"valid_targets_min": 1000
},
{
"epoch": 0.031746031746031744,
"grad_norm": 10.791756912090966,
"learning_rate": 1.723356009070295e-06,
"loss": 0.5901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5597653985023499,
"step": 20,
"valid_targets_mean": 4823.9,
"valid_targets_min": 263
},
{
"epoch": 0.03968253968253968,
"grad_norm": 6.581205621105729,
"learning_rate": 2.17687074829932e-06,
"loss": 0.5323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4685205817222595,
"step": 25,
"valid_targets_mean": 4813.8,
"valid_targets_min": 330
},
{
"epoch": 0.047619047619047616,
"grad_norm": 3.7853786833152236,
"learning_rate": 2.6303854875283447e-06,
"loss": 0.4573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4164578914642334,
"step": 30,
"valid_targets_mean": 5283.2,
"valid_targets_min": 538
},
{
"epoch": 0.05555555555555555,
"grad_norm": 2.602330607184181,
"learning_rate": 3.08390022675737e-06,
"loss": 0.423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39225059747695923,
"step": 35,
"valid_targets_mean": 4700.6,
"valid_targets_min": 2390
},
{
"epoch": 0.06349206349206349,
"grad_norm": 1.4233023861991225,
"learning_rate": 3.537414965986395e-06,
"loss": 0.3809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35967135429382324,
"step": 40,
"valid_targets_mean": 5445.3,
"valid_targets_min": 657
},
{
"epoch": 0.07142857142857142,
"grad_norm": 1.0170115963512993,
"learning_rate": 3.99092970521542e-06,
"loss": 0.402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3903147876262665,
"step": 45,
"valid_targets_mean": 6464.0,
"valid_targets_min": 3085
},
{
"epoch": 0.07936507936507936,
"grad_norm": 0.8370897006461435,
"learning_rate": 4.444444444444444e-06,
"loss": 0.3794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33025485277175903,
"step": 50,
"valid_targets_mean": 5718.5,
"valid_targets_min": 975
},
{
"epoch": 0.0873015873015873,
"grad_norm": 0.7252658896074926,
"learning_rate": 4.897959183673469e-06,
"loss": 0.3611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34258341789245605,
"step": 55,
"valid_targets_mean": 5999.1,
"valid_targets_min": 989
},
{
"epoch": 0.09523809523809523,
"grad_norm": 0.756722250222215,
"learning_rate": 5.3514739229024945e-06,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3988223075866699,
"step": 60,
"valid_targets_mean": 4506.9,
"valid_targets_min": 290
},
{
"epoch": 0.10317460317460317,
"grad_norm": 0.568685223882473,
"learning_rate": 5.80498866213152e-06,
"loss": 0.3448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3268760144710541,
"step": 65,
"valid_targets_mean": 6105.9,
"valid_targets_min": 2717
},
{
"epoch": 0.1111111111111111,
"grad_norm": 0.5731290626935265,
"learning_rate": 6.258503401360545e-06,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3184238374233246,
"step": 70,
"valid_targets_mean": 5088.2,
"valid_targets_min": 420
},
{
"epoch": 0.11904761904761904,
"grad_norm": 0.5739988755146004,
"learning_rate": 6.71201814058957e-06,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34080153703689575,
"step": 75,
"valid_targets_mean": 5674.6,
"valid_targets_min": 1923
},
{
"epoch": 0.12698412698412698,
"grad_norm": 0.5021784940463249,
"learning_rate": 7.165532879818595e-06,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3233030438423157,
"step": 80,
"valid_targets_mean": 5277.2,
"valid_targets_min": 291
},
{
"epoch": 0.1349206349206349,
"grad_norm": 0.5521401363464609,
"learning_rate": 7.61904761904762e-06,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2872031331062317,
"step": 85,
"valid_targets_mean": 5470.0,
"valid_targets_min": 737
},
{
"epoch": 0.14285714285714285,
"grad_norm": 0.4751497127812398,
"learning_rate": 8.072562358276645e-06,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3212955594062805,
"step": 90,
"valid_targets_mean": 6301.1,
"valid_targets_min": 2854
},
{
"epoch": 0.15079365079365079,
"grad_norm": 0.43696107468178264,
"learning_rate": 8.52607709750567e-06,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2621079683303833,
"step": 95,
"valid_targets_mean": 5617.8,
"valid_targets_min": 266
},
{
"epoch": 0.15873015873015872,
"grad_norm": 0.5242468737414164,
"learning_rate": 8.979591836734695e-06,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3428232669830322,
"step": 100,
"valid_targets_mean": 5715.6,
"valid_targets_min": 2266
},
{
"epoch": 0.16666666666666666,
"grad_norm": 0.4723266645052996,
"learning_rate": 9.43310657596372e-06,
"loss": 0.2767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27712035179138184,
"step": 105,
"valid_targets_mean": 5371.8,
"valid_targets_min": 662
},
{
"epoch": 0.1746031746031746,
"grad_norm": 0.49793096409078624,
"learning_rate": 9.886621315192746e-06,
"loss": 0.2986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2675686478614807,
"step": 110,
"valid_targets_mean": 4750.8,
"valid_targets_min": 662
},
{
"epoch": 0.18253968253968253,
"grad_norm": 0.4902776042402625,
"learning_rate": 1.034013605442177e-05,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30433300137519836,
"step": 115,
"valid_targets_mean": 5146.1,
"valid_targets_min": 940
},
{
"epoch": 0.19047619047619047,
"grad_norm": 0.465412157163947,
"learning_rate": 1.0793650793650794e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2920241057872772,
"step": 120,
"valid_targets_mean": 5453.2,
"valid_targets_min": 841
},
{
"epoch": 0.1984126984126984,
"grad_norm": 0.4355039639514751,
"learning_rate": 1.124716553287982e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2529776692390442,
"step": 125,
"valid_targets_mean": 5727.6,
"valid_targets_min": 2696
},
{
"epoch": 0.20634920634920634,
"grad_norm": 0.4996682572655225,
"learning_rate": 1.1700680272108845e-05,
"loss": 0.2826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2821199297904968,
"step": 130,
"valid_targets_mean": 5396.6,
"valid_targets_min": 2020
},
{
"epoch": 0.21428571428571427,
"grad_norm": 0.43094951290178424,
"learning_rate": 1.215419501133787e-05,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24614138901233673,
"step": 135,
"valid_targets_mean": 5842.7,
"valid_targets_min": 286
},
{
"epoch": 0.2222222222222222,
"grad_norm": 0.47723431745558176,
"learning_rate": 1.2607709750566895e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2890702486038208,
"step": 140,
"valid_targets_mean": 5354.1,
"valid_targets_min": 2307
},
{
"epoch": 0.23015873015873015,
"grad_norm": 0.4617350150011481,
"learning_rate": 1.3061224489795918e-05,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2510530948638916,
"step": 145,
"valid_targets_mean": 5552.1,
"valid_targets_min": 608
},
{
"epoch": 0.23809523809523808,
"grad_norm": 0.45824070397194494,
"learning_rate": 1.3514739229024945e-05,
"loss": 0.2652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26986801624298096,
"step": 150,
"valid_targets_mean": 5441.2,
"valid_targets_min": 1175
},
{
"epoch": 0.24603174603174602,
"grad_norm": 0.4392573652714541,
"learning_rate": 1.3968253968253968e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2496776133775711,
"step": 155,
"valid_targets_mean": 5731.4,
"valid_targets_min": 1393
},
{
"epoch": 0.25396825396825395,
"grad_norm": 0.4536964041682826,
"learning_rate": 1.4421768707482994e-05,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21673960983753204,
"step": 160,
"valid_targets_mean": 6079.4,
"valid_targets_min": 300
},
{
"epoch": 0.2619047619047619,
"grad_norm": 0.5619742860376928,
"learning_rate": 1.4875283446712018e-05,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2804248631000519,
"step": 165,
"valid_targets_mean": 5392.2,
"valid_targets_min": 2214
},
{
"epoch": 0.2698412698412698,
"grad_norm": 0.4588222248723898,
"learning_rate": 1.5328798185941044e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24595819413661957,
"step": 170,
"valid_targets_mean": 5367.2,
"valid_targets_min": 1806
},
{
"epoch": 0.2777777777777778,
"grad_norm": 0.4837210875448078,
"learning_rate": 1.578231292517007e-05,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26808232069015503,
"step": 175,
"valid_targets_mean": 4694.2,
"valid_targets_min": 1970
},
{
"epoch": 0.2857142857142857,
"grad_norm": 0.4642135470304616,
"learning_rate": 1.6235827664399097e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25557032227516174,
"step": 180,
"valid_targets_mean": 5724.9,
"valid_targets_min": 1981
},
{
"epoch": 0.29365079365079366,
"grad_norm": 0.4404678599566564,
"learning_rate": 1.668934240362812e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2403090000152588,
"step": 185,
"valid_targets_mean": 5580.2,
"valid_targets_min": 1807
},
{
"epoch": 0.30158730158730157,
"grad_norm": 0.461513428421082,
"learning_rate": 1.7142857142857142e-05,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2342744767665863,
"step": 190,
"valid_targets_mean": 5209.1,
"valid_targets_min": 528
},
{
"epoch": 0.30952380952380953,
"grad_norm": 0.4616028237565255,
"learning_rate": 1.759637188208617e-05,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2381066232919693,
"step": 195,
"valid_targets_mean": 4881.2,
"valid_targets_min": 1007
},
{
"epoch": 0.31746031746031744,
"grad_norm": 0.5048131717477712,
"learning_rate": 1.8049886621315194e-05,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24961230158805847,
"step": 200,
"valid_targets_mean": 4766.8,
"valid_targets_min": 760
},
{
"epoch": 0.3253968253968254,
"grad_norm": 0.4608218526938904,
"learning_rate": 1.8503401360544218e-05,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22085292637348175,
"step": 205,
"valid_targets_mean": 5626.6,
"valid_targets_min": 311
},
{
"epoch": 0.3333333333333333,
"grad_norm": 0.5276409706041367,
"learning_rate": 1.8956916099773243e-05,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2512398362159729,
"step": 210,
"valid_targets_mean": 5207.8,
"valid_targets_min": 901
},
{
"epoch": 0.3412698412698413,
"grad_norm": 0.44125944724862465,
"learning_rate": 1.941043083900227e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23039595782756805,
"step": 215,
"valid_targets_mean": 6150.5,
"valid_targets_min": 2819
},
{
"epoch": 0.3492063492063492,
"grad_norm": 0.8225576873165226,
"learning_rate": 1.9863945578231295e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2745077311992645,
"step": 220,
"valid_targets_mean": 4586.4,
"valid_targets_min": 889
},
{
"epoch": 0.35714285714285715,
"grad_norm": 0.44559302418983976,
"learning_rate": 2.031746031746032e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27263548970222473,
"step": 225,
"valid_targets_mean": 5901.4,
"valid_targets_min": 1813
},
{
"epoch": 0.36507936507936506,
"grad_norm": 0.4702793229346846,
"learning_rate": 2.0770975056689343e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2387492060661316,
"step": 230,
"valid_targets_mean": 5740.0,
"valid_targets_min": 1593
},
{
"epoch": 0.373015873015873,
"grad_norm": 0.5771251589812603,
"learning_rate": 2.122448979591837e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27772706747055054,
"step": 235,
"valid_targets_mean": 5892.1,
"valid_targets_min": 807
},
{
"epoch": 0.38095238095238093,
"grad_norm": 0.4716600277551803,
"learning_rate": 2.1678004535147395e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24430419504642487,
"step": 240,
"valid_targets_mean": 5370.8,
"valid_targets_min": 300
},
{
"epoch": 0.3888888888888889,
"grad_norm": 0.4834321959641482,
"learning_rate": 2.213151927437642e-05,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2554604709148407,
"step": 245,
"valid_targets_mean": 5334.6,
"valid_targets_min": 800
},
{
"epoch": 0.3968253968253968,
"grad_norm": 0.4468651198346908,
"learning_rate": 2.2585034013605444e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22178535163402557,
"step": 250,
"valid_targets_mean": 5966.1,
"valid_targets_min": 1724
},
{
"epoch": 0.40476190476190477,
"grad_norm": 0.4750302614876995,
"learning_rate": 2.3038548752834472e-05,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26613864302635193,
"step": 255,
"valid_targets_mean": 5677.9,
"valid_targets_min": 1011
},
{
"epoch": 0.4126984126984127,
"grad_norm": 0.4468674852795431,
"learning_rate": 2.3492063492063496e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535470724105835,
"step": 260,
"valid_targets_mean": 5571.2,
"valid_targets_min": 3116
},
{
"epoch": 0.42063492063492064,
"grad_norm": 0.4435957536640986,
"learning_rate": 2.394557823129252e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24253222346305847,
"step": 265,
"valid_targets_mean": 5520.6,
"valid_targets_min": 2481
},
{
"epoch": 0.42857142857142855,
"grad_norm": 0.48192905697263166,
"learning_rate": 2.439909297052154e-05,
"loss": 0.2405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22654183208942413,
"step": 270,
"valid_targets_mean": 5040.6,
"valid_targets_min": 1020
},
{
"epoch": 0.4365079365079365,
"grad_norm": 0.4654909902022295,
"learning_rate": 2.4852607709750566e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22321158647537231,
"step": 275,
"valid_targets_mean": 4938.6,
"valid_targets_min": 554
},
{
"epoch": 0.4444444444444444,
"grad_norm": 0.47136311558318184,
"learning_rate": 2.5306122448979597e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25398164987564087,
"step": 280,
"valid_targets_mean": 5719.1,
"valid_targets_min": 1427
},
{
"epoch": 0.4523809523809524,
"grad_norm": 0.5143544056685512,
"learning_rate": 2.5759637188208618e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28001242876052856,
"step": 285,
"valid_targets_mean": 4379.2,
"valid_targets_min": 275
},
{
"epoch": 0.4603174603174603,
"grad_norm": 0.40992433170257936,
"learning_rate": 2.6213151927437642e-05,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19944259524345398,
"step": 290,
"valid_targets_mean": 6113.2,
"valid_targets_min": 1496
},
{
"epoch": 0.46825396825396826,
"grad_norm": 0.7108778765163672,
"learning_rate": 2.6666666666666667e-05,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2676636576652527,
"step": 295,
"valid_targets_mean": 4878.0,
"valid_targets_min": 1397
},
{
"epoch": 0.47619047619047616,
"grad_norm": 0.7424501325702221,
"learning_rate": 2.7120181405895694e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27534204721450806,
"step": 300,
"valid_targets_mean": 4737.1,
"valid_targets_min": 1195
},
{
"epoch": 0.48412698412698413,
"grad_norm": 0.4554032952042926,
"learning_rate": 2.757369614512472e-05,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23061871528625488,
"step": 305,
"valid_targets_mean": 5816.9,
"valid_targets_min": 935
},
{
"epoch": 0.49206349206349204,
"grad_norm": 0.43918142641279273,
"learning_rate": 2.8027210884353743e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2266923487186432,
"step": 310,
"valid_targets_mean": 5512.4,
"valid_targets_min": 674
},
{
"epoch": 0.5,
"grad_norm": 0.46398515425879433,
"learning_rate": 2.8480725623582767e-05,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21582689881324768,
"step": 315,
"valid_targets_mean": 5874.5,
"valid_targets_min": 1816
},
{
"epoch": 0.5079365079365079,
"grad_norm": 0.4043326688329922,
"learning_rate": 2.893424036281179e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21339790523052216,
"step": 320,
"valid_targets_mean": 5820.1,
"valid_targets_min": 282
},
{
"epoch": 0.5158730158730159,
"grad_norm": 0.502316882086023,
"learning_rate": 2.938775510204082e-05,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20219871401786804,
"step": 325,
"valid_targets_mean": 5578.6,
"valid_targets_min": 1540
},
{
"epoch": 0.5238095238095238,
"grad_norm": 0.9835515697061404,
"learning_rate": 2.9841269841269844e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2298191487789154,
"step": 330,
"valid_targets_mean": 4911.0,
"valid_targets_min": 632
},
{
"epoch": 0.5317460317460317,
"grad_norm": 0.4647735663644707,
"learning_rate": 3.0294784580498868e-05,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22781239449977875,
"step": 335,
"valid_targets_mean": 5532.8,
"valid_targets_min": 1535
},
{
"epoch": 0.5396825396825397,
"grad_norm": 0.5438389697935898,
"learning_rate": 3.074829931972789e-05,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22640562057495117,
"step": 340,
"valid_targets_mean": 4285.8,
"valid_targets_min": 727
},
{
"epoch": 0.5476190476190477,
"grad_norm": 0.4334285919558895,
"learning_rate": 3.1201814058956924e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21913409233093262,
"step": 345,
"valid_targets_mean": 5222.7,
"valid_targets_min": 285
},
{
"epoch": 0.5555555555555556,
"grad_norm": 0.4738405937337707,
"learning_rate": 3.1655328798185945e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25035279989242554,
"step": 350,
"valid_targets_mean": 5209.8,
"valid_targets_min": 833
},
{
"epoch": 0.5634920634920635,
"grad_norm": 0.4555272170875938,
"learning_rate": 3.2108843537414965e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21295906603336334,
"step": 355,
"valid_targets_mean": 4887.6,
"valid_targets_min": 845
},
{
"epoch": 0.5714285714285714,
"grad_norm": 0.4607956603180466,
"learning_rate": 3.256235827664399e-05,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23422232270240784,
"step": 360,
"valid_targets_mean": 5982.9,
"valid_targets_min": 3791
},
{
"epoch": 0.5793650793650794,
"grad_norm": 0.46019446827222377,
"learning_rate": 3.3015873015873014e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21903209388256073,
"step": 365,
"valid_targets_mean": 5330.9,
"valid_targets_min": 2257
},
{
"epoch": 0.5873015873015873,
"grad_norm": 0.6042052076393369,
"learning_rate": 3.346938775510204e-05,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2550661861896515,
"step": 370,
"valid_targets_mean": 4556.8,
"valid_targets_min": 763
},
{
"epoch": 0.5952380952380952,
"grad_norm": 0.44853135001478606,
"learning_rate": 3.392290249433107e-05,
"loss": 0.2178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.202229842543602,
"step": 375,
"valid_targets_mean": 5618.4,
"valid_targets_min": 287
},
{
"epoch": 0.6031746031746031,
"grad_norm": 0.4114084841092905,
"learning_rate": 3.437641723356009e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.208021879196167,
"step": 380,
"valid_targets_mean": 6323.6,
"valid_targets_min": 3070
},
{
"epoch": 0.6111111111111112,
"grad_norm": 0.4907016504547875,
"learning_rate": 3.482993197278912e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2262699007987976,
"step": 385,
"valid_targets_mean": 5458.8,
"valid_targets_min": 1233
},
{
"epoch": 0.6190476190476191,
"grad_norm": 0.4470894371245897,
"learning_rate": 3.5283446712018146e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2284412682056427,
"step": 390,
"valid_targets_mean": 5275.5,
"valid_targets_min": 614
},
{
"epoch": 0.626984126984127,
"grad_norm": 0.8292394623205982,
"learning_rate": 3.573696145124717e-05,
"loss": 0.2177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23321247100830078,
"step": 395,
"valid_targets_mean": 4546.7,
"valid_targets_min": 1120
},
{
"epoch": 0.6349206349206349,
"grad_norm": 0.5101519952218712,
"learning_rate": 3.6190476190476195e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22552572190761566,
"step": 400,
"valid_targets_mean": 4713.0,
"valid_targets_min": 403
},
{
"epoch": 0.6428571428571429,
"grad_norm": 0.4782175383328679,
"learning_rate": 3.6643990929705216e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22066287696361542,
"step": 405,
"valid_targets_mean": 5557.4,
"valid_targets_min": 1431
},
{
"epoch": 0.6507936507936508,
"grad_norm": 0.6813010668498629,
"learning_rate": 3.7097505668934243e-05,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23460529744625092,
"step": 410,
"valid_targets_mean": 4301.2,
"valid_targets_min": 290
},
{
"epoch": 0.6587301587301587,
"grad_norm": 0.42762135214795316,
"learning_rate": 3.755102040816327e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22290262579917908,
"step": 415,
"valid_targets_mean": 5696.5,
"valid_targets_min": 1242
},
{
"epoch": 0.6666666666666666,
"grad_norm": 0.7113003892096883,
"learning_rate": 3.800453514739229e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24848781526088715,
"step": 420,
"valid_targets_mean": 5861.1,
"valid_targets_min": 1829
},
{
"epoch": 0.6746031746031746,
"grad_norm": 0.4223786613285171,
"learning_rate": 3.845804988662132e-05,
"loss": 0.2361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23021358251571655,
"step": 425,
"valid_targets_mean": 5603.6,
"valid_targets_min": 2005
},
{
"epoch": 0.6825396825396826,
"grad_norm": 0.46482319003042916,
"learning_rate": 3.891156462585034e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2257668375968933,
"step": 430,
"valid_targets_mean": 5665.9,
"valid_targets_min": 936
},
{
"epoch": 0.6904761904761905,
"grad_norm": 0.49517195170111594,
"learning_rate": 3.936507936507937e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24368128180503845,
"step": 435,
"valid_targets_mean": 5276.9,
"valid_targets_min": 965
},
{
"epoch": 0.6984126984126984,
"grad_norm": 0.4533449896226927,
"learning_rate": 3.9818594104308396e-05,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2182699739933014,
"step": 440,
"valid_targets_mean": 5190.2,
"valid_targets_min": 609
},
{
"epoch": 0.7063492063492064,
"grad_norm": 0.47604972418524916,
"learning_rate": 3.999994361288785e-05,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27464592456817627,
"step": 445,
"valid_targets_mean": 5377.2,
"valid_targets_min": 299
},
{
"epoch": 0.7142857142857143,
"grad_norm": 0.4843309348827549,
"learning_rate": 3.9999599026131644e-05,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21664546430110931,
"step": 450,
"valid_targets_mean": 5402.9,
"valid_targets_min": 1359
},
{
"epoch": 0.7222222222222222,
"grad_norm": 0.4382635205661119,
"learning_rate": 3.999894118418342e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22355255484580994,
"step": 455,
"valid_targets_mean": 5052.1,
"valid_targets_min": 2069
},
{
"epoch": 0.7301587301587301,
"grad_norm": 0.472980100407786,
"learning_rate": 3.999797009734697e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22827665507793427,
"step": 460,
"valid_targets_mean": 5404.2,
"valid_targets_min": 1744
},
{
"epoch": 0.7380952380952381,
"grad_norm": 0.43558241143554155,
"learning_rate": 3.999668578083253e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22950908541679382,
"step": 465,
"valid_targets_mean": 5786.8,
"valid_targets_min": 688
},
{
"epoch": 0.746031746031746,
"grad_norm": 0.39301407866116134,
"learning_rate": 3.9995088254756434e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20144161581993103,
"step": 470,
"valid_targets_mean": 6067.9,
"valid_targets_min": 3477
},
{
"epoch": 0.753968253968254,
"grad_norm": 0.4335866805247727,
"learning_rate": 3.999317754414084e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24468550086021423,
"step": 475,
"valid_targets_mean": 5383.6,
"valid_targets_min": 297
},
{
"epoch": 0.7619047619047619,
"grad_norm": 0.43530076929025974,
"learning_rate": 3.999095367891337e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2087598741054535,
"step": 480,
"valid_targets_mean": 5412.7,
"valid_targets_min": 241
},
{
"epoch": 0.7698412698412699,
"grad_norm": 0.42581385510950404,
"learning_rate": 3.9988416693906563e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20418357849121094,
"step": 485,
"valid_targets_mean": 5400.4,
"valid_targets_min": 618
},
{
"epoch": 0.7777777777777778,
"grad_norm": 0.6201401443531581,
"learning_rate": 3.9985566628857425e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22904717922210693,
"step": 490,
"valid_targets_mean": 5283.9,
"valid_targets_min": 1641
},
{
"epoch": 0.7857142857142857,
"grad_norm": 0.40573600003328514,
"learning_rate": 3.998240352840672e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19750481843948364,
"step": 495,
"valid_targets_mean": 5820.5,
"valid_targets_min": 2527
},
{
"epoch": 0.7936507936507936,
"grad_norm": 0.6282176812699868,
"learning_rate": 3.997892744209833e-05,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21052823960781097,
"step": 500,
"valid_targets_mean": 3286.4,
"valid_targets_min": 284
},
{
"epoch": 0.8015873015873016,
"grad_norm": 0.4150664416041001,
"learning_rate": 3.997513842437845e-05,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20114190876483917,
"step": 505,
"valid_targets_mean": 6746.6,
"valid_targets_min": 3503
},
{
"epoch": 0.8095238095238095,
"grad_norm": 0.5580131451084269,
"learning_rate": 3.997103653459475e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21351292729377747,
"step": 510,
"valid_targets_mean": 5427.2,
"valid_targets_min": 1310
},
{
"epoch": 0.8174603174603174,
"grad_norm": 0.4539249289508295,
"learning_rate": 3.996662183699541e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22894957661628723,
"step": 515,
"valid_targets_mean": 6587.3,
"valid_targets_min": 2987
},
{
"epoch": 0.8253968253968254,
"grad_norm": 0.4606135797915741,
"learning_rate": 3.996189440072818e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23994050920009613,
"step": 520,
"valid_targets_mean": 5603.4,
"valid_targets_min": 963
},
{
"epoch": 0.8333333333333334,
"grad_norm": 0.46485471964434133,
"learning_rate": 3.9956854299839246e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24385607242584229,
"step": 525,
"valid_targets_mean": 5554.9,
"valid_targets_min": 1998
},
{
"epoch": 0.8412698412698413,
"grad_norm": 0.5070540327503203,
"learning_rate": 3.9951501613272076e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2311379760503769,
"step": 530,
"valid_targets_mean": 5792.5,
"valid_targets_min": 2950
},
{
"epoch": 0.8492063492063492,
"grad_norm": 0.4509301237412979,
"learning_rate": 3.994583642486618e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22014960646629333,
"step": 535,
"valid_targets_mean": 5551.4,
"valid_targets_min": 2454
},
{
"epoch": 0.8571428571428571,
"grad_norm": 0.37450581843880576,
"learning_rate": 3.993985882335584e-05,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17562690377235413,
"step": 540,
"valid_targets_mean": 6399.9,
"valid_targets_min": 865
},
{
"epoch": 0.8650793650793651,
"grad_norm": 0.4181520509392521,
"learning_rate": 3.993356890236866e-05,
"loss": 0.2178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1997915804386139,
"step": 545,
"valid_targets_mean": 5282.3,
"valid_targets_min": 307
},
{
"epoch": 0.873015873015873,
"grad_norm": 0.40651126602493426,
"learning_rate": 3.992696676042414e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20215590298175812,
"step": 550,
"valid_targets_mean": 6478.2,
"valid_targets_min": 1253
},
{
"epoch": 0.8809523809523809,
"grad_norm": 0.42510576646915893,
"learning_rate": 3.992005250093211e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20907750725746155,
"step": 555,
"valid_targets_mean": 5629.7,
"valid_targets_min": 1539
},
{
"epoch": 0.8888888888888888,
"grad_norm": 0.4812454511222598,
"learning_rate": 3.991282623219113e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22547686100006104,
"step": 560,
"valid_targets_mean": 4727.8,
"valid_targets_min": 1324
},
{
"epoch": 0.8968253968253969,
"grad_norm": 0.4203217407948123,
"learning_rate": 3.9905288067386776e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21304470300674438,
"step": 565,
"valid_targets_mean": 5743.1,
"valid_targets_min": 2659
},
{
"epoch": 0.9047619047619048,
"grad_norm": 0.5536262458911827,
"learning_rate": 3.989743812458987e-05,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22015127539634705,
"step": 570,
"valid_targets_mean": 5742.7,
"valid_targets_min": 501
},
{
"epoch": 0.9126984126984127,
"grad_norm": 0.44923723778131375,
"learning_rate": 3.9889276526754664e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2490832507610321,
"step": 575,
"valid_targets_mean": 5566.1,
"valid_targets_min": 906
},
{
"epoch": 0.9206349206349206,
"grad_norm": 0.4833832932237736,
"learning_rate": 3.988080340171685e-05,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2266359031200409,
"step": 580,
"valid_targets_mean": 4794.4,
"valid_targets_min": 510
},
{
"epoch": 0.9285714285714286,
"grad_norm": 0.5314150951022422,
"learning_rate": 3.987201888219161e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23443414270877838,
"step": 585,
"valid_targets_mean": 3981.2,
"valid_targets_min": 577
},
{
"epoch": 0.9365079365079365,
"grad_norm": 0.44573566583926183,
"learning_rate": 3.986292310577153e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1997448205947876,
"step": 590,
"valid_targets_mean": 5087.9,
"valid_targets_min": 256
},
{
"epoch": 0.9444444444444444,
"grad_norm": 0.4823118351901083,
"learning_rate": 3.9853516214924416e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21190452575683594,
"step": 595,
"valid_targets_mean": 4769.4,
"valid_targets_min": 1789
},
{
"epoch": 0.9523809523809523,
"grad_norm": 0.9701252803781317,
"learning_rate": 3.9843798356991096e-05,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21730470657348633,
"step": 600,
"valid_targets_mean": 5590.2,
"valid_targets_min": 871
},
{
"epoch": 0.9603174603174603,
"grad_norm": 0.8528374645310175,
"learning_rate": 3.9833769684183104e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25169217586517334,
"step": 605,
"valid_targets_mean": 5481.6,
"valid_targets_min": 648
},
{
"epoch": 0.9682539682539683,
"grad_norm": 0.5719512687258413,
"learning_rate": 3.982343035358026e-05,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25562554597854614,
"step": 610,
"valid_targets_mean": 4258.5,
"valid_targets_min": 852
},
{
"epoch": 0.9761904761904762,
"grad_norm": 0.42417870906303506,
"learning_rate": 3.981278052712827e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19715425372123718,
"step": 615,
"valid_targets_mean": 6383.4,
"valid_targets_min": 2557
},
{
"epoch": 0.9841269841269841,
"grad_norm": 0.5592731470756656,
"learning_rate": 3.9801820371636157e-05,
"loss": 0.2205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21826912462711334,
"step": 620,
"valid_targets_mean": 5242.9,
"valid_targets_min": 540
},
{
"epoch": 0.9920634920634921,
"grad_norm": 0.45536035098972394,
"learning_rate": 3.979055005877364e-05,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23044517636299133,
"step": 625,
"valid_targets_mean": 6434.3,
"valid_targets_min": 1909
},
{
"epoch": 1.0,
"grad_norm": 0.45688834618759994,
"learning_rate": 3.977896976506845e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20650140941143036,
"step": 630,
"valid_targets_mean": 4983.3,
"valid_targets_min": 920
},
{
"epoch": 1.007936507936508,
"grad_norm": 0.45783302985716545,
"learning_rate": 3.976707967190358e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1878741830587387,
"step": 635,
"valid_targets_mean": 6036.8,
"valid_targets_min": 1419
},
{
"epoch": 1.0158730158730158,
"grad_norm": 0.3696615133926402,
"learning_rate": 3.9754879965514456e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17767128348350525,
"step": 640,
"valid_targets_mean": 6949.4,
"valid_targets_min": 1382
},
{
"epoch": 1.0238095238095237,
"grad_norm": 0.5301335563601449,
"learning_rate": 3.9742370836985956e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18509696424007416,
"step": 645,
"valid_targets_mean": 5665.9,
"valid_targets_min": 3373
},
{
"epoch": 1.0317460317460316,
"grad_norm": 0.45339150425457114,
"learning_rate": 3.972955248224949e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19851231575012207,
"step": 650,
"valid_targets_mean": 5496.2,
"valid_targets_min": 1700
},
{
"epoch": 1.0396825396825398,
"grad_norm": 0.4563819518280238,
"learning_rate": 3.971642510207989e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20360763370990753,
"step": 655,
"valid_targets_mean": 5350.4,
"valid_targets_min": 333
},
{
"epoch": 1.0476190476190477,
"grad_norm": 0.5625847542647227,
"learning_rate": 3.9702988902092274e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1898064911365509,
"step": 660,
"valid_targets_mean": 5748.2,
"valid_targets_min": 1540
},
{
"epoch": 1.0555555555555556,
"grad_norm": 0.425299703122137,
"learning_rate": 3.968924409273884e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19356761872768402,
"step": 665,
"valid_targets_mean": 5209.3,
"valid_targets_min": 1985
},
{
"epoch": 1.0634920634920635,
"grad_norm": 0.47286769247229504,
"learning_rate": 3.9675190889305545e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1817602813243866,
"step": 670,
"valid_targets_mean": 5672.6,
"valid_targets_min": 959
},
{
"epoch": 1.0714285714285714,
"grad_norm": 0.432773210737844,
"learning_rate": 3.966082951190874e-05,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2104063630104065,
"step": 675,
"valid_targets_mean": 6248.0,
"valid_targets_min": 1230
},
{
"epoch": 1.0793650793650793,
"grad_norm": 0.4706439453673335,
"learning_rate": 3.9646160185491756e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18827101588249207,
"step": 680,
"valid_targets_mean": 4876.6,
"valid_targets_min": 1043
},
{
"epoch": 1.0873015873015872,
"grad_norm": 0.5338851223858002,
"learning_rate": 3.963118313982131e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18436592817306519,
"step": 685,
"valid_targets_mean": 4361.0,
"valid_targets_min": 1130
},
{
"epoch": 1.0952380952380953,
"grad_norm": 0.41520798715060503,
"learning_rate": 3.961589860948399e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21202310919761658,
"step": 690,
"valid_targets_mean": 5486.4,
"valid_targets_min": 1888
},
{
"epoch": 1.1031746031746033,
"grad_norm": 0.42676794941537016,
"learning_rate": 3.960030683388251e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17921066284179688,
"step": 695,
"valid_targets_mean": 5590.2,
"valid_targets_min": 217
},
{
"epoch": 1.1111111111111112,
"grad_norm": 0.40164984647020757,
"learning_rate": 3.9584408057232e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17369890213012695,
"step": 700,
"valid_targets_mean": 5022.5,
"valid_targets_min": 268
},
{
"epoch": 1.119047619047619,
"grad_norm": 0.4557865055131249,
"learning_rate": 3.956820252855618e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21178218722343445,
"step": 705,
"valid_targets_mean": 5212.6,
"valid_targets_min": 1650
},
{
"epoch": 1.126984126984127,
"grad_norm": 0.4737440529809228,
"learning_rate": 3.955169050168343e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18235670030117035,
"step": 710,
"valid_targets_mean": 4897.6,
"valid_targets_min": 1233
},
{
"epoch": 1.1349206349206349,
"grad_norm": 0.36301667189206566,
"learning_rate": 3.953487223524283e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15816360712051392,
"step": 715,
"valid_targets_mean": 6158.5,
"valid_targets_min": 2000
},
{
"epoch": 1.1428571428571428,
"grad_norm": 0.4512962324237001,
"learning_rate": 3.951774799266014e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1824280321598053,
"step": 720,
"valid_targets_mean": 5561.8,
"valid_targets_min": 2560
},
{
"epoch": 1.1507936507936507,
"grad_norm": 0.4511979075727613,
"learning_rate": 3.950031804215364e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2006044089794159,
"step": 725,
"valid_targets_mean": 5573.5,
"valid_targets_min": 1633
},
{
"epoch": 1.1587301587301586,
"grad_norm": 0.42676374430180725,
"learning_rate": 3.948258265672991e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21262499690055847,
"step": 730,
"valid_targets_mean": 5894.2,
"valid_targets_min": 513
},
{
"epoch": 1.1666666666666667,
"grad_norm": 0.669542399200941,
"learning_rate": 3.946454211417961e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20334014296531677,
"step": 735,
"valid_targets_mean": 5074.4,
"valid_targets_min": 690
},
{
"epoch": 1.1746031746031746,
"grad_norm": 0.45162646285557456,
"learning_rate": 3.944619669707309e-05,
"loss": 0.2193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.215205579996109,
"step": 740,
"valid_targets_mean": 5439.4,
"valid_targets_min": 1907
},
{
"epoch": 1.1825396825396826,
"grad_norm": 0.4710256071640483,
"learning_rate": 3.9427546692755946e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21397551894187927,
"step": 745,
"valid_targets_mean": 5276.3,
"valid_targets_min": 1098
},
{
"epoch": 1.1904761904761905,
"grad_norm": 0.4625751950531012,
"learning_rate": 3.9408592393344596e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19521868228912354,
"step": 750,
"valid_targets_mean": 5905.4,
"valid_targets_min": 2861
},
{
"epoch": 1.1984126984126984,
"grad_norm": 0.4677554812825755,
"learning_rate": 3.9389334095721606e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21653307974338531,
"step": 755,
"valid_targets_mean": 4797.6,
"valid_targets_min": 895
},
{
"epoch": 1.2063492063492063,
"grad_norm": 0.546242046347798,
"learning_rate": 3.936977210153113e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20400574803352356,
"step": 760,
"valid_targets_mean": 5519.1,
"valid_targets_min": 896
},
{
"epoch": 1.2142857142857142,
"grad_norm": 0.4204392123363325,
"learning_rate": 3.93499067171741e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22943107783794403,
"step": 765,
"valid_targets_mean": 6420.3,
"valid_targets_min": 1329
},
{
"epoch": 1.2222222222222223,
"grad_norm": 0.4682155865822684,
"learning_rate": 3.932973825380351e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22972063720226288,
"step": 770,
"valid_targets_mean": 4946.4,
"valid_targets_min": 933
},
{
"epoch": 1.2301587301587302,
"grad_norm": 0.5301139897940557,
"learning_rate": 3.9309267027319485e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23306161165237427,
"step": 775,
"valid_targets_mean": 3961.6,
"valid_targets_min": 222
},
{
"epoch": 1.2380952380952381,
"grad_norm": 0.40365821128282314,
"learning_rate": 3.928849335836435e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18574738502502441,
"step": 780,
"valid_targets_mean": 5806.0,
"valid_targets_min": 2320
},
{
"epoch": 1.246031746031746,
"grad_norm": 0.47813886067964756,
"learning_rate": 3.926741757231761e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21044926345348358,
"step": 785,
"valid_targets_mean": 5299.6,
"valid_targets_min": 1723
},
{
"epoch": 1.253968253968254,
"grad_norm": 0.40253903041192324,
"learning_rate": 3.924603999929086e-05,
"loss": 0.2169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2096974402666092,
"step": 790,
"valid_targets_mean": 5558.8,
"valid_targets_min": 543
},
{
"epoch": 1.2619047619047619,
"grad_norm": 0.4549298029596003,
"learning_rate": 3.9224360974122584e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23242492973804474,
"step": 795,
"valid_targets_mean": 5270.6,
"valid_targets_min": 2212
},
{
"epoch": 1.2698412698412698,
"grad_norm": 0.4695471820608219,
"learning_rate": 3.920238083637297e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20831601321697235,
"step": 800,
"valid_targets_mean": 5308.8,
"valid_targets_min": 883
},
{
"epoch": 1.2777777777777777,
"grad_norm": 0.7642610362979803,
"learning_rate": 3.9180099930318524e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1991654336452484,
"step": 805,
"valid_targets_mean": 6815.1,
"valid_targets_min": 1462
},
{
"epoch": 1.2857142857142856,
"grad_norm": 0.4440164128697404,
"learning_rate": 3.915751860494672e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16493773460388184,
"step": 810,
"valid_targets_mean": 5028.6,
"valid_targets_min": 397
},
{
"epoch": 1.2936507936507937,
"grad_norm": 0.43322694583144405,
"learning_rate": 3.913463721395051e-05,
"loss": 0.2092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1892578899860382,
"step": 815,
"valid_targets_mean": 4793.7,
"valid_targets_min": 343
},
{
"epoch": 1.3015873015873016,
"grad_norm": 0.4113857371999088,
"learning_rate": 3.911145611572282e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22850877046585083,
"step": 820,
"valid_targets_mean": 6205.9,
"valid_targets_min": 3119
},
{
"epoch": 1.3095238095238095,
"grad_norm": 0.4024454753442706,
"learning_rate": 3.908797567335089e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1995319277048111,
"step": 825,
"valid_targets_mean": 6545.4,
"valid_targets_min": 2059
},
{
"epoch": 1.3174603174603174,
"grad_norm": 0.4766793634475361,
"learning_rate": 3.906419625461062e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21162061393260956,
"step": 830,
"valid_targets_mean": 5270.3,
"valid_targets_min": 294
},
{
"epoch": 1.3253968253968254,
"grad_norm": 0.43124302476576,
"learning_rate": 3.90401182319608e-05,
"loss": 0.2112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2024182230234146,
"step": 835,
"valid_targets_mean": 5587.5,
"valid_targets_min": 946
},
{
"epoch": 1.3333333333333333,
"grad_norm": 0.37620838473431895,
"learning_rate": 3.9015741982537265e-05,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16263701021671295,
"step": 840,
"valid_targets_mean": 6486.5,
"valid_targets_min": 777
},
{
"epoch": 1.3412698412698414,
"grad_norm": 0.4227366879146679,
"learning_rate": 3.899106788814701e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19696393609046936,
"step": 845,
"valid_targets_mean": 5981.3,
"valid_targets_min": 1252
},
{
"epoch": 1.3492063492063493,
"grad_norm": 0.4396285787879683,
"learning_rate": 3.896609633526219e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21186983585357666,
"step": 850,
"valid_targets_mean": 5076.4,
"valid_targets_min": 525
},
{
"epoch": 1.3571428571428572,
"grad_norm": 0.4809038294139755,
"learning_rate": 3.894082771501407e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.191837877035141,
"step": 855,
"valid_targets_mean": 5344.6,
"valid_targets_min": 3615
},
{
"epoch": 1.3650793650793651,
"grad_norm": 0.48473797503352833,
"learning_rate": 3.891526242318692e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16904303431510925,
"step": 860,
"valid_targets_mean": 4677.6,
"valid_targets_min": 281
},
{
"epoch": 1.373015873015873,
"grad_norm": 0.3848141194705589,
"learning_rate": 3.8889400860211785e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19609695672988892,
"step": 865,
"valid_targets_mean": 5797.4,
"valid_targets_min": 577
},
{
"epoch": 1.380952380952381,
"grad_norm": 0.43935568195512203,
"learning_rate": 3.886324343116023e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21925979852676392,
"step": 870,
"valid_targets_mean": 5510.4,
"valid_targets_min": 2795
},
{
"epoch": 1.3888888888888888,
"grad_norm": 0.3787284592232413,
"learning_rate": 3.883679054573799e-05,
"loss": 0.1925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17324265837669373,
"step": 875,
"valid_targets_mean": 6371.8,
"valid_targets_min": 1851
},
{
"epoch": 1.3968253968253967,
"grad_norm": 0.48231311291457907,
"learning_rate": 3.881004261827856e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22266656160354614,
"step": 880,
"valid_targets_mean": 5407.8,
"valid_targets_min": 247
},
{
"epoch": 1.4047619047619047,
"grad_norm": 0.39562200883867676,
"learning_rate": 3.878300006773669e-05,
"loss": 0.1996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19309642910957336,
"step": 885,
"valid_targets_mean": 6324.1,
"valid_targets_min": 3843
},
{
"epoch": 1.4126984126984126,
"grad_norm": 0.4536286972970636,
"learning_rate": 3.875566331768184e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.205659881234169,
"step": 890,
"valid_targets_mean": 4451.7,
"valid_targets_min": 766
},
{
"epoch": 1.4206349206349207,
"grad_norm": 0.40917484623660716,
"learning_rate": 3.872803279629155e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21330603957176208,
"step": 895,
"valid_targets_mean": 5915.2,
"valid_targets_min": 2792
},
{
"epoch": 1.4285714285714286,
"grad_norm": 0.44208512274029477,
"learning_rate": 3.8700108936344705e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21972954273223877,
"step": 900,
"valid_targets_mean": 4555.5,
"valid_targets_min": 299
},
{
"epoch": 1.4365079365079365,
"grad_norm": 0.44093255819884136,
"learning_rate": 3.867189217521477e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20141087472438812,
"step": 905,
"valid_targets_mean": 5635.6,
"valid_targets_min": 2966
},
{
"epoch": 1.4444444444444444,
"grad_norm": 0.4623153556330511,
"learning_rate": 3.864338295486297e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21589690446853638,
"step": 910,
"valid_targets_mean": 4678.0,
"valid_targets_min": 514
},
{
"epoch": 1.4523809523809523,
"grad_norm": 0.41249982388927653,
"learning_rate": 3.8614581721831316e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2026449292898178,
"step": 915,
"valid_targets_mean": 5216.7,
"valid_targets_min": 591
},
{
"epoch": 1.4603174603174602,
"grad_norm": 0.4104480770890901,
"learning_rate": 3.858548892723563e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1731051206588745,
"step": 920,
"valid_targets_mean": 5339.4,
"valid_targets_min": 736
},
{
"epoch": 1.4682539682539684,
"grad_norm": 0.41895380180198477,
"learning_rate": 3.855610502675851e-05,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2031707614660263,
"step": 925,
"valid_targets_mean": 5263.9,
"valid_targets_min": 1601
},
{
"epoch": 1.4761904761904763,
"grad_norm": 0.4261994122248901,
"learning_rate": 3.852643048064215e-05,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2084016501903534,
"step": 930,
"valid_targets_mean": 5398.7,
"valid_targets_min": 366
},
{
"epoch": 1.4841269841269842,
"grad_norm": 0.44461914330875957,
"learning_rate": 3.8496465753681145e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.203968346118927,
"step": 935,
"valid_targets_mean": 5705.4,
"valid_targets_min": 293
},
{
"epoch": 1.492063492063492,
"grad_norm": 0.3619697764513735,
"learning_rate": 3.846621131521522e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16397273540496826,
"step": 940,
"valid_targets_mean": 5586.3,
"valid_targets_min": 603
},
{
"epoch": 1.5,
"grad_norm": 0.47927964908668164,
"learning_rate": 3.843566763912187e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19876304268836975,
"step": 945,
"valid_targets_mean": 5481.6,
"valid_targets_min": 2470
},
{
"epoch": 1.507936507936508,
"grad_norm": 0.43177345256816557,
"learning_rate": 3.840483520380896e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19520597159862518,
"step": 950,
"valid_targets_mean": 5171.9,
"valid_targets_min": 578
},
{
"epoch": 1.5158730158730158,
"grad_norm": 0.45814725913527155,
"learning_rate": 3.837371449220717e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.191867396235466,
"step": 955,
"valid_targets_mean": 6292.2,
"valid_targets_min": 3359
},
{
"epoch": 1.5238095238095237,
"grad_norm": 0.3660046705130465,
"learning_rate": 3.834230599176251e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16699504852294922,
"step": 960,
"valid_targets_mean": 6213.4,
"valid_targets_min": 2488
},
{
"epoch": 1.5317460317460316,
"grad_norm": 0.3890844674038831,
"learning_rate": 3.831061019442864e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20834946632385254,
"step": 965,
"valid_targets_mean": 5682.8,
"valid_targets_min": 855
},
{
"epoch": 1.5396825396825395,
"grad_norm": 0.442290989827857,
"learning_rate": 3.827862759665916e-05,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2266271859407425,
"step": 970,
"valid_targets_mean": 5248.5,
"valid_targets_min": 1995
},
{
"epoch": 1.5476190476190477,
"grad_norm": 0.4156925522612072,
"learning_rate": 3.8246358699399853e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16675469279289246,
"step": 975,
"valid_targets_mean": 4952.9,
"valid_targets_min": 277
},
{
"epoch": 1.5555555555555556,
"grad_norm": 0.37604931667074504,
"learning_rate": 3.8213804008080824e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18879935145378113,
"step": 980,
"valid_targets_mean": 6674.0,
"valid_targets_min": 3077
},
{
"epoch": 1.5634920634920635,
"grad_norm": 0.4287194995251398,
"learning_rate": 3.818096403260862e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20438791811466217,
"step": 985,
"valid_targets_mean": 5784.4,
"valid_targets_min": 1565
},
{
"epoch": 1.5714285714285714,
"grad_norm": 0.44022259559851695,
"learning_rate": 3.8147839287358185e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21569909155368805,
"step": 990,
"valid_targets_mean": 5262.6,
"valid_targets_min": 1953
},
{
"epoch": 1.5793650793650795,
"grad_norm": 0.466156003317299,
"learning_rate": 3.8114430291164836e-05,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1877652108669281,
"step": 995,
"valid_targets_mean": 4195.9,
"valid_targets_min": 361
},
{
"epoch": 1.5873015873015874,
"grad_norm": 0.38334955845745405,
"learning_rate": 3.808073756731615e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1762232482433319,
"step": 1000,
"valid_targets_mean": 5545.6,
"valid_targets_min": 949
},
{
"epoch": 1.5952380952380953,
"grad_norm": 0.5439994931547266,
"learning_rate": 3.8046761643543734e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1913871467113495,
"step": 1005,
"valid_targets_mean": 4491.5,
"valid_targets_min": 369
},
{
"epoch": 1.6031746031746033,
"grad_norm": 0.40075365186274436,
"learning_rate": 3.8012503052014996e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1946803331375122,
"step": 1010,
"valid_targets_mean": 5425.6,
"valid_targets_min": 764
},
{
"epoch": 1.6111111111111112,
"grad_norm": 0.3877028365107908,
"learning_rate": 3.797796232932476e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21146497130393982,
"step": 1015,
"valid_targets_mean": 6453.6,
"valid_targets_min": 2839
},
{
"epoch": 1.619047619047619,
"grad_norm": 0.3668527782681026,
"learning_rate": 3.794314001648692e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18072551488876343,
"step": 1020,
"valid_targets_mean": 6010.3,
"valid_targets_min": 2661
},
{
"epoch": 1.626984126984127,
"grad_norm": 0.44781816078627307,
"learning_rate": 3.7908036658925926e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2001311182975769,
"step": 1025,
"valid_targets_mean": 5515.9,
"valid_targets_min": 693
},
{
"epoch": 1.6349206349206349,
"grad_norm": 0.40397196550171016,
"learning_rate": 3.787265280646825e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19972187280654907,
"step": 1030,
"valid_targets_mean": 5461.7,
"valid_targets_min": 289
},
{
"epoch": 1.6428571428571428,
"grad_norm": 0.4356586536795959,
"learning_rate": 3.7836989013333776e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1890064775943756,
"step": 1035,
"valid_targets_mean": 5751.4,
"valid_targets_min": 211
},
{
"epoch": 1.6507936507936507,
"grad_norm": 0.44136645672562447,
"learning_rate": 3.780104583812712e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1881527304649353,
"step": 1040,
"valid_targets_mean": 5342.1,
"valid_targets_min": 827
},
{
"epoch": 1.6587301587301586,
"grad_norm": 0.4490662637016875,
"learning_rate": 3.7764823843828883e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20181840658187866,
"step": 1045,
"valid_targets_mean": 4998.9,
"valid_targets_min": 1099
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.414814689156328,
"learning_rate": 3.7728323597786834e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2113458514213562,
"step": 1050,
"valid_targets_mean": 5317.9,
"valid_targets_min": 912
},
{
"epoch": 1.6746031746031746,
"grad_norm": 0.4002735439554692,
"learning_rate": 3.7691545671707007e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19339720904827118,
"step": 1055,
"valid_targets_mean": 5467.6,
"valid_targets_min": 304
},
{
"epoch": 1.6825396825396826,
"grad_norm": 0.34935950618209505,
"learning_rate": 3.765449064164477e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16387102007865906,
"step": 1060,
"valid_targets_mean": 5961.0,
"valid_targets_min": 1397
},
{
"epoch": 1.6904761904761905,
"grad_norm": 0.4617875758265747,
"learning_rate": 3.7617159087995784e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20451588928699493,
"step": 1065,
"valid_targets_mean": 5329.4,
"valid_targets_min": 1754
},
{
"epoch": 1.6984126984126984,
"grad_norm": 0.43000065083291655,
"learning_rate": 3.757955159548693e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19835901260375977,
"step": 1070,
"valid_targets_mean": 5593.4,
"valid_targets_min": 1554
},
{
"epoch": 1.7063492063492065,
"grad_norm": 0.3606371311330236,
"learning_rate": 3.754166875316713e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18690404295921326,
"step": 1075,
"valid_targets_mean": 6369.9,
"valid_targets_min": 2694
},
{
"epoch": 1.7142857142857144,
"grad_norm": 0.39285827605092777,
"learning_rate": 3.750351115439812e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20067650079727173,
"step": 1080,
"valid_targets_mean": 5648.6,
"valid_targets_min": 650
},
{
"epoch": 1.7222222222222223,
"grad_norm": 0.38570908603943815,
"learning_rate": 3.746507939684519e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19070516526699066,
"step": 1085,
"valid_targets_mean": 6492.1,
"valid_targets_min": 3263
},
{
"epoch": 1.7301587301587302,
"grad_norm": 0.39910170101731635,
"learning_rate": 3.742637408246779e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21158373355865479,
"step": 1090,
"valid_targets_mean": 6281.1,
"valid_targets_min": 1277
},
{
"epoch": 1.7380952380952381,
"grad_norm": 0.49874739628178993,
"learning_rate": 3.73873958175101e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20216044783592224,
"step": 1095,
"valid_targets_mean": 4570.4,
"valid_targets_min": 797
},
{
"epoch": 1.746031746031746,
"grad_norm": 0.47674802821687573,
"learning_rate": 3.734814521249156e-05,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21278969943523407,
"step": 1100,
"valid_targets_mean": 6688.0,
"valid_targets_min": 4913
},
{
"epoch": 1.753968253968254,
"grad_norm": 0.4208345610037382,
"learning_rate": 3.7308622882197294e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20342180132865906,
"step": 1105,
"valid_targets_mean": 4974.2,
"valid_targets_min": 1373
},
{
"epoch": 1.7619047619047619,
"grad_norm": 0.5036978972360446,
"learning_rate": 3.7268829445668456e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19987335801124573,
"step": 1110,
"valid_targets_mean": 4656.1,
"valid_targets_min": 692
},
{
"epoch": 1.7698412698412698,
"grad_norm": 0.4475822251477478,
"learning_rate": 3.722876552619257e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1833523064851761,
"step": 1115,
"valid_targets_mean": 5454.4,
"valid_targets_min": 1320
},
{
"epoch": 1.7777777777777777,
"grad_norm": 0.42301407783978096,
"learning_rate": 3.718843175129378e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1914646029472351,
"step": 1120,
"valid_targets_mean": 6252.5,
"valid_targets_min": 899
},
{
"epoch": 1.7857142857142856,
"grad_norm": 0.3667105929189479,
"learning_rate": 3.7147828752722944e-05,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18096204102039337,
"step": 1125,
"valid_targets_mean": 5728.2,
"valid_targets_min": 1408
},
{
"epoch": 1.7936507936507935,
"grad_norm": 0.3988857634933404,
"learning_rate": 3.7106957166447834e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20091086626052856,
"step": 1130,
"valid_targets_mean": 6323.2,
"valid_targets_min": 2797
},
{
"epoch": 1.8015873015873016,
"grad_norm": 0.4353965199064458,
"learning_rate": 3.7065817632643115e-05,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2031416893005371,
"step": 1135,
"valid_targets_mean": 5034.0,
"valid_targets_min": 1545
},
{
"epoch": 1.8095238095238095,
"grad_norm": 0.3835363845414605,
"learning_rate": 3.7024410795680326e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20650315284729004,
"step": 1140,
"valid_targets_mean": 5709.4,
"valid_targets_min": 2868
},
{
"epoch": 1.8174603174603174,
"grad_norm": 0.6017933902148771,
"learning_rate": 3.698273730411782e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21874158084392548,
"step": 1145,
"valid_targets_mean": 4664.8,
"valid_targets_min": 1051
},
{
"epoch": 1.8253968253968254,
"grad_norm": 0.5010674614611315,
"learning_rate": 3.694079781069053e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22206932306289673,
"step": 1150,
"valid_targets_mean": 5182.3,
"valid_targets_min": 1754
},
{
"epoch": 1.8333333333333335,
"grad_norm": 0.3923636627441356,
"learning_rate": 3.6898592972299875e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17895236611366272,
"step": 1155,
"valid_targets_mean": 5307.1,
"valid_targets_min": 299
},
{
"epoch": 1.8412698412698414,
"grad_norm": 0.46097320064253466,
"learning_rate": 3.6856123450003306e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17629393935203552,
"step": 1160,
"valid_targets_mean": 5396.4,
"valid_targets_min": 1717
},
{
"epoch": 1.8492063492063493,
"grad_norm": 0.4118263198386797,
"learning_rate": 3.68133899090041e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21603277325630188,
"step": 1165,
"valid_targets_mean": 5743.1,
"valid_targets_min": 1944
},
{
"epoch": 1.8571428571428572,
"grad_norm": 0.40887713694857647,
"learning_rate": 3.677039301864085e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21704469621181488,
"step": 1170,
"valid_targets_mean": 5467.9,
"valid_targets_min": 1922
},
{
"epoch": 1.8650793650793651,
"grad_norm": 0.3934682878408651,
"learning_rate": 3.672713345237701e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19257432222366333,
"step": 1175,
"valid_targets_mean": 5539.5,
"valid_targets_min": 574
},
{
"epoch": 1.873015873015873,
"grad_norm": 0.40297241825152724,
"learning_rate": 3.6683611887790356e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22532138228416443,
"step": 1180,
"valid_targets_mean": 5603.6,
"valid_targets_min": 839
},
{
"epoch": 1.880952380952381,
"grad_norm": 0.4525568905524082,
"learning_rate": 3.663982900656236e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21516132354736328,
"step": 1185,
"valid_targets_mean": 4871.1,
"valid_targets_min": 852
},
{
"epoch": 1.8888888888888888,
"grad_norm": 0.3826095420283405,
"learning_rate": 3.6595785494467516e-05,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2126571089029312,
"step": 1190,
"valid_targets_mean": 6149.8,
"valid_targets_min": 322
},
{
"epoch": 1.8968253968253967,
"grad_norm": 0.49491876878445984,
"learning_rate": 3.655148204136259e-05,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1980828046798706,
"step": 1195,
"valid_targets_mean": 4812.1,
"valid_targets_min": 355
},
{
"epoch": 1.9047619047619047,
"grad_norm": 0.3844425255192722,
"learning_rate": 3.650691934117584e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17985425889492035,
"step": 1200,
"valid_targets_mean": 5473.3,
"valid_targets_min": 2775
},
{
"epoch": 1.9126984126984126,
"grad_norm": 0.4025013315745311,
"learning_rate": 3.646209809189611e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2079595923423767,
"step": 1205,
"valid_targets_mean": 5829.4,
"valid_targets_min": 2090
},
{
"epoch": 1.9206349206349205,
"grad_norm": 0.3718395023938511,
"learning_rate": 3.641701899556192e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20109693706035614,
"step": 1210,
"valid_targets_mean": 5616.2,
"valid_targets_min": 447
},
{
"epoch": 1.9285714285714286,
"grad_norm": 0.41192663980117594,
"learning_rate": 3.63716827582505e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19556891918182373,
"step": 1215,
"valid_targets_mean": 5405.4,
"valid_targets_min": 260
},
{
"epoch": 1.9365079365079365,
"grad_norm": 0.4061502796105446,
"learning_rate": 3.632609009006665e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1885574758052826,
"step": 1220,
"valid_targets_mean": 4830.4,
"valid_targets_min": 1806
},
{
"epoch": 1.9444444444444444,
"grad_norm": 0.394449808870156,
"learning_rate": 3.62802417051317e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1800915151834488,
"step": 1225,
"valid_targets_mean": 5700.7,
"valid_targets_min": 403
},
{
"epoch": 1.9523809523809523,
"grad_norm": 0.4440079869221486,
"learning_rate": 3.6234138321572274e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17726945877075195,
"step": 1230,
"valid_targets_mean": 5161.5,
"valid_targets_min": 1498
},
{
"epoch": 1.9603174603174605,
"grad_norm": 0.4620529228104198,
"learning_rate": 3.6187780661509074e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22657737135887146,
"step": 1235,
"valid_targets_mean": 5007.8,
"valid_targets_min": 1843
},
{
"epoch": 1.9682539682539684,
"grad_norm": 0.4536224923690941,
"learning_rate": 3.6141169451045526e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1943274736404419,
"step": 1240,
"valid_targets_mean": 4127.1,
"valid_targets_min": 391
},
{
"epoch": 1.9761904761904763,
"grad_norm": 0.46913089325037155,
"learning_rate": 3.609430542025646e-05,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17612981796264648,
"step": 1245,
"valid_targets_mean": 5872.5,
"valid_targets_min": 1386
},
{
"epoch": 1.9841269841269842,
"grad_norm": 0.40006665679686376,
"learning_rate": 3.604718930317664e-05,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21723848581314087,
"step": 1250,
"valid_targets_mean": 5627.9,
"valid_targets_min": 1877
},
{
"epoch": 1.992063492063492,
"grad_norm": 0.4171450102000576,
"learning_rate": 3.5999821837789275e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17687958478927612,
"step": 1255,
"valid_targets_mean": 4820.7,
"valid_targets_min": 275
},
{
"epoch": 2.0,
"grad_norm": 0.39376114464436146,
"learning_rate": 3.595220376601447e-05,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16747349500656128,
"step": 1260,
"valid_targets_mean": 5956.8,
"valid_targets_min": 510
},
{
"epoch": 2.007936507936508,
"grad_norm": 0.42367770753786105,
"learning_rate": 3.590433583369758e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.164157897233963,
"step": 1265,
"valid_targets_mean": 6732.4,
"valid_targets_min": 3077
},
{
"epoch": 2.015873015873016,
"grad_norm": 0.43491398653549607,
"learning_rate": 3.5856218790597554e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16858386993408203,
"step": 1270,
"valid_targets_mean": 4635.7,
"valid_targets_min": 267
},
{
"epoch": 2.0238095238095237,
"grad_norm": 0.4336346848049278,
"learning_rate": 3.580785339037519e-05,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1782153844833374,
"step": 1275,
"valid_targets_mean": 5509.9,
"valid_targets_min": 2820
},
{
"epoch": 2.0317460317460316,
"grad_norm": 0.4219922314179232,
"learning_rate": 3.57592403905813e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17715319991111755,
"step": 1280,
"valid_targets_mean": 5722.5,
"valid_targets_min": 269
},
{
"epoch": 2.0396825396825395,
"grad_norm": 0.3940209379170676,
"learning_rate": 3.571038055264489e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16919057071208954,
"step": 1285,
"valid_targets_mean": 5806.7,
"valid_targets_min": 2137
},
{
"epoch": 2.0476190476190474,
"grad_norm": 0.9513050625567275,
"learning_rate": 3.566127464186119e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17070958018302917,
"step": 1290,
"valid_targets_mean": 6109.1,
"valid_targets_min": 2815
},
{
"epoch": 2.0555555555555554,
"grad_norm": 0.39178871800874376,
"learning_rate": 3.56119234273797e-05,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15980932116508484,
"step": 1295,
"valid_targets_mean": 6312.2,
"valid_targets_min": 2200
},
{
"epoch": 2.0634920634920633,
"grad_norm": 0.4545939454742837,
"learning_rate": 3.5562327682192134e-05,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17266622185707092,
"step": 1300,
"valid_targets_mean": 5758.9,
"valid_targets_min": 322
},
{
"epoch": 2.0714285714285716,
"grad_norm": 0.40752366743563423,
"learning_rate": 3.5512488183120286e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18903039395809174,
"step": 1305,
"valid_targets_mean": 6031.5,
"valid_targets_min": 552
},
{
"epoch": 2.0793650793650795,
"grad_norm": 0.43154212786267104,
"learning_rate": 3.54624057108039e-05,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1685219407081604,
"step": 1310,
"valid_targets_mean": 4359.1,
"valid_targets_min": 492
},
{
"epoch": 2.0873015873015874,
"grad_norm": 0.41368733303715804,
"learning_rate": 3.5412081049688444e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1651342809200287,
"step": 1315,
"valid_targets_mean": 5127.6,
"valid_targets_min": 1605
},
{
"epoch": 2.0952380952380953,
"grad_norm": 0.38589454302426857,
"learning_rate": 3.5361514988012774e-05,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1480841338634491,
"step": 1320,
"valid_targets_mean": 5874.6,
"valid_targets_min": 1503
},
{
"epoch": 2.1031746031746033,
"grad_norm": 0.43713259076728145,
"learning_rate": 3.5310708317796844e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16304585337638855,
"step": 1325,
"valid_targets_mean": 5606.6,
"valid_targets_min": 2620
},
{
"epoch": 2.111111111111111,
"grad_norm": 0.5149351729670725,
"learning_rate": 3.5259661834829266e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17917974293231964,
"step": 1330,
"valid_targets_mean": 6228.2,
"valid_targets_min": 1503
},
{
"epoch": 2.119047619047619,
"grad_norm": 0.3861389835108437,
"learning_rate": 3.5208376338654866e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16448023915290833,
"step": 1335,
"valid_targets_mean": 6666.1,
"valid_targets_min": 708
},
{
"epoch": 2.126984126984127,
"grad_norm": 0.38207111066871835,
"learning_rate": 3.515685263256214e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17809657752513885,
"step": 1340,
"valid_targets_mean": 6127.4,
"valid_targets_min": 1544
},
{
"epoch": 2.134920634920635,
"grad_norm": 0.4127592358303544,
"learning_rate": 3.51050915235707e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18220895528793335,
"step": 1345,
"valid_targets_mean": 5229.9,
"valid_targets_min": 864
},
{
"epoch": 2.142857142857143,
"grad_norm": 0.42540313592591483,
"learning_rate": 3.5053093822418596e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1991414576768875,
"step": 1350,
"valid_targets_mean": 5462.2,
"valid_targets_min": 2257
},
{
"epoch": 2.1507936507936507,
"grad_norm": 0.39687138441854536,
"learning_rate": 3.500086034354966e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20256337523460388,
"step": 1355,
"valid_targets_mean": 5684.8,
"valid_targets_min": 2415
},
{
"epoch": 2.1587301587301586,
"grad_norm": 0.44932267888477845,
"learning_rate": 3.494839190510071e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17283421754837036,
"step": 1360,
"valid_targets_mean": 4960.4,
"valid_targets_min": 2345
},
{
"epoch": 2.1666666666666665,
"grad_norm": 0.49624084160009224,
"learning_rate": 3.489568932888877e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1903117299079895,
"step": 1365,
"valid_targets_mean": 5084.8,
"valid_targets_min": 301
},
{
"epoch": 2.1746031746031744,
"grad_norm": 0.42424536754472875,
"learning_rate": 3.484275344039815e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1761750876903534,
"step": 1370,
"valid_targets_mean": 4764.8,
"valid_targets_min": 310
},
{
"epoch": 2.1825396825396823,
"grad_norm": 0.3930655272562859,
"learning_rate": 3.478958506876759e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16021452844142914,
"step": 1375,
"valid_targets_mean": 5342.4,
"valid_targets_min": 2886
},
{
"epoch": 2.1904761904761907,
"grad_norm": 0.5253004636054942,
"learning_rate": 3.47361850467772e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1926204413175583,
"step": 1380,
"valid_targets_mean": 5126.9,
"valid_targets_min": 2220
},
{
"epoch": 2.1984126984126986,
"grad_norm": 0.3913488618062026,
"learning_rate": 3.468255421083546e-05,
"loss": 0.1869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2079114466905594,
"step": 1385,
"valid_targets_mean": 6658.1,
"valid_targets_min": 906
},
{
"epoch": 2.2063492063492065,
"grad_norm": 0.4343501732005746,
"learning_rate": 3.46286934009661e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1819835603237152,
"step": 1390,
"valid_targets_mean": 4903.1,
"valid_targets_min": 1946
},
{
"epoch": 2.2142857142857144,
"grad_norm": 0.4642383235525826,
"learning_rate": 3.457460346079495e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1960304081439972,
"step": 1395,
"valid_targets_mean": 4859.3,
"valid_targets_min": 1756
},
{
"epoch": 2.2222222222222223,
"grad_norm": 0.39883822754099246,
"learning_rate": 3.452028523753673e-05,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1751224845647812,
"step": 1400,
"valid_targets_mean": 5698.9,
"valid_targets_min": 1531
},
{
"epoch": 2.2301587301587302,
"grad_norm": 0.37010389401431576,
"learning_rate": 3.446573958198176e-05,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18461816012859344,
"step": 1405,
"valid_targets_mean": 6230.6,
"valid_targets_min": 1700
},
{
"epoch": 2.238095238095238,
"grad_norm": 0.6181478614629903,
"learning_rate": 3.4410967348482666e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14911070466041565,
"step": 1410,
"valid_targets_mean": 4602.1,
"valid_targets_min": 1798
},
{
"epoch": 2.246031746031746,
"grad_norm": 0.43108429750485655,
"learning_rate": 3.435596939494098e-05,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1552506387233734,
"step": 1415,
"valid_targets_mean": 5343.7,
"valid_targets_min": 860
},
{
"epoch": 2.253968253968254,
"grad_norm": 0.3655618940959395,
"learning_rate": 3.430074658279369e-05,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16736620664596558,
"step": 1420,
"valid_targets_mean": 6760.8,
"valid_targets_min": 4142
},
{
"epoch": 2.261904761904762,
"grad_norm": 0.43470898698901705,
"learning_rate": 3.424529977699977e-05,
"loss": 0.1747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18593010306358337,
"step": 1425,
"valid_targets_mean": 5456.4,
"valid_targets_min": 938
},
{
"epoch": 2.2698412698412698,
"grad_norm": 0.4012757385555316,
"learning_rate": 3.418962984602661e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2028789222240448,
"step": 1430,
"valid_targets_mean": 6217.8,
"valid_targets_min": 2538
},
{
"epoch": 2.2777777777777777,
"grad_norm": 0.422277687599635,
"learning_rate": 3.413373766183646e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17681989073753357,
"step": 1435,
"valid_targets_mean": 5242.7,
"valid_targets_min": 1133
},
{
"epoch": 2.2857142857142856,
"grad_norm": 0.4610732403739008,
"learning_rate": 3.40776240998727e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19924741983413696,
"step": 1440,
"valid_targets_mean": 5244.7,
"valid_targets_min": 878
},
{
"epoch": 2.2936507936507935,
"grad_norm": 0.4230850293753159,
"learning_rate": 3.4021290039046184e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18189997971057892,
"step": 1445,
"valid_targets_mean": 5056.2,
"valid_targets_min": 287
},
{
"epoch": 2.3015873015873014,
"grad_norm": 0.4282446015574262,
"learning_rate": 3.396473636172146e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1614503115415573,
"step": 1450,
"valid_targets_mean": 5646.3,
"valid_targets_min": 1748
},
{
"epoch": 2.3095238095238093,
"grad_norm": 0.35393446023512337,
"learning_rate": 3.390796395370294e-05,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1533820927143097,
"step": 1455,
"valid_targets_mean": 6412.6,
"valid_targets_min": 930
},
{
"epoch": 2.317460317460317,
"grad_norm": 0.4006705141341369,
"learning_rate": 3.385097370422102e-05,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17715230584144592,
"step": 1460,
"valid_targets_mean": 5679.0,
"valid_targets_min": 1403
},
{
"epoch": 2.3253968253968256,
"grad_norm": 0.41667317090980344,
"learning_rate": 3.3793766505918185e-05,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18403995037078857,
"step": 1465,
"valid_targets_mean": 5691.4,
"valid_targets_min": 1804
},
{
"epoch": 2.3333333333333335,
"grad_norm": 0.4438049911035154,
"learning_rate": 3.3736343254834994e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16705909371376038,
"step": 1470,
"valid_targets_mean": 5163.1,
"valid_targets_min": 514
},
{
"epoch": 2.3412698412698414,
"grad_norm": 0.41724254225439533,
"learning_rate": 3.3678704850396045e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20384517312049866,
"step": 1475,
"valid_targets_mean": 5862.2,
"valid_targets_min": 328
},
{
"epoch": 2.3492063492063493,
"grad_norm": 0.4965895506653012,
"learning_rate": 3.362085219539592e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19839468598365784,
"step": 1480,
"valid_targets_mean": 5439.9,
"valid_targets_min": 1170
},
{
"epoch": 2.357142857142857,
"grad_norm": 0.38336740154664095,
"learning_rate": 3.3562786195985025e-05,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.190034419298172,
"step": 1485,
"valid_targets_mean": 6053.7,
"valid_targets_min": 3073
},
{
"epoch": 2.365079365079365,
"grad_norm": 0.42799053268182136,
"learning_rate": 3.350450776165535e-05,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17199914157390594,
"step": 1490,
"valid_targets_mean": 5109.0,
"valid_targets_min": 638
},
{
"epoch": 2.373015873015873,
"grad_norm": 0.49042106827448145,
"learning_rate": 3.344601780522634e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18558023869991302,
"step": 1495,
"valid_targets_mean": 4502.5,
"valid_targets_min": 1358
},
{
"epoch": 2.380952380952381,
"grad_norm": 0.452178036330889,
"learning_rate": 3.3387317242830466e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17586269974708557,
"step": 1500,
"valid_targets_mean": 5095.8,
"valid_targets_min": 271
},
{
"epoch": 2.388888888888889,
"grad_norm": 0.4167028985093456,
"learning_rate": 3.332840699389897e-05,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16293631494045258,
"step": 1505,
"valid_targets_mean": 5093.2,
"valid_targets_min": 1199
},
{
"epoch": 2.3968253968253967,
"grad_norm": 0.4134999974854722,
"learning_rate": 3.32692879811474e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16504386067390442,
"step": 1510,
"valid_targets_mean": 4788.2,
"valid_targets_min": 281
},
{
"epoch": 2.4047619047619047,
"grad_norm": 0.38629332618116435,
"learning_rate": 3.320996113056123e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16470927000045776,
"step": 1515,
"valid_targets_mean": 5480.1,
"valid_targets_min": 1382
},
{
"epoch": 2.4126984126984126,
"grad_norm": 0.4517489878934338,
"learning_rate": 3.315042737138128e-05,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19131216406822205,
"step": 1520,
"valid_targets_mean": 5177.0,
"valid_targets_min": 1427
},
{
"epoch": 2.4206349206349205,
"grad_norm": 0.3912437196261749,
"learning_rate": 3.309068763608919e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15866073966026306,
"step": 1525,
"valid_targets_mean": 4809.5,
"valid_targets_min": 304
},
{
"epoch": 2.4285714285714284,
"grad_norm": 0.4287081470079961,
"learning_rate": 3.303074286039285e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18889503180980682,
"step": 1530,
"valid_targets_mean": 5050.8,
"valid_targets_min": 1050
},
{
"epoch": 2.4365079365079367,
"grad_norm": 0.5226823839069293,
"learning_rate": 3.2970593983211694e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17266133427619934,
"step": 1535,
"valid_targets_mean": 5716.3,
"valid_targets_min": 2116
},
{
"epoch": 2.4444444444444446,
"grad_norm": 0.4142977777917709,
"learning_rate": 3.2910241946661993e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17832788825035095,
"step": 1540,
"valid_targets_mean": 5296.9,
"valid_targets_min": 600
},
{
"epoch": 2.4523809523809526,
"grad_norm": 0.4094380830442922,
"learning_rate": 3.2849687696042165e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16501125693321228,
"step": 1545,
"valid_targets_mean": 5243.6,
"valid_targets_min": 337
},
{
"epoch": 2.4603174603174605,
"grad_norm": 0.5264844857969575,
"learning_rate": 3.2788932179817886e-05,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19089126586914062,
"step": 1550,
"valid_targets_mean": 4228.1,
"valid_targets_min": 574
},
{
"epoch": 2.4682539682539684,
"grad_norm": 0.3870078917146876,
"learning_rate": 3.2727976349607276e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16617675125598907,
"step": 1555,
"valid_targets_mean": 5233.7,
"valid_targets_min": 283
},
{
"epoch": 2.4761904761904763,
"grad_norm": 0.37140129207143047,
"learning_rate": 3.266682116016599e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15645205974578857,
"step": 1560,
"valid_targets_mean": 6038.5,
"valid_targets_min": 858
},
{
"epoch": 2.484126984126984,
"grad_norm": 0.3972434967156975,
"learning_rate": 3.260546756937227e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1872669756412506,
"step": 1565,
"valid_targets_mean": 5819.3,
"valid_targets_min": 343
},
{
"epoch": 2.492063492063492,
"grad_norm": 0.41540248633079907,
"learning_rate": 3.254391653821192e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1847609579563141,
"step": 1570,
"valid_targets_mean": 5872.5,
"valid_targets_min": 366
},
{
"epoch": 2.5,
"grad_norm": 0.4326289822516213,
"learning_rate": 3.248216903076328e-05,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20463158190250397,
"step": 1575,
"valid_targets_mean": 5289.8,
"valid_targets_min": 279
},
{
"epoch": 2.507936507936508,
"grad_norm": 0.5002103630542671,
"learning_rate": 3.24202260141821e-05,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19607800245285034,
"step": 1580,
"valid_targets_mean": 4856.6,
"valid_targets_min": 377
},
{
"epoch": 2.515873015873016,
"grad_norm": 0.44088426161151917,
"learning_rate": 3.235808845868641e-05,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17973065376281738,
"step": 1585,
"valid_targets_mean": 5105.2,
"valid_targets_min": 307
},
{
"epoch": 2.5238095238095237,
"grad_norm": 0.41586874944924196,
"learning_rate": 3.229575733754132e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18156777322292328,
"step": 1590,
"valid_targets_mean": 5101.9,
"valid_targets_min": 594
},
{
"epoch": 2.5317460317460316,
"grad_norm": 0.3977154984604151,
"learning_rate": 3.2233233627043765e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19697993993759155,
"step": 1595,
"valid_targets_mean": 5949.2,
"valid_targets_min": 838
},
{
"epoch": 2.5396825396825395,
"grad_norm": 0.3893767013034315,
"learning_rate": 3.217051830650722e-05,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1648177206516266,
"step": 1600,
"valid_targets_mean": 5405.4,
"valid_targets_min": 633
},
{
"epoch": 2.5476190476190474,
"grad_norm": 0.4012855625129347,
"learning_rate": 3.210761235824639e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1662881076335907,
"step": 1605,
"valid_targets_mean": 5683.6,
"valid_targets_min": 775
},
{
"epoch": 2.5555555555555554,
"grad_norm": 0.41653714911973017,
"learning_rate": 3.204451676756175e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1690150797367096,
"step": 1610,
"valid_targets_mean": 5188.4,
"valid_targets_min": 2353
},
{
"epoch": 2.5634920634920633,
"grad_norm": 0.43105631877085077,
"learning_rate": 3.198123252272419e-05,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1893271803855896,
"step": 1615,
"valid_targets_mean": 5241.9,
"valid_targets_min": 2285
},
{
"epoch": 2.571428571428571,
"grad_norm": 0.45967281455616704,
"learning_rate": 3.1917760614959505e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19677485525608063,
"step": 1620,
"valid_targets_mean": 5801.2,
"valid_targets_min": 1301
},
{
"epoch": 2.5793650793650795,
"grad_norm": 0.40150052297597855,
"learning_rate": 3.1854102038432856e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1876111626625061,
"step": 1625,
"valid_targets_mean": 5630.9,
"valid_targets_min": 404
},
{
"epoch": 2.5873015873015874,
"grad_norm": 0.352002911984159,
"learning_rate": 3.17902577902332e-05,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1494748890399933,
"step": 1630,
"valid_targets_mean": 5767.0,
"valid_targets_min": 330
},
{
"epoch": 2.5952380952380953,
"grad_norm": 0.38659122601598817,
"learning_rate": 3.172622887035771e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17912599444389343,
"step": 1635,
"valid_targets_mean": 5444.4,
"valid_targets_min": 260
},
{
"epoch": 2.6031746031746033,
"grad_norm": 0.566374914273737,
"learning_rate": 3.1662016281696073e-05,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1878930926322937,
"step": 1640,
"valid_targets_mean": 4545.0,
"valid_targets_min": 502
},
{
"epoch": 2.611111111111111,
"grad_norm": 0.40019696946056404,
"learning_rate": 3.15976210300148e-05,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19527481496334076,
"step": 1645,
"valid_targets_mean": 5715.0,
"valid_targets_min": 366
},
{
"epoch": 2.619047619047619,
"grad_norm": 0.39423172570166204,
"learning_rate": 3.153304412394143e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1640002578496933,
"step": 1650,
"valid_targets_mean": 5794.7,
"valid_targets_min": 680
},
{
"epoch": 2.626984126984127,
"grad_norm": 0.4024698863549588,
"learning_rate": 3.146828657494883e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1920669972896576,
"step": 1655,
"valid_targets_mean": 5749.9,
"valid_targets_min": 3138
},
{
"epoch": 2.634920634920635,
"grad_norm": 0.3925326135892127,
"learning_rate": 3.140334939733924e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18373993039131165,
"step": 1660,
"valid_targets_mean": 5227.9,
"valid_targets_min": 2482
},
{
"epoch": 2.642857142857143,
"grad_norm": 0.46866690749449025,
"learning_rate": 3.1338233608228455e-05,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17870697379112244,
"step": 1665,
"valid_targets_mean": 5330.0,
"valid_targets_min": 609
},
{
"epoch": 2.6507936507936507,
"grad_norm": 0.3948699322229872,
"learning_rate": 3.127294022752988e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16245272755622864,
"step": 1670,
"valid_targets_mean": 5712.2,
"valid_targets_min": 768
},
{
"epoch": 2.6587301587301586,
"grad_norm": 0.33562761669358987,
"learning_rate": 3.120747027793854e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1378447711467743,
"step": 1675,
"valid_targets_mean": 6322.2,
"valid_targets_min": 674
},
{
"epoch": 2.6666666666666665,
"grad_norm": 0.4080788254926686,
"learning_rate": 3.114182478491509e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16858676075935364,
"step": 1680,
"valid_targets_mean": 5623.9,
"valid_targets_min": 325
},
{
"epoch": 2.674603174603175,
"grad_norm": 0.44788385062808955,
"learning_rate": 3.107600477666969e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17567336559295654,
"step": 1685,
"valid_targets_mean": 5283.2,
"valid_targets_min": 2475
},
{
"epoch": 2.682539682539683,
"grad_norm": 0.3698134704035969,
"learning_rate": 3.1010011284146004e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1585252285003662,
"step": 1690,
"valid_targets_mean": 5612.2,
"valid_targets_min": 1509
},
{
"epoch": 2.6904761904761907,
"grad_norm": 0.4744606363702609,
"learning_rate": 3.0943845341004944e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21260786056518555,
"step": 1695,
"valid_targets_mean": 4632.7,
"valid_targets_min": 268
},
{
"epoch": 2.6984126984126986,
"grad_norm": 0.3925483959574624,
"learning_rate": 3.087750798360856e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1703377664089203,
"step": 1700,
"valid_targets_mean": 6203.7,
"valid_targets_min": 1733
},
{
"epoch": 2.7063492063492065,
"grad_norm": 0.423603961482913,
"learning_rate": 3.0811000251003774e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1864738166332245,
"step": 1705,
"valid_targets_mean": 4999.4,
"valid_targets_min": 633
},
{
"epoch": 2.7142857142857144,
"grad_norm": 0.42173447744798365,
"learning_rate": 3.074432318490608e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17015457153320312,
"step": 1710,
"valid_targets_mean": 4929.1,
"valid_targets_min": 1230
},
{
"epoch": 2.7222222222222223,
"grad_norm": 0.3656999014872132,
"learning_rate": 3.067747782968328e-05,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1662687063217163,
"step": 1715,
"valid_targets_mean": 5857.1,
"valid_targets_min": 1370
},
{
"epoch": 2.7301587301587302,
"grad_norm": 0.4250802423607952,
"learning_rate": 3.0610465232339096e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17572614550590515,
"step": 1720,
"valid_targets_mean": 5605.6,
"valid_targets_min": 895
},
{
"epoch": 2.738095238095238,
"grad_norm": 0.39832850275301074,
"learning_rate": 3.054328644249677e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17158354818820953,
"step": 1725,
"valid_targets_mean": 5492.9,
"valid_targets_min": 1324
},
{
"epoch": 2.746031746031746,
"grad_norm": 0.40611280034429587,
"learning_rate": 3.047594251238265e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17876523733139038,
"step": 1730,
"valid_targets_mean": 5122.9,
"valid_targets_min": 1754
},
{
"epoch": 2.753968253968254,
"grad_norm": 0.3850213501848369,
"learning_rate": 3.0408434496809643e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1557503491640091,
"step": 1735,
"valid_targets_mean": 4817.9,
"valid_targets_min": 346
},
{
"epoch": 2.761904761904762,
"grad_norm": 0.43072814030855905,
"learning_rate": 3.034076345316079e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1973961591720581,
"step": 1740,
"valid_targets_mean": 5802.5,
"valid_targets_min": 1788
},
{
"epoch": 2.7698412698412698,
"grad_norm": 0.4244003572959457,
"learning_rate": 3.0272930441372628e-05,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1777854859828949,
"step": 1745,
"valid_targets_mean": 5021.1,
"valid_targets_min": 1233
},
{
"epoch": 2.7777777777777777,
"grad_norm": 0.3968223319635917,
"learning_rate": 3.02049365239186e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18718859553337097,
"step": 1750,
"valid_targets_mean": 5884.2,
"valid_targets_min": 3484
},
{
"epoch": 2.7857142857142856,
"grad_norm": 0.38979762153827907,
"learning_rate": 3.0136782765792455e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.184782013297081,
"step": 1755,
"valid_targets_mean": 5326.1,
"valid_targets_min": 3768
},
{
"epoch": 2.7936507936507935,
"grad_norm": 0.401430603353089,
"learning_rate": 3.0068470234491517e-05,
"loss": 0.1816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18122202157974243,
"step": 1760,
"valid_targets_mean": 5606.8,
"valid_targets_min": 2889
},
{
"epoch": 2.8015873015873014,
"grad_norm": 0.46774432941464267,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19038715958595276,
"step": 1765,
"valid_targets_mean": 5706.6,
"valid_targets_min": 953
},
{
"epoch": 2.8095238095238093,
"grad_norm": 0.3900657231476483,
"learning_rate": 2.993137313477223e-05,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16720932722091675,
"step": 1770,
"valid_targets_mean": 5955.4,
"valid_targets_min": 229
},
{
"epoch": 2.817460317460317,
"grad_norm": 0.4671446489123995,
"learning_rate": 2.9862590713715837e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1919449269771576,
"step": 1775,
"valid_targets_mean": 4992.8,
"valid_targets_min": 1710
},
{
"epoch": 2.825396825396825,
"grad_norm": 0.4108207960556999,
"learning_rate": 2.9793653814174957e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16805459558963776,
"step": 1780,
"valid_targets_mean": 5892.2,
"valid_targets_min": 1220
},
{
"epoch": 2.8333333333333335,
"grad_norm": 0.3878996578053704,
"learning_rate": 2.9724563515913317e-05,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16483880579471588,
"step": 1785,
"valid_targets_mean": 5715.8,
"valid_targets_min": 816
},
{
"epoch": 2.8412698412698414,
"grad_norm": 0.3924118467590962,
"learning_rate": 2.9655320901097348e-05,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16196705400943756,
"step": 1790,
"valid_targets_mean": 5235.0,
"valid_targets_min": 2689
},
{
"epoch": 2.8492063492063493,
"grad_norm": 0.38981761916486113,
"learning_rate": 2.9585927054279224e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1542998105287552,
"step": 1795,
"valid_targets_mean": 5381.4,
"valid_targets_min": 2263
},
{
"epoch": 2.857142857142857,
"grad_norm": 0.3581946508380772,
"learning_rate": 2.951638306237988e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17149242758750916,
"step": 1800,
"valid_targets_mean": 6313.2,
"valid_targets_min": 1580
},
{
"epoch": 2.865079365079365,
"grad_norm": 0.4494970197989124,
"learning_rate": 2.9446690014671976e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1602257341146469,
"step": 1805,
"valid_targets_mean": 5223.4,
"valid_targets_min": 935
},
{
"epoch": 2.873015873015873,
"grad_norm": 0.37530142354886875,
"learning_rate": 2.937684900276285e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15792617201805115,
"step": 1810,
"valid_targets_mean": 5738.4,
"valid_targets_min": 2336
},
{
"epoch": 2.880952380952381,
"grad_norm": 0.39396887510337375,
"learning_rate": 2.9306861120577416e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15244446694850922,
"step": 1815,
"valid_targets_mean": 5644.9,
"valid_targets_min": 1221
},
{
"epoch": 2.888888888888889,
"grad_norm": 0.3706798220884454,
"learning_rate": 2.923672746434103e-05,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1762312352657318,
"step": 1820,
"valid_targets_mean": 6201.0,
"valid_targets_min": 552
},
{
"epoch": 2.8968253968253967,
"grad_norm": 0.4021984022426286,
"learning_rate": 2.9166449132562303e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2141510546207428,
"step": 1825,
"valid_targets_mean": 5325.4,
"valid_targets_min": 1539
},
{
"epoch": 2.9047619047619047,
"grad_norm": 0.42224038990358104,
"learning_rate": 2.9096027226015927e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18177683651447296,
"step": 1830,
"valid_targets_mean": 4708.6,
"valid_targets_min": 1117
},
{
"epoch": 2.9126984126984126,
"grad_norm": 0.3819006419400972,
"learning_rate": 2.9025462847725405e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16706177592277527,
"step": 1835,
"valid_targets_mean": 6122.9,
"valid_targets_min": 2503
},
{
"epoch": 2.9206349206349205,
"grad_norm": 0.4410064177919863,
"learning_rate": 2.8954757102945798e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2258429080247879,
"step": 1840,
"valid_targets_mean": 4895.2,
"valid_targets_min": 833
},
{
"epoch": 2.928571428571429,
"grad_norm": 0.39487518735853117,
"learning_rate": 2.888391109914638e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17937694489955902,
"step": 1845,
"valid_targets_mean": 5114.6,
"valid_targets_min": 643
},
{
"epoch": 2.9365079365079367,
"grad_norm": 0.38265019511969883,
"learning_rate": 2.8812925945993333e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17933601140975952,
"step": 1850,
"valid_targets_mean": 5663.7,
"valid_targets_min": 1513
},
{
"epoch": 2.9444444444444446,
"grad_norm": 0.402651671534175,
"learning_rate": 2.8741802755332332e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17298966646194458,
"step": 1855,
"valid_targets_mean": 4725.4,
"valid_targets_min": 403
},
{
"epoch": 2.9523809523809526,
"grad_norm": 0.43929484251032125,
"learning_rate": 2.8670542641171155e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19994154572486877,
"step": 1860,
"valid_targets_mean": 4797.8,
"valid_targets_min": 657
},
{
"epoch": 2.9603174603174605,
"grad_norm": 0.40410989413843573,
"learning_rate": 2.859914671966221e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17386558651924133,
"step": 1865,
"valid_targets_mean": 4977.1,
"valid_targets_min": 670
},
{
"epoch": 2.9682539682539684,
"grad_norm": 0.346301301173511,
"learning_rate": 2.8527616109085082e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15783601999282837,
"step": 1870,
"valid_targets_mean": 5833.5,
"valid_targets_min": 1896
},
{
"epoch": 2.9761904761904763,
"grad_norm": 0.38049759940528577,
"learning_rate": 2.8455951929828977e-05,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15591737627983093,
"step": 1875,
"valid_targets_mean": 5575.6,
"valid_targets_min": 295
},
{
"epoch": 2.984126984126984,
"grad_norm": 0.3831654484686578,
"learning_rate": 2.8384155304375223e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19842402637004852,
"step": 1880,
"valid_targets_mean": 6079.8,
"valid_targets_min": 1937
},
{
"epoch": 2.992063492063492,
"grad_norm": 0.487008799638132,
"learning_rate": 2.8312227357279646e-05,
"loss": 0.1851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.192101389169693,
"step": 1885,
"valid_targets_mean": 4321.4,
"valid_targets_min": 342
},
{
"epoch": 3.0,
"grad_norm": 0.5184260476406786,
"learning_rate": 2.8240169215154977e-05,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1595619022846222,
"step": 1890,
"valid_targets_mean": 5334.9,
"valid_targets_min": 325
},
{
"epoch": 3.007936507936508,
"grad_norm": 0.3405314330974361,
"learning_rate": 2.8167982006653196e-05,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15521922707557678,
"step": 1895,
"valid_targets_mean": 6951.9,
"valid_targets_min": 3834
},
{
"epoch": 3.015873015873016,
"grad_norm": 0.44531826407382213,
"learning_rate": 2.8095666862447876e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18891948461532593,
"step": 1900,
"valid_targets_mean": 5601.6,
"valid_targets_min": 2266
},
{
"epoch": 3.0238095238095237,
"grad_norm": 0.3667355362457471,
"learning_rate": 2.8023224915216442e-05,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13565120100975037,
"step": 1905,
"valid_targets_mean": 6374.4,
"valid_targets_min": 1807
},
{
"epoch": 3.0317460317460316,
"grad_norm": 0.36488467668267915,
"learning_rate": 2.795065729962244e-05,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15088070929050446,
"step": 1910,
"valid_targets_mean": 6743.3,
"valid_targets_min": 3371
},
{
"epoch": 3.0396825396825395,
"grad_norm": 0.5240072304479968,
"learning_rate": 2.7877965152297785e-05,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16858817636966705,
"step": 1915,
"valid_targets_mean": 5218.3,
"valid_targets_min": 325
},
{
"epoch": 3.0476190476190474,
"grad_norm": 0.4345088557078499,
"learning_rate": 2.780514961182492e-05,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18977370858192444,
"step": 1920,
"valid_targets_mean": 6161.9,
"valid_targets_min": 978
},
{
"epoch": 3.0555555555555554,
"grad_norm": 0.43067510343421206,
"learning_rate": 2.773221181871903e-05,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15231278538703918,
"step": 1925,
"valid_targets_mean": 5256.0,
"valid_targets_min": 1166
},
{
"epoch": 3.0634920634920633,
"grad_norm": 0.4329109482212343,
"learning_rate": 2.765915291541013e-05,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1648765504360199,
"step": 1930,
"valid_targets_mean": 5768.6,
"valid_targets_min": 2664
},
{
"epoch": 3.0714285714285716,
"grad_norm": 0.4360393225780438,
"learning_rate": 2.7585974046225206e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16902469098567963,
"step": 1935,
"valid_targets_mean": 4864.1,
"valid_targets_min": 1763
},
{
"epoch": 3.0793650793650795,
"grad_norm": 0.42242563176181436,
"learning_rate": 2.751267635737027e-05,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15772101283073425,
"step": 1940,
"valid_targets_mean": 5512.9,
"valid_targets_min": 340
},
{
"epoch": 3.0873015873015874,
"grad_norm": 0.38359983981254425,
"learning_rate": 2.7439260996912423e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.171489417552948,
"step": 1945,
"valid_targets_mean": 5938.1,
"valid_targets_min": 2752
},
{
"epoch": 3.0952380952380953,
"grad_norm": 0.41322753491472525,
"learning_rate": 2.7365729114761862e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15758131444454193,
"step": 1950,
"valid_targets_mean": 5200.1,
"valid_targets_min": 370
},
{
"epoch": 3.1031746031746033,
"grad_norm": 0.4186192867390412,
"learning_rate": 2.729208186265386e-05,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14994092285633087,
"step": 1955,
"valid_targets_mean": 5166.9,
"valid_targets_min": 251
},
{
"epoch": 3.111111111111111,
"grad_norm": 0.3644255779428956,
"learning_rate": 2.721832039413077e-05,
"loss": 0.1513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14574278891086578,
"step": 1960,
"valid_targets_mean": 6365.3,
"valid_targets_min": 1939
},
{
"epoch": 3.119047619047619,
"grad_norm": 0.41549829471711147,
"learning_rate": 2.7144445864523887e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15822090208530426,
"step": 1965,
"valid_targets_mean": 5193.6,
"valid_targets_min": 300
},
{
"epoch": 3.126984126984127,
"grad_norm": 0.4080754517778744,
"learning_rate": 2.7070459430935407e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18438664078712463,
"step": 1970,
"valid_targets_mean": 6076.5,
"valid_targets_min": 366
},
{
"epoch": 3.134920634920635,
"grad_norm": 0.34845655756539395,
"learning_rate": 2.69963622522203e-05,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1505107879638672,
"step": 1975,
"valid_targets_mean": 7000.2,
"valid_targets_min": 867
},
{
"epoch": 3.142857142857143,
"grad_norm": 0.3957443526395654,
"learning_rate": 2.6922155488968117e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15863436460494995,
"step": 1980,
"valid_targets_mean": 6114.2,
"valid_targets_min": 1754
},
{
"epoch": 3.1507936507936507,
"grad_norm": 0.3987157816987954,
"learning_rate": 2.684784030348486e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1591426432132721,
"step": 1985,
"valid_targets_mean": 5729.1,
"valid_targets_min": 2795
},
{
"epoch": 3.1587301587301586,
"grad_norm": 0.3311471215567983,
"learning_rate": 2.6773417859774755e-05,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13412167131900787,
"step": 1990,
"valid_targets_mean": 7218.6,
"valid_targets_min": 5066
},
{
"epoch": 3.1666666666666665,
"grad_norm": 0.44452141015453234,
"learning_rate": 2.669888932352201e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14640459418296814,
"step": 1995,
"valid_targets_mean": 4116.0,
"valid_targets_min": 582
},
{
"epoch": 3.1746031746031744,
"grad_norm": 0.4296245823041024,
"learning_rate": 2.662425586207259e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18060961365699768,
"step": 2000,
"valid_targets_mean": 5717.8,
"valid_targets_min": 2684
},
{
"epoch": 3.1825396825396823,
"grad_norm": 0.44161933967338207,
"learning_rate": 2.6549518644415876e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13894905149936676,
"step": 2005,
"valid_targets_mean": 5385.4,
"valid_targets_min": 1651
},
{
"epoch": 3.1904761904761907,
"grad_norm": 0.4402027862054312,
"learning_rate": 2.6474678841166426e-05,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15985198318958282,
"step": 2010,
"valid_targets_mean": 4908.7,
"valid_targets_min": 263
},
{
"epoch": 3.1984126984126986,
"grad_norm": 0.4521093840332604,
"learning_rate": 2.639973762454558e-05,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17308469116687775,
"step": 2015,
"valid_targets_mean": 5940.6,
"valid_targets_min": 2224
},
{
"epoch": 3.2063492063492065,
"grad_norm": 0.44949779778305143,
"learning_rate": 2.6324696168363134e-05,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16031065583229065,
"step": 2020,
"valid_targets_mean": 4588.2,
"valid_targets_min": 1570
},
{
"epoch": 3.2142857142857144,
"grad_norm": 0.44736879299802484,
"learning_rate": 2.624955564799894e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18750852346420288,
"step": 2025,
"valid_targets_mean": 4769.4,
"valid_targets_min": 558
},
{
"epoch": 3.2222222222222223,
"grad_norm": 0.4063469374069734,
"learning_rate": 2.617431724038451e-05,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15944424271583557,
"step": 2030,
"valid_targets_mean": 5581.2,
"valid_targets_min": 1012
},
{
"epoch": 3.2301587301587302,
"grad_norm": 0.4237562908407849,
"learning_rate": 2.609898212398455e-05,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15621069073677063,
"step": 2035,
"valid_targets_mean": 5366.9,
"valid_targets_min": 1168
},
{
"epoch": 3.238095238095238,
"grad_norm": 0.39370444783531333,
"learning_rate": 2.6023551478778535e-05,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14452454447746277,
"step": 2040,
"valid_targets_mean": 5937.5,
"valid_targets_min": 225
},
{
"epoch": 3.246031746031746,
"grad_norm": 0.49270720514980915,
"learning_rate": 2.5948026486242225e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724134087562561,
"step": 2045,
"valid_targets_mean": 3770.9,
"valid_targets_min": 767
},
{
"epoch": 3.253968253968254,
"grad_norm": 0.4577588443456724,
"learning_rate": 2.5872408329329136e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13135287165641785,
"step": 2050,
"valid_targets_mean": 5848.4,
"valid_targets_min": 2027
},
{
"epoch": 3.261904761904762,
"grad_norm": 0.44271121122885954,
"learning_rate": 2.5796698192452016e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16199621558189392,
"step": 2055,
"valid_targets_mean": 4766.6,
"valid_targets_min": 404
},
{
"epoch": 3.2698412698412698,
"grad_norm": 0.39031087916457097,
"learning_rate": 2.572089726146432e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16037863492965698,
"step": 2060,
"valid_targets_mean": 5805.1,
"valid_targets_min": 728
},
{
"epoch": 3.2777777777777777,
"grad_norm": 0.4646573659873822,
"learning_rate": 2.564500672364162e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.162231907248497,
"step": 2065,
"valid_targets_mean": 4860.0,
"valid_targets_min": 260
},
{
"epoch": 3.2857142857142856,
"grad_norm": 0.3990327001371696,
"learning_rate": 2.556902776766298e-05,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15069621801376343,
"step": 2070,
"valid_targets_mean": 5909.9,
"valid_targets_min": 1698
},
{
"epoch": 3.2936507936507935,
"grad_norm": 0.43271648198961715,
"learning_rate": 2.5492961583592397e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.170293927192688,
"step": 2075,
"valid_targets_mean": 5133.9,
"valid_targets_min": 1647
},
{
"epoch": 3.3015873015873014,
"grad_norm": 0.44977807483400484,
"learning_rate": 2.5416809362860107e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18963780999183655,
"step": 2080,
"valid_targets_mean": 4750.8,
"valid_targets_min": 559
},
{
"epoch": 3.3095238095238093,
"grad_norm": 0.3681715462106892,
"learning_rate": 2.5340572298243946e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1364738941192627,
"step": 2085,
"valid_targets_mean": 6450.1,
"valid_targets_min": 4105
},
{
"epoch": 3.317460317460317,
"grad_norm": 0.45380051213619826,
"learning_rate": 2.5264251583850677e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1766563057899475,
"step": 2090,
"valid_targets_mean": 4932.4,
"valid_targets_min": 342
},
{
"epoch": 3.3253968253968256,
"grad_norm": 0.34929908788411107,
"learning_rate": 2.518784841509726e-05,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.142880380153656,
"step": 2095,
"valid_targets_mean": 7236.7,
"valid_targets_min": 3519
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.42494242702127294,
"learning_rate": 2.511136398869216e-05,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1457439363002777,
"step": 2100,
"valid_targets_mean": 5273.4,
"valid_targets_min": 2522
},
{
"epoch": 3.3412698412698414,
"grad_norm": 0.41871282992961945,
"learning_rate": 2.503479950261658e-05,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14400547742843628,
"step": 2105,
"valid_targets_mean": 5479.6,
"valid_targets_min": 1124
},
{
"epoch": 3.3492063492063493,
"grad_norm": 0.41199941257756795,
"learning_rate": 2.4958156156105693e-05,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16985690593719482,
"step": 2110,
"valid_targets_mean": 5431.3,
"valid_targets_min": 322
},
{
"epoch": 3.357142857142857,
"grad_norm": 0.41511677551741843,
"learning_rate": 2.4881435149629892e-05,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15738296508789062,
"step": 2115,
"valid_targets_mean": 5947.6,
"valid_targets_min": 1723
},
{
"epoch": 3.365079365079365,
"grad_norm": 0.3658736974288424,
"learning_rate": 2.4804637684875937e-05,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1301427185535431,
"step": 2120,
"valid_targets_mean": 7314.8,
"valid_targets_min": 534
},
{
"epoch": 3.373015873015873,
"grad_norm": 0.4048532254523095,
"learning_rate": 2.4727764964728177e-05,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15161439776420593,
"step": 2125,
"valid_targets_mean": 5149.5,
"valid_targets_min": 2014
},
{
"epoch": 3.380952380952381,
"grad_norm": 0.3829760082289399,
"learning_rate": 2.4650818193249693e-05,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14068162441253662,
"step": 2130,
"valid_targets_mean": 5836.1,
"valid_targets_min": 1685
},
{
"epoch": 3.388888888888889,
"grad_norm": 0.4507430940791641,
"learning_rate": 2.4573798575663425e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16859221458435059,
"step": 2135,
"valid_targets_mean": 5247.2,
"valid_targets_min": 311
},
{
"epoch": 3.3968253968253967,
"grad_norm": 0.47784011418612515,
"learning_rate": 2.4496707318333323e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.176387220621109,
"step": 2140,
"valid_targets_mean": 4379.1,
"valid_targets_min": 1066
},
{
"epoch": 3.4047619047619047,
"grad_norm": 0.41751426715134293,
"learning_rate": 2.441954562874541e-05,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1648518145084381,
"step": 2145,
"valid_targets_mean": 5245.0,
"valid_targets_min": 1607
},
{
"epoch": 3.4126984126984126,
"grad_norm": 0.34417394477532504,
"learning_rate": 2.434231471548893e-05,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16924996674060822,
"step": 2150,
"valid_targets_mean": 7679.7,
"valid_targets_min": 4644
},
{
"epoch": 3.4206349206349205,
"grad_norm": 0.4099313742801725,
"learning_rate": 2.4265015788237348e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1553308665752411,
"step": 2155,
"valid_targets_mean": 5291.8,
"valid_targets_min": 1013
},
{
"epoch": 3.4285714285714284,
"grad_norm": 0.3644179150651529,
"learning_rate": 2.4187650057729465e-05,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13109582662582397,
"step": 2160,
"valid_targets_mean": 6145.5,
"valid_targets_min": 395
},
{
"epoch": 3.4365079365079367,
"grad_norm": 0.4344903235604141,
"learning_rate": 2.4110218735750403e-05,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16567984223365784,
"step": 2165,
"valid_targets_mean": 5219.4,
"valid_targets_min": 272
},
{
"epoch": 3.4444444444444446,
"grad_norm": 0.44162025985134756,
"learning_rate": 2.4032723035112667e-05,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17561107873916626,
"step": 2170,
"valid_targets_mean": 4544.6,
"valid_targets_min": 776
},
{
"epoch": 3.4523809523809526,
"grad_norm": 0.3932602300074192,
"learning_rate": 2.3955164169637124e-05,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15324220061302185,
"step": 2175,
"valid_targets_mean": 5706.5,
"valid_targets_min": 347
},
{
"epoch": 3.4603174603174605,
"grad_norm": 0.42827386189990235,
"learning_rate": 2.387754335413398e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15386894345283508,
"step": 2180,
"valid_targets_mean": 4324.1,
"valid_targets_min": 373
},
{
"epoch": 3.4682539682539684,
"grad_norm": 0.41357075683918504,
"learning_rate": 2.3799861804383807e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15950973331928253,
"step": 2185,
"valid_targets_mean": 5571.4,
"valid_targets_min": 1700
},
{
"epoch": 3.4761904761904763,
"grad_norm": 0.4041812547912995,
"learning_rate": 2.3722120737118414e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1401449292898178,
"step": 2190,
"valid_targets_mean": 5355.0,
"valid_targets_min": 657
},
{
"epoch": 3.484126984126984,
"grad_norm": 0.4349818563348464,
"learning_rate": 2.3644321370001868e-05,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16082270443439484,
"step": 2195,
"valid_targets_mean": 4887.8,
"valid_targets_min": 201
},
{
"epoch": 3.492063492063492,
"grad_norm": 0.41308220488892183,
"learning_rate": 2.3566464921611393e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16265086829662323,
"step": 2200,
"valid_targets_mean": 5437.2,
"valid_targets_min": 625
},
{
"epoch": 3.5,
"grad_norm": 0.4212037346610392,
"learning_rate": 2.348855261141827e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16348662972450256,
"step": 2205,
"valid_targets_mean": 4889.4,
"valid_targets_min": 783
},
{
"epoch": 3.507936507936508,
"grad_norm": 0.4704570906062029,
"learning_rate": 2.341058565976874e-05,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20820948481559753,
"step": 2210,
"valid_targets_mean": 5980.6,
"valid_targets_min": 961
},
{
"epoch": 3.515873015873016,
"grad_norm": 0.5036481968595117,
"learning_rate": 2.3332565287864918e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15473511815071106,
"step": 2215,
"valid_targets_mean": 5321.4,
"valid_targets_min": 1443
},
{
"epoch": 3.5238095238095237,
"grad_norm": 0.3735233109636718,
"learning_rate": 2.325449271774563e-05,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14910230040550232,
"step": 2220,
"valid_targets_mean": 6132.2,
"valid_targets_min": 1324
},
{
"epoch": 3.5317460317460316,
"grad_norm": 0.444413935820999,
"learning_rate": 2.3176369172267286e-05,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17016586661338806,
"step": 2225,
"valid_targets_mean": 4620.8,
"valid_targets_min": 1621
},
{
"epoch": 3.5396825396825395,
"grad_norm": 0.3953957921849172,
"learning_rate": 2.3098195875084732e-05,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15769408643245697,
"step": 2230,
"valid_targets_mean": 5690.9,
"valid_targets_min": 764
},
{
"epoch": 3.5476190476190474,
"grad_norm": 0.5077199865444484,
"learning_rate": 2.301997405063208e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15993595123291016,
"step": 2235,
"valid_targets_mean": 5084.5,
"valid_targets_min": 281
},
{
"epoch": 3.5555555555555554,
"grad_norm": 0.4086230414672359,
"learning_rate": 2.2941704924103535e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1494399756193161,
"step": 2240,
"valid_targets_mean": 5467.4,
"valid_targets_min": 327
},
{
"epoch": 3.5634920634920633,
"grad_norm": 0.42370220867636965,
"learning_rate": 2.2863389721434165e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16436323523521423,
"step": 2245,
"valid_targets_mean": 6613.1,
"valid_targets_min": 301
},
{
"epoch": 3.571428571428571,
"grad_norm": 0.47414264477785967,
"learning_rate": 2.2785029669280775e-05,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16836649179458618,
"step": 2250,
"valid_targets_mean": 4143.4,
"valid_targets_min": 1765
},
{
"epoch": 3.5793650793650795,
"grad_norm": 0.4279968424111969,
"learning_rate": 2.2706625995002626e-05,
"loss": 0.1602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15963539481163025,
"step": 2255,
"valid_targets_mean": 5683.1,
"valid_targets_min": 677
},
{
"epoch": 3.5873015873015874,
"grad_norm": 0.43551657194367943,
"learning_rate": 2.262817992664224e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15465790033340454,
"step": 2260,
"valid_targets_mean": 5270.2,
"valid_targets_min": 792
},
{
"epoch": 3.5952380952380953,
"grad_norm": 0.473618019837446,
"learning_rate": 2.2549692692906158e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19456999003887177,
"step": 2265,
"valid_targets_mean": 4033.5,
"valid_targets_min": 1118
},
{
"epoch": 3.6031746031746033,
"grad_norm": 0.4610864812937639,
"learning_rate": 2.24711655231457e-05,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16838069260120392,
"step": 2270,
"valid_targets_mean": 4850.8,
"valid_targets_min": 893
},
{
"epoch": 3.611111111111111,
"grad_norm": 0.4183921042676627,
"learning_rate": 2.2392599647337724e-05,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15832781791687012,
"step": 2275,
"valid_targets_mean": 5614.7,
"valid_targets_min": 2089
},
{
"epoch": 3.619047619047619,
"grad_norm": 0.4746926085970967,
"learning_rate": 2.23139962960653e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17942070960998535,
"step": 2280,
"valid_targets_mean": 4651.3,
"valid_targets_min": 217
},
{
"epoch": 3.626984126984127,
"grad_norm": 0.42504033178119727,
"learning_rate": 2.2235356700498528e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1609695851802826,
"step": 2285,
"valid_targets_mean": 5650.9,
"valid_targets_min": 693
},
{
"epoch": 3.634920634920635,
"grad_norm": 0.35104401078143266,
"learning_rate": 2.2156682092375175e-05,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14197728037834167,
"step": 2290,
"valid_targets_mean": 6449.4,
"valid_targets_min": 2699
},
{
"epoch": 3.642857142857143,
"grad_norm": 0.48629893819073916,
"learning_rate": 2.2077973703981423e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.171891987323761,
"step": 2295,
"valid_targets_mean": 5000.9,
"valid_targets_min": 325
},
{
"epoch": 3.6507936507936507,
"grad_norm": 0.38982495934645944,
"learning_rate": 2.1999232768132552e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15166640281677246,
"step": 2300,
"valid_targets_mean": 5598.8,
"valid_targets_min": 899
},
{
"epoch": 3.6587301587301586,
"grad_norm": 0.4538805178933535,
"learning_rate": 2.1920460518153637e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13476833701133728,
"step": 2305,
"valid_targets_mean": 4883.2,
"valid_targets_min": 655
},
{
"epoch": 3.6666666666666665,
"grad_norm": 0.4650060205808812,
"learning_rate": 2.1841658187860232e-05,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1431887298822403,
"step": 2310,
"valid_targets_mean": 5863.8,
"valid_targets_min": 2487
},
{
"epoch": 3.674603174603175,
"grad_norm": 0.40827307741804697,
"learning_rate": 2.176282701153904e-05,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16187241673469543,
"step": 2315,
"valid_targets_mean": 5186.4,
"valid_targets_min": 881
},
{
"epoch": 3.682539682539683,
"grad_norm": 0.40111783297909087,
"learning_rate": 2.1683968223928572e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1610245704650879,
"step": 2320,
"valid_targets_mean": 5193.5,
"valid_targets_min": 2007
},
{
"epoch": 3.6904761904761907,
"grad_norm": 0.4108636912566655,
"learning_rate": 2.1605083060199835e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19376526772975922,
"step": 2325,
"valid_targets_mean": 5273.6,
"valid_targets_min": 918
},
{
"epoch": 3.6984126984126986,
"grad_norm": 0.4090720045772208,
"learning_rate": 2.152617275593694e-05,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1690284013748169,
"step": 2330,
"valid_targets_mean": 5263.3,
"valid_targets_min": 1166
},
{
"epoch": 3.7063492063492065,
"grad_norm": 0.37473461724981033,
"learning_rate": 2.144723854711781e-05,
"loss": 0.1513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14938317239284515,
"step": 2335,
"valid_targets_mean": 5389.9,
"valid_targets_min": 574
},
{
"epoch": 3.7142857142857144,
"grad_norm": 0.4843387089458587,
"learning_rate": 2.1368281670094766e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17382203042507172,
"step": 2340,
"valid_targets_mean": 4600.9,
"valid_targets_min": 1981
},
{
"epoch": 3.7222222222222223,
"grad_norm": 0.4119585290716737,
"learning_rate": 2.1289303361575175e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15374284982681274,
"step": 2345,
"valid_targets_mean": 5633.0,
"valid_targets_min": 2046
},
{
"epoch": 3.7301587301587302,
"grad_norm": 0.3952648176140555,
"learning_rate": 2.121030485860211e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17831559479236603,
"step": 2350,
"valid_targets_mean": 5893.4,
"valid_targets_min": 2787
},
{
"epoch": 3.738095238095238,
"grad_norm": 0.41411933208876145,
"learning_rate": 2.113128739853493e-05,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17142191529273987,
"step": 2355,
"valid_targets_mean": 5256.2,
"valid_targets_min": 542
},
{
"epoch": 3.746031746031746,
"grad_norm": 0.45575184540137365,
"learning_rate": 2.1052252219029944e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1489437222480774,
"step": 2360,
"valid_targets_mean": 5599.4,
"valid_targets_min": 360
},
{
"epoch": 3.753968253968254,
"grad_norm": 0.38228242544809465,
"learning_rate": 2.0973200558020967e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1508997082710266,
"step": 2365,
"valid_targets_mean": 5869.1,
"valid_targets_min": 3409
},
{
"epoch": 3.761904761904762,
"grad_norm": 0.4148754628490215,
"learning_rate": 2.0894133653700005e-05,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1601417064666748,
"step": 2370,
"valid_targets_mean": 5959.2,
"valid_targets_min": 778
},
{
"epoch": 3.7698412698412698,
"grad_norm": 0.39421365324647456,
"learning_rate": 2.0815052744497795e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16802407801151276,
"step": 2375,
"valid_targets_mean": 5507.4,
"valid_targets_min": 539
},
{
"epoch": 3.7777777777777777,
"grad_norm": 0.4179727695736473,
"learning_rate": 2.0735959069064434e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1505141705274582,
"step": 2380,
"valid_targets_mean": 4560.2,
"valid_targets_min": 946
},
{
"epoch": 3.7857142857142856,
"grad_norm": 0.4025223262448166,
"learning_rate": 2.065685386624999e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16200333833694458,
"step": 2385,
"valid_targets_mean": 5546.6,
"valid_targets_min": 2114
},
{
"epoch": 3.7936507936507935,
"grad_norm": 0.42971080125523514,
"learning_rate": 2.0577738375085076e-05,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13847434520721436,
"step": 2390,
"valid_targets_mean": 4286.1,
"valid_targets_min": 670
},
{
"epoch": 3.8015873015873014,
"grad_norm": 0.4040671130609569,
"learning_rate": 2.0498613834761462e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16613656282424927,
"step": 2395,
"valid_targets_mean": 5606.1,
"valid_targets_min": 1122
},
{
"epoch": 3.8095238095238093,
"grad_norm": 0.4104422551171815,
"learning_rate": 2.041948148461264e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16815027594566345,
"step": 2400,
"valid_targets_mean": 6071.4,
"valid_targets_min": 1424
},
{
"epoch": 3.817460317460317,
"grad_norm": 0.433862516805992,
"learning_rate": 2.0340342564094436e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1456870138645172,
"step": 2405,
"valid_targets_mean": 4660.6,
"valid_targets_min": 300
},
{
"epoch": 3.825396825396825,
"grad_norm": 0.37026873619906453,
"learning_rate": 2.0261198312765597e-05,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17130400240421295,
"step": 2410,
"valid_targets_mean": 7170.6,
"valid_targets_min": 3870
},
{
"epoch": 3.8333333333333335,
"grad_norm": 0.37774101351813544,
"learning_rate": 2.0182049970268355e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1540232002735138,
"step": 2415,
"valid_targets_mean": 5801.1,
"valid_targets_min": 2004
},
{
"epoch": 3.8412698412698414,
"grad_norm": 0.40806762468519775,
"learning_rate": 2.010289877630902e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1633833944797516,
"step": 2420,
"valid_targets_mean": 6180.1,
"valid_targets_min": 278
},
{
"epoch": 3.8492063492063493,
"grad_norm": 0.4658635857688465,
"learning_rate": 2.002374597063858e-05,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14994177222251892,
"step": 2425,
"valid_targets_mean": 5532.7,
"valid_targets_min": 741
},
{
"epoch": 3.857142857142857,
"grad_norm": 0.48235346332409923,
"learning_rate": 1.9944592793033255e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1955932080745697,
"step": 2430,
"valid_targets_mean": 4724.8,
"valid_targets_min": 766
},
{
"epoch": 3.865079365079365,
"grad_norm": 0.8801286649564228,
"learning_rate": 1.9865440483275086e-05,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1733412742614746,
"step": 2435,
"valid_targets_mean": 5920.0,
"valid_targets_min": 2207
},
{
"epoch": 3.873015873015873,
"grad_norm": 0.4518531270411737,
"learning_rate": 1.978629028113254e-05,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15560846030712128,
"step": 2440,
"valid_targets_mean": 4698.5,
"valid_targets_min": 369
},
{
"epoch": 3.880952380952381,
"grad_norm": 0.4095907564342567,
"learning_rate": 1.9707143426341058e-05,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14006567001342773,
"step": 2445,
"valid_targets_mean": 5711.9,
"valid_targets_min": 1934
},
{
"epoch": 3.888888888888889,
"grad_norm": 0.38371188352350993,
"learning_rate": 1.962800115858364e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15609079599380493,
"step": 2450,
"valid_targets_mean": 6032.2,
"valid_targets_min": 1733
},
{
"epoch": 3.8968253968253967,
"grad_norm": 0.4118539842920471,
"learning_rate": 1.9548864717471472e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14997440576553345,
"step": 2455,
"valid_targets_mean": 4638.2,
"valid_targets_min": 2217
},
{
"epoch": 3.9047619047619047,
"grad_norm": 0.4025039557270683,
"learning_rate": 1.9469735342524454e-05,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1860060691833496,
"step": 2460,
"valid_targets_mean": 5977.4,
"valid_targets_min": 1525
},
{
"epoch": 3.9126984126984126,
"grad_norm": 0.4033220910310328,
"learning_rate": 1.939061427315179e-05,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1573881059885025,
"step": 2465,
"valid_targets_mean": 5562.9,
"valid_targets_min": 466
},
{
"epoch": 3.9206349206349205,
"grad_norm": 0.40909002728066796,
"learning_rate": 1.931150274863265e-05,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1574082374572754,
"step": 2470,
"valid_targets_mean": 5320.6,
"valid_targets_min": 397
},
{
"epoch": 3.928571428571429,
"grad_norm": 0.42869522285562844,
"learning_rate": 1.9232402008096643e-05,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19264186918735504,
"step": 2475,
"valid_targets_mean": 5145.9,
"valid_targets_min": 764
},
{
"epoch": 3.9365079365079367,
"grad_norm": 0.40381020748858665,
"learning_rate": 1.9153313290504495e-05,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13736480474472046,
"step": 2480,
"valid_targets_mean": 5991.2,
"valid_targets_min": 1935
},
{
"epoch": 3.9444444444444446,
"grad_norm": 0.44514859085692043,
"learning_rate": 1.9074237834628623e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14704057574272156,
"step": 2485,
"valid_targets_mean": 5541.5,
"valid_targets_min": 2647
},
{
"epoch": 3.9523809523809526,
"grad_norm": 0.4265501479636169,
"learning_rate": 1.8995176879033698e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18036606907844543,
"step": 2490,
"valid_targets_mean": 5466.8,
"valid_targets_min": 906
},
{
"epoch": 3.9603174603174605,
"grad_norm": 0.4487206178934192,
"learning_rate": 1.89161316620573e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17454467713832855,
"step": 2495,
"valid_targets_mean": 5006.6,
"valid_targets_min": 287
},
{
"epoch": 3.9682539682539684,
"grad_norm": 0.4033222789710387,
"learning_rate": 1.8837103421790486e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15375812351703644,
"step": 2500,
"valid_targets_mean": 6142.2,
"valid_targets_min": 1358
},
{
"epoch": 3.9761904761904763,
"grad_norm": 0.46326929396533706,
"learning_rate": 1.8758093396058386e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17514026165008545,
"step": 2505,
"valid_targets_mean": 5165.4,
"valid_targets_min": 2275
},
{
"epoch": 3.984126984126984,
"grad_norm": 0.40301115402832177,
"learning_rate": 1.8679102822400874e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15668317675590515,
"step": 2510,
"valid_targets_mean": 5199.4,
"valid_targets_min": 211
},
{
"epoch": 3.992063492063492,
"grad_norm": 0.4789393713046297,
"learning_rate": 1.8600132938053098e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19280311465263367,
"step": 2515,
"valid_targets_mean": 4916.7,
"valid_targets_min": 1007
},
{
"epoch": 4.0,
"grad_norm": 0.46667355097734303,
"learning_rate": 1.8521184979926177e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1989072561264038,
"step": 2520,
"valid_targets_mean": 5119.9,
"valid_targets_min": 207
},
{
"epoch": 4.007936507936508,
"grad_norm": 0.3847916291760838,
"learning_rate": 1.8442260184587804e-05,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16161227226257324,
"step": 2525,
"valid_targets_mean": 6026.6,
"valid_targets_min": 2419
},
{
"epoch": 4.015873015873016,
"grad_norm": 0.4090621169152007,
"learning_rate": 1.8363359788242842e-05,
"loss": 0.1388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14368446171283722,
"step": 2530,
"valid_targets_mean": 5862.6,
"valid_targets_min": 782
},
{
"epoch": 4.023809523809524,
"grad_norm": 0.6141566166940376,
"learning_rate": 1.8284485026714013e-05,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13589806854724884,
"step": 2535,
"valid_targets_mean": 6541.5,
"valid_targets_min": 1485
},
{
"epoch": 4.031746031746032,
"grad_norm": 0.4391239898708553,
"learning_rate": 1.8205637135422525e-05,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15070083737373352,
"step": 2540,
"valid_targets_mean": 5536.8,
"valid_targets_min": 938
},
{
"epoch": 4.0396825396825395,
"grad_norm": 0.41333666376927736,
"learning_rate": 1.8126817349368697e-05,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1329149305820465,
"step": 2545,
"valid_targets_mean": 5577.3,
"valid_targets_min": 1320
},
{
"epoch": 4.0476190476190474,
"grad_norm": 0.42756859856165286,
"learning_rate": 1.8048026903112632e-05,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1718430519104004,
"step": 2550,
"valid_targets_mean": 5278.7,
"valid_targets_min": 1393
},
{
"epoch": 4.055555555555555,
"grad_norm": 0.7929559502540676,
"learning_rate": 1.7969267030754903e-05,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1519625186920166,
"step": 2555,
"valid_targets_mean": 4177.6,
"valid_targets_min": 290
},
{
"epoch": 4.063492063492063,
"grad_norm": 0.43339872921712147,
"learning_rate": 1.7890538965917184e-05,
"loss": 0.1359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12034216523170471,
"step": 2560,
"valid_targets_mean": 5259.5,
"valid_targets_min": 600
},
{
"epoch": 4.071428571428571,
"grad_norm": 0.4431280646696749,
"learning_rate": 1.7811843941722952e-05,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16165150701999664,
"step": 2565,
"valid_targets_mean": 5233.3,
"valid_targets_min": 343
},
{
"epoch": 4.079365079365079,
"grad_norm": 0.4733813623577339,
"learning_rate": 1.7733183190778174e-05,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17020142078399658,
"step": 2570,
"valid_targets_mean": 4545.4,
"valid_targets_min": 852
},
{
"epoch": 4.087301587301587,
"grad_norm": 0.4256609723968049,
"learning_rate": 1.7654557945151968e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16018405556678772,
"step": 2575,
"valid_targets_mean": 5520.1,
"valid_targets_min": 2986
},
{
"epoch": 4.095238095238095,
"grad_norm": 0.41262793853257446,
"learning_rate": 1.7575969436357352e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13311775028705597,
"step": 2580,
"valid_targets_mean": 5285.7,
"valid_targets_min": 1788
},
{
"epoch": 4.103174603174603,
"grad_norm": 0.45945223536796,
"learning_rate": 1.7497418895331934e-05,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14666880667209625,
"step": 2585,
"valid_targets_mean": 4386.4,
"valid_targets_min": 325
},
{
"epoch": 4.111111111111111,
"grad_norm": 0.4675580885936456,
"learning_rate": 1.7418907552418597e-05,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15302041172981262,
"step": 2590,
"valid_targets_mean": 5458.4,
"valid_targets_min": 2918
},
{
"epoch": 4.119047619047619,
"grad_norm": 0.43934364103885165,
"learning_rate": 1.7340436637346315e-05,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14084570109844208,
"step": 2595,
"valid_targets_mean": 4983.3,
"valid_targets_min": 1133
},
{
"epoch": 4.1269841269841265,
"grad_norm": 0.4164892763919611,
"learning_rate": 1.726200737921079e-05,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12312793731689453,
"step": 2600,
"valid_targets_mean": 6296.2,
"valid_targets_min": 596
},
{
"epoch": 4.134920634920635,
"grad_norm": 0.4532045098767217,
"learning_rate": 1.718362100645527e-05,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13698981702327728,
"step": 2605,
"valid_targets_mean": 4957.6,
"valid_targets_min": 1130
},
{
"epoch": 4.142857142857143,
"grad_norm": 0.4006124579380861,
"learning_rate": 1.710527874685129e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13815411925315857,
"step": 2610,
"valid_targets_mean": 6126.5,
"valid_targets_min": 855
},
{
"epoch": 4.150793650793651,
"grad_norm": 0.4714675135702414,
"learning_rate": 1.702698182747942e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14571262896060944,
"step": 2615,
"valid_targets_mean": 4147.3,
"valid_targets_min": 284
},
{
"epoch": 4.158730158730159,
"grad_norm": 0.42920831749050425,
"learning_rate": 1.6948731474710075e-05,
"loss": 0.1328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13257333636283875,
"step": 2620,
"valid_targets_mean": 5335.2,
"valid_targets_min": 618
},
{
"epoch": 4.166666666666667,
"grad_norm": 0.48356837750736714,
"learning_rate": 1.68705289141843e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1508401334285736,
"step": 2625,
"valid_targets_mean": 6277.6,
"valid_targets_min": 2995
},
{
"epoch": 4.174603174603175,
"grad_norm": 0.4755928358851968,
"learning_rate": 1.679237537079454e-05,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14255402982234955,
"step": 2630,
"valid_targets_mean": 4744.4,
"valid_targets_min": 466
},
{
"epoch": 4.182539682539683,
"grad_norm": 0.41585215382481877,
"learning_rate": 1.6714272068665526e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13894084095954895,
"step": 2635,
"valid_targets_mean": 5902.4,
"valid_targets_min": 838
},
{
"epoch": 4.190476190476191,
"grad_norm": 0.4189696451329358,
"learning_rate": 1.663622023113501e-05,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1487642228603363,
"step": 2640,
"valid_targets_mean": 6358.3,
"valid_targets_min": 3083
},
{
"epoch": 4.198412698412699,
"grad_norm": 0.44087488345238157,
"learning_rate": 1.655822108073467e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14662505686283112,
"step": 2645,
"valid_targets_mean": 5523.2,
"valid_targets_min": 1561
},
{
"epoch": 4.2063492063492065,
"grad_norm": 0.47060099939704136,
"learning_rate": 1.648027583917095e-05,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13752037286758423,
"step": 2650,
"valid_targets_mean": 5949.6,
"valid_targets_min": 2002
},
{
"epoch": 4.214285714285714,
"grad_norm": 0.4223944809526827,
"learning_rate": 1.640238572730591e-05,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14241717755794525,
"step": 2655,
"valid_targets_mean": 5939.1,
"valid_targets_min": 1808
},
{
"epoch": 4.222222222222222,
"grad_norm": 0.3989848199161138,
"learning_rate": 1.632455196513809e-05,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15084542334079742,
"step": 2660,
"valid_targets_mean": 6282.1,
"valid_targets_min": 3096
},
{
"epoch": 4.23015873015873,
"grad_norm": 0.4334279841268595,
"learning_rate": 1.624677577178345e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15273742377758026,
"step": 2665,
"valid_targets_mean": 5628.8,
"valid_targets_min": 2067
},
{
"epoch": 4.238095238095238,
"grad_norm": 0.5090603717967935,
"learning_rate": 1.616905836545624e-05,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14674241840839386,
"step": 2670,
"valid_targets_mean": 4538.6,
"valid_targets_min": 294
},
{
"epoch": 4.246031746031746,
"grad_norm": 0.40233869436893316,
"learning_rate": 1.6091400963449894e-05,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16291236877441406,
"step": 2675,
"valid_targets_mean": 5911.8,
"valid_targets_min": 1450
},
{
"epoch": 4.253968253968254,
"grad_norm": 0.46919428409154407,
"learning_rate": 1.6013804782118043e-05,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15669263899326324,
"step": 2680,
"valid_targets_mean": 4653.7,
"valid_targets_min": 1195
},
{
"epoch": 4.261904761904762,
"grad_norm": 0.46975419177737526,
"learning_rate": 1.5936271036855372e-05,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15147748589515686,
"step": 2685,
"valid_targets_mean": 6341.4,
"valid_targets_min": 3029
},
{
"epoch": 4.26984126984127,
"grad_norm": 0.416023668049094,
"learning_rate": 1.585880094207864e-05,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15425267815589905,
"step": 2690,
"valid_targets_mean": 5568.8,
"valid_targets_min": 2137
},
{
"epoch": 4.277777777777778,
"grad_norm": 0.48941294002103736,
"learning_rate": 1.5781395711207664e-05,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16209441423416138,
"step": 2695,
"valid_targets_mean": 5182.4,
"valid_targets_min": 3065
},
{
"epoch": 4.285714285714286,
"grad_norm": 0.4233678017768594,
"learning_rate": 1.5704056556646255e-05,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15272748470306396,
"step": 2700,
"valid_targets_mean": 6165.9,
"valid_targets_min": 289
},
{
"epoch": 4.2936507936507935,
"grad_norm": 0.4883272680118086,
"learning_rate": 1.562678468976329e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14731578528881073,
"step": 2705,
"valid_targets_mean": 3793.1,
"valid_targets_min": 268
},
{
"epoch": 4.301587301587301,
"grad_norm": 0.4278181836239168,
"learning_rate": 1.5549581320873715e-05,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14064767956733704,
"step": 2710,
"valid_targets_mean": 6504.5,
"valid_targets_min": 2638
},
{
"epoch": 4.309523809523809,
"grad_norm": 0.44190091334584447,
"learning_rate": 1.5472447659219573e-05,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1606476753950119,
"step": 2715,
"valid_targets_mean": 5205.2,
"valid_targets_min": 1350
},
{
"epoch": 4.317460317460317,
"grad_norm": 0.4287418443341925,
"learning_rate": 1.5395384912951096e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.143661230802536,
"step": 2720,
"valid_targets_mean": 5759.1,
"valid_targets_min": 539
},
{
"epoch": 4.325396825396825,
"grad_norm": 0.431052688233739,
"learning_rate": 1.531839428910774e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13569197058677673,
"step": 2725,
"valid_targets_mean": 5779.1,
"valid_targets_min": 2902
},
{
"epoch": 4.333333333333333,
"grad_norm": 0.4462658898939222,
"learning_rate": 1.5241476993599318e-05,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15712681412696838,
"step": 2730,
"valid_targets_mean": 5659.5,
"valid_targets_min": 719
},
{
"epoch": 4.341269841269841,
"grad_norm": 0.4365063885634691,
"learning_rate": 1.5164634231187106e-05,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14231045544147491,
"step": 2735,
"valid_targets_mean": 5411.6,
"valid_targets_min": 1293
},
{
"epoch": 4.349206349206349,
"grad_norm": 0.3675606877485401,
"learning_rate": 1.5087867205464933e-05,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12964603304862976,
"step": 2740,
"valid_targets_mean": 6364.4,
"valid_targets_min": 281
},
{
"epoch": 4.357142857142857,
"grad_norm": 0.44160911003260395,
"learning_rate": 1.5011177118840376e-05,
"loss": 0.1414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1406039297580719,
"step": 2745,
"valid_targets_mean": 5633.9,
"valid_targets_min": 403
},
{
"epoch": 4.365079365079365,
"grad_norm": 0.45789145016787364,
"learning_rate": 1.4934565172515917e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16867199540138245,
"step": 2750,
"valid_targets_mean": 4970.6,
"valid_targets_min": 2561
},
{
"epoch": 4.3730158730158735,
"grad_norm": 0.41734019364461133,
"learning_rate": 1.4858032566470107e-05,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14065919816493988,
"step": 2755,
"valid_targets_mean": 6324.4,
"valid_targets_min": 2455
},
{
"epoch": 4.380952380952381,
"grad_norm": 0.40415096511524873,
"learning_rate": 1.4781580499438794e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13654825091362,
"step": 2760,
"valid_targets_mean": 5964.2,
"valid_targets_min": 300
},
{
"epoch": 4.388888888888889,
"grad_norm": 0.40778882084936363,
"learning_rate": 1.4705210168896327e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12639005482196808,
"step": 2765,
"valid_targets_mean": 5996.9,
"valid_targets_min": 2114
},
{
"epoch": 4.396825396825397,
"grad_norm": 0.44063352236267495,
"learning_rate": 1.462892277103681e-05,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14338403940200806,
"step": 2770,
"valid_targets_mean": 5152.0,
"valid_targets_min": 487
},
{
"epoch": 4.404761904761905,
"grad_norm": 0.3874565040882736,
"learning_rate": 1.455271950075539e-05,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14000162482261658,
"step": 2775,
"valid_targets_mean": 5943.4,
"valid_targets_min": 3591
},
{
"epoch": 4.412698412698413,
"grad_norm": 0.3941349722942052,
"learning_rate": 1.4476601551629493e-05,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1478402018547058,
"step": 2780,
"valid_targets_mean": 6708.7,
"valid_targets_min": 3502
},
{
"epoch": 4.420634920634921,
"grad_norm": 0.41875630131970193,
"learning_rate": 1.4400570115900147e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15849897265434265,
"step": 2785,
"valid_targets_mean": 5522.6,
"valid_targets_min": 865
},
{
"epoch": 4.428571428571429,
"grad_norm": 0.5412264352868692,
"learning_rate": 1.4324626384453345e-05,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12859734892845154,
"step": 2790,
"valid_targets_mean": 4754.4,
"valid_targets_min": 1324
},
{
"epoch": 4.436507936507937,
"grad_norm": 0.42316575140054596,
"learning_rate": 1.4248771546801339e-05,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14226463437080383,
"step": 2795,
"valid_targets_mean": 5423.4,
"valid_targets_min": 776
},
{
"epoch": 4.444444444444445,
"grad_norm": 0.431013383627872,
"learning_rate": 1.4173006791064023e-05,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14574524760246277,
"step": 2800,
"valid_targets_mean": 5876.1,
"valid_targets_min": 2317
},
{
"epoch": 4.4523809523809526,
"grad_norm": 0.4037541081664408,
"learning_rate": 1.4097333303950368e-05,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440451443195343,
"step": 2805,
"valid_targets_mean": 5450.2,
"valid_targets_min": 1747
},
{
"epoch": 4.4603174603174605,
"grad_norm": 0.3978151834112168,
"learning_rate": 1.4021752270739759e-05,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14280155301094055,
"step": 2810,
"valid_targets_mean": 6047.3,
"valid_targets_min": 2885
},
{
"epoch": 4.468253968253968,
"grad_norm": 0.39606766776930213,
"learning_rate": 1.3946264875263485e-05,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13499273359775543,
"step": 2815,
"valid_targets_mean": 5398.1,
"valid_targets_min": 881
},
{
"epoch": 4.476190476190476,
"grad_norm": 0.41951195439714245,
"learning_rate": 1.3870872299886184e-05,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15680038928985596,
"step": 2820,
"valid_targets_mean": 6016.8,
"valid_targets_min": 953
},
{
"epoch": 4.484126984126984,
"grad_norm": 0.6264261787683508,
"learning_rate": 1.3795575725487303e-05,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16164864599704742,
"step": 2825,
"valid_targets_mean": 5240.9,
"valid_targets_min": 1700
},
{
"epoch": 4.492063492063492,
"grad_norm": 0.8311634034364538,
"learning_rate": 1.3720376331442652e-05,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18453676998615265,
"step": 2830,
"valid_targets_mean": 6361.3,
"valid_targets_min": 3395
},
{
"epoch": 4.5,
"grad_norm": 0.42732218297283503,
"learning_rate": 1.364527529560586e-05,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15269696712493896,
"step": 2835,
"valid_targets_mean": 5456.8,
"valid_targets_min": 297
},
{
"epoch": 4.507936507936508,
"grad_norm": 0.39922258358961354,
"learning_rate": 1.3570273794289978e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15746167302131653,
"step": 2840,
"valid_targets_mean": 5865.9,
"valid_targets_min": 1646
},
{
"epoch": 4.515873015873016,
"grad_norm": 0.4249607848655103,
"learning_rate": 1.3495373002249061e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14502134919166565,
"step": 2845,
"valid_targets_mean": 5561.5,
"valid_targets_min": 2046
},
{
"epoch": 4.523809523809524,
"grad_norm": 0.45992538161194857,
"learning_rate": 1.3420574092659713e-05,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13943564891815186,
"step": 2850,
"valid_targets_mean": 4809.2,
"valid_targets_min": 299
},
{
"epoch": 4.531746031746032,
"grad_norm": 0.4849743503805474,
"learning_rate": 1.3345878237102766e-05,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.140847310423851,
"step": 2855,
"valid_targets_mean": 4423.5,
"valid_targets_min": 566
},
{
"epoch": 4.5396825396825395,
"grad_norm": 0.4337324469927627,
"learning_rate": 1.3271286605544906e-05,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1428968906402588,
"step": 2860,
"valid_targets_mean": 5831.9,
"valid_targets_min": 1871
},
{
"epoch": 4.5476190476190474,
"grad_norm": 0.46560324944354126,
"learning_rate": 1.3196800366320357e-05,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14274823665618896,
"step": 2865,
"valid_targets_mean": 4730.6,
"valid_targets_min": 283
},
{
"epoch": 4.555555555555555,
"grad_norm": 0.44153707002684167,
"learning_rate": 1.3122420686112554e-05,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14780506491661072,
"step": 2870,
"valid_targets_mean": 4814.2,
"valid_targets_min": 604
},
{
"epoch": 4.563492063492063,
"grad_norm": 0.4539431427613466,
"learning_rate": 1.3048148729935917e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18015024065971375,
"step": 2875,
"valid_targets_mean": 5631.1,
"valid_targets_min": 275
},
{
"epoch": 4.571428571428571,
"grad_norm": 0.42536670553586153,
"learning_rate": 1.297398566111756e-05,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14803089201450348,
"step": 2880,
"valid_targets_mean": 5638.5,
"valid_targets_min": 2487
},
{
"epoch": 4.579365079365079,
"grad_norm": 0.42937048670828487,
"learning_rate": 1.2899932641279082e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13798286020755768,
"step": 2885,
"valid_targets_mean": 4947.8,
"valid_targets_min": 299
},
{
"epoch": 4.587301587301587,
"grad_norm": 0.4404250376238387,
"learning_rate": 1.2825990830318395e-05,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17519637942314148,
"step": 2890,
"valid_targets_mean": 5130.4,
"valid_targets_min": 1535
},
{
"epoch": 4.595238095238095,
"grad_norm": 0.4758481215827844,
"learning_rate": 1.2752161386391526e-05,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13737112283706665,
"step": 2895,
"valid_targets_mean": 4636.4,
"valid_targets_min": 293
},
{
"epoch": 4.603174603174603,
"grad_norm": 0.4767645902681976,
"learning_rate": 1.2678445465894491e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16972827911376953,
"step": 2900,
"valid_targets_mean": 4518.6,
"valid_targets_min": 1195
},
{
"epoch": 4.611111111111111,
"grad_norm": 0.4257119901155639,
"learning_rate": 1.2604844223445181e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15088322758674622,
"step": 2905,
"valid_targets_mean": 5354.5,
"valid_targets_min": 870
},
{
"epoch": 4.619047619047619,
"grad_norm": 0.42846734809049425,
"learning_rate": 1.2531358811865268e-05,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15017569065093994,
"step": 2910,
"valid_targets_mean": 5312.0,
"valid_targets_min": 737
},
{
"epoch": 4.6269841269841265,
"grad_norm": 0.4925025724969061,
"learning_rate": 1.2457990382162173e-05,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1452239453792572,
"step": 2915,
"valid_targets_mean": 4835.2,
"valid_targets_min": 656
},
{
"epoch": 4.634920634920634,
"grad_norm": 0.4662611029234124,
"learning_rate": 1.238474008351101e-05,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15926414728164673,
"step": 2920,
"valid_targets_mean": 5120.9,
"valid_targets_min": 674
},
{
"epoch": 4.642857142857143,
"grad_norm": 0.4322145630104494,
"learning_rate": 1.2311609063236594e-05,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1390167623758316,
"step": 2925,
"valid_targets_mean": 4672.6,
"valid_targets_min": 1746
},
{
"epoch": 4.650793650793651,
"grad_norm": 0.4130969360637945,
"learning_rate": 1.2238598466795493e-05,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12715992331504822,
"step": 2930,
"valid_targets_mean": 5706.3,
"valid_targets_min": 1765
},
{
"epoch": 4.658730158730159,
"grad_norm": 0.3829382672782595,
"learning_rate": 1.2165709437758042e-05,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14774689078330994,
"step": 2935,
"valid_targets_mean": 6549.7,
"valid_targets_min": 3799
},
{
"epoch": 4.666666666666667,
"grad_norm": 0.38939915661022567,
"learning_rate": 1.209294311779047e-05,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14104187488555908,
"step": 2940,
"valid_targets_mean": 6312.2,
"valid_targets_min": 2275
},
{
"epoch": 4.674603174603175,
"grad_norm": 0.43181417781915576,
"learning_rate": 1.2020300646637018e-05,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11396326869726181,
"step": 2945,
"valid_targets_mean": 5581.9,
"valid_targets_min": 260
},
{
"epoch": 4.682539682539683,
"grad_norm": 0.44410129386120123,
"learning_rate": 1.1947783162102043e-05,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1418922394514084,
"step": 2950,
"valid_targets_mean": 4655.8,
"valid_targets_min": 693
},
{
"epoch": 4.690476190476191,
"grad_norm": 0.48458127033747794,
"learning_rate": 1.1875391800032248e-05,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1841154396533966,
"step": 2955,
"valid_targets_mean": 4632.9,
"valid_targets_min": 313
},
{
"epoch": 4.698412698412699,
"grad_norm": 0.4032339427441577,
"learning_rate": 1.1803127694298873e-05,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14213016629219055,
"step": 2960,
"valid_targets_mean": 5584.8,
"valid_targets_min": 934
},
{
"epoch": 4.7063492063492065,
"grad_norm": 0.4419975398132066,
"learning_rate": 1.173099197677992e-05,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1430945247411728,
"step": 2965,
"valid_targets_mean": 5749.8,
"valid_targets_min": 2081
},
{
"epoch": 4.714285714285714,
"grad_norm": 0.43503178571092443,
"learning_rate": 1.1658985777342458e-05,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14752447605133057,
"step": 2970,
"valid_targets_mean": 5720.0,
"valid_targets_min": 1862
},
{
"epoch": 4.722222222222222,
"grad_norm": 0.42023994518841934,
"learning_rate": 1.1587110223824874e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15875454246997833,
"step": 2975,
"valid_targets_mean": 5639.4,
"valid_targets_min": 1270
},
{
"epoch": 4.73015873015873,
"grad_norm": 0.37363144454032915,
"learning_rate": 1.151536644201925e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11643218994140625,
"step": 2980,
"valid_targets_mean": 5878.9,
"valid_targets_min": 1841
},
{
"epoch": 4.738095238095238,
"grad_norm": 0.44030969849082424,
"learning_rate": 1.1443755555653751e-05,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15411710739135742,
"step": 2985,
"valid_targets_mean": 4914.2,
"valid_targets_min": 1221
},
{
"epoch": 4.746031746031746,
"grad_norm": 0.41262993153981603,
"learning_rate": 1.1372278686374935e-05,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1678827404975891,
"step": 2990,
"valid_targets_mean": 5873.3,
"valid_targets_min": 1320
},
{
"epoch": 4.753968253968254,
"grad_norm": 0.4311749330104684,
"learning_rate": 1.1300936953730273e-05,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.143174409866333,
"step": 2995,
"valid_targets_mean": 5119.6,
"valid_targets_min": 752
},
{
"epoch": 4.761904761904762,
"grad_norm": 0.361954540458806,
"learning_rate": 1.1229731475150594e-05,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13922378420829773,
"step": 3000,
"valid_targets_mean": 6611.1,
"valid_targets_min": 3655
},
{
"epoch": 4.76984126984127,
"grad_norm": 0.3966366790173581,
"learning_rate": 1.1158663365932529e-05,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15058225393295288,
"step": 3005,
"valid_targets_mean": 5934.8,
"valid_targets_min": 3133
},
{
"epoch": 4.777777777777778,
"grad_norm": 0.4612543471363477,
"learning_rate": 1.1087733739221109e-05,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15629416704177856,
"step": 3010,
"valid_targets_mean": 4712.2,
"valid_targets_min": 285
},
{
"epoch": 4.785714285714286,
"grad_norm": 0.38989272621213816,
"learning_rate": 1.1016943705992311e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1398439258337021,
"step": 3015,
"valid_targets_mean": 6174.9,
"valid_targets_min": 2064
},
{
"epoch": 4.7936507936507935,
"grad_norm": 0.4371800342017838,
"learning_rate": 1.0946294375035639e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1522529125213623,
"step": 3020,
"valid_targets_mean": 4937.9,
"valid_targets_min": 820
},
{
"epoch": 4.801587301587301,
"grad_norm": 0.5205141553470364,
"learning_rate": 1.087578685293674e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15628096461296082,
"step": 3025,
"valid_targets_mean": 5111.9,
"valid_targets_min": 295
},
{
"epoch": 4.809523809523809,
"grad_norm": 0.4077302471049976,
"learning_rate": 1.080542224406015e-05,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14736653864383698,
"step": 3030,
"valid_targets_mean": 5978.1,
"valid_targets_min": 522
},
{
"epoch": 4.817460317460317,
"grad_norm": 0.4091248100895989,
"learning_rate": 1.0735201650531915e-05,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1352832168340683,
"step": 3035,
"valid_targets_mean": 5664.2,
"valid_targets_min": 2353
},
{
"epoch": 4.825396825396825,
"grad_norm": 0.3968540500697524,
"learning_rate": 1.066512617222235e-05,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12752054631710052,
"step": 3040,
"valid_targets_mean": 6093.6,
"valid_targets_min": 1203
},
{
"epoch": 4.833333333333333,
"grad_norm": 0.3642854376590935,
"learning_rate": 1.059519690672884e-05,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15932929515838623,
"step": 3045,
"valid_targets_mean": 7128.1,
"valid_targets_min": 2558
},
{
"epoch": 4.841269841269841,
"grad_norm": 0.38602348967427114,
"learning_rate": 1.0525414949358614e-05,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1197904720902443,
"step": 3050,
"valid_targets_mean": 5888.0,
"valid_targets_min": 2560
},
{
"epoch": 4.849206349206349,
"grad_norm": 0.510022835675847,
"learning_rate": 1.0455781393111613e-05,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14147284626960754,
"step": 3055,
"valid_targets_mean": 5739.3,
"valid_targets_min": 1793
},
{
"epoch": 4.857142857142857,
"grad_norm": 0.6751258587414498,
"learning_rate": 1.0386297328663353e-05,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16436898708343506,
"step": 3060,
"valid_targets_mean": 6290.2,
"valid_targets_min": 440
},
{
"epoch": 4.865079365079366,
"grad_norm": 0.4424084854510193,
"learning_rate": 1.0316963844347843e-05,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15425124764442444,
"step": 3065,
"valid_targets_mean": 5844.6,
"valid_targets_min": 2170
},
{
"epoch": 4.8730158730158735,
"grad_norm": 0.4168794838811193,
"learning_rate": 1.0247782026140576e-05,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13188251852989197,
"step": 3070,
"valid_targets_mean": 5396.5,
"valid_targets_min": 1348
},
{
"epoch": 4.880952380952381,
"grad_norm": 0.49315142334278483,
"learning_rate": 1.017875295764144e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13740713894367218,
"step": 3075,
"valid_targets_mean": 5882.2,
"valid_targets_min": 538
},
{
"epoch": 4.888888888888889,
"grad_norm": 0.4543689569217225,
"learning_rate": 1.0109877720057818e-05,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16015523672103882,
"step": 3080,
"valid_targets_mean": 5451.6,
"valid_targets_min": 2056
},
{
"epoch": 4.896825396825397,
"grad_norm": 0.36802504019714555,
"learning_rate": 1.0041157392187651e-05,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11829912662506104,
"step": 3085,
"valid_targets_mean": 5831.1,
"valid_targets_min": 2830
},
{
"epoch": 4.904761904761905,
"grad_norm": 0.3966134482676806,
"learning_rate": 9.972593050402471e-06,
"loss": 0.1412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14243818819522858,
"step": 3090,
"valid_targets_mean": 6406.8,
"valid_targets_min": 1428
},
{
"epoch": 4.912698412698413,
"grad_norm": 0.4183961944811586,
"learning_rate": 9.904185768630612e-06,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16794633865356445,
"step": 3095,
"valid_targets_mean": 6009.8,
"valid_targets_min": 3070
},
{
"epoch": 4.920634920634921,
"grad_norm": 0.44212723748685295,
"learning_rate": 9.835936618340377e-06,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14964662492275238,
"step": 3100,
"valid_targets_mean": 4590.1,
"valid_targets_min": 1122
},
{
"epoch": 4.928571428571429,
"grad_norm": 0.41070340267056166,
"learning_rate": 9.76784666852323e-06,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12387900054454803,
"step": 3105,
"valid_targets_mean": 6402.7,
"valid_targets_min": 3540
},
{
"epoch": 4.936507936507937,
"grad_norm": 0.44233711675764437,
"learning_rate": 9.699916985677062e-06,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1574784517288208,
"step": 3110,
"valid_targets_mean": 4382.4,
"valid_targets_min": 920
},
{
"epoch": 4.944444444444445,
"grad_norm": 0.46887051592133433,
"learning_rate": 9.6321486337895e-06,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15827694535255432,
"step": 3115,
"valid_targets_mean": 5222.6,
"valid_targets_min": 1313
},
{
"epoch": 4.9523809523809526,
"grad_norm": 0.41511980613828253,
"learning_rate": 9.564542674321228e-06,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14313764870166779,
"step": 3120,
"valid_targets_mean": 5663.2,
"valid_targets_min": 800
},
{
"epoch": 4.9603174603174605,
"grad_norm": 0.4621864142346036,
"learning_rate": 9.49710016618937e-06,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15151920914649963,
"step": 3125,
"valid_targets_mean": 5380.6,
"valid_targets_min": 313
},
{
"epoch": 4.968253968253968,
"grad_norm": 0.48527019717345327,
"learning_rate": 9.429822165750893e-06,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14661577343940735,
"step": 3130,
"valid_targets_mean": 4398.2,
"valid_targets_min": 633
},
{
"epoch": 4.976190476190476,
"grad_norm": 0.3831996919641483,
"learning_rate": 9.36270972678607e-06,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13461735844612122,
"step": 3135,
"valid_targets_mean": 6052.1,
"valid_targets_min": 1578
},
{
"epoch": 4.984126984126984,
"grad_norm": 0.4100072649060219,
"learning_rate": 9.295763900481977e-06,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12445595860481262,
"step": 3140,
"valid_targets_mean": 5427.4,
"valid_targets_min": 307
},
{
"epoch": 4.992063492063492,
"grad_norm": 0.46254552204793853,
"learning_rate": 9.22898573541602e-06,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16388916969299316,
"step": 3145,
"valid_targets_mean": 5861.9,
"valid_targets_min": 2467
},
{
"epoch": 5.0,
"grad_norm": 0.40795669884699387,
"learning_rate": 9.162376277539513e-06,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15090236067771912,
"step": 3150,
"valid_targets_mean": 5592.5,
"valid_targets_min": 1990
},
{
"epoch": 5.007936507936508,
"grad_norm": 0.3857823068068869,
"learning_rate": 9.095936570161301e-06,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14320944249629974,
"step": 3155,
"valid_targets_mean": 5639.6,
"valid_targets_min": 260
},
{
"epoch": 5.015873015873016,
"grad_norm": 0.5435449453461013,
"learning_rate": 9.029667653931411e-06,
"loss": 0.1325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1401306390762329,
"step": 3160,
"valid_targets_mean": 5760.2,
"valid_targets_min": 371
},
{
"epoch": 5.023809523809524,
"grad_norm": 0.6789857642195729,
"learning_rate": 8.96357056682475e-06,
"loss": 0.1367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12801998853683472,
"step": 3165,
"valid_targets_mean": 5610.3,
"valid_targets_min": 522
},
{
"epoch": 5.031746031746032,
"grad_norm": 0.38873846063838485,
"learning_rate": 8.897646344124882e-06,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11531123518943787,
"step": 3170,
"valid_targets_mean": 6343.7,
"valid_targets_min": 2461
},
{
"epoch": 5.0396825396825395,
"grad_norm": 0.4632360566976383,
"learning_rate": 8.83189601840773e-06,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14523249864578247,
"step": 3175,
"valid_targets_mean": 5589.1,
"valid_targets_min": 1310
},
{
"epoch": 5.0476190476190474,
"grad_norm": 0.44480606265136036,
"learning_rate": 8.766320619525511e-06,
"loss": 0.1405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1437515914440155,
"step": 3180,
"valid_targets_mean": 5137.6,
"valid_targets_min": 1450
},
{
"epoch": 5.055555555555555,
"grad_norm": 0.40620681435947337,
"learning_rate": 8.700921174590525e-06,
"loss": 0.1357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13447782397270203,
"step": 3185,
"valid_targets_mean": 6346.1,
"valid_targets_min": 4150
},
{
"epoch": 5.063492063492063,
"grad_norm": 0.46662620571823504,
"learning_rate": 8.63569870795907e-06,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14662285149097443,
"step": 3190,
"valid_targets_mean": 6060.2,
"valid_targets_min": 1308
},
{
"epoch": 5.071428571428571,
"grad_norm": 0.4654130995805731,
"learning_rate": 8.570654241215466e-06,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14438563585281372,
"step": 3195,
"valid_targets_mean": 5318.1,
"valid_targets_min": 1095
},
{
"epoch": 5.079365079365079,
"grad_norm": 0.40240677129462593,
"learning_rate": 8.505788793155978e-06,
"loss": 0.1285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11840318888425827,
"step": 3200,
"valid_targets_mean": 6147.7,
"valid_targets_min": 403
},
{
"epoch": 5.087301587301587,
"grad_norm": 0.5552645220273652,
"learning_rate": 8.441103379772893e-06,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15520301461219788,
"step": 3205,
"valid_targets_mean": 5761.9,
"valid_targets_min": 1220
},
{
"epoch": 5.095238095238095,
"grad_norm": 0.4847744229611747,
"learning_rate": 8.376599014238605e-06,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12781260907649994,
"step": 3210,
"valid_targets_mean": 5049.5,
"valid_targets_min": 2182
},
{
"epoch": 5.103174603174603,
"grad_norm": 0.4448058887555173,
"learning_rate": 8.312276706889738e-06,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14810214936733246,
"step": 3215,
"valid_targets_mean": 4893.2,
"valid_targets_min": 712
},
{
"epoch": 5.111111111111111,
"grad_norm": 0.3769447002552102,
"learning_rate": 8.24813746521133e-06,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11988615989685059,
"step": 3220,
"valid_targets_mean": 6354.1,
"valid_targets_min": 552
},
{
"epoch": 5.119047619047619,
"grad_norm": 0.40775763269992454,
"learning_rate": 8.184182293821046e-06,
"loss": 0.1335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13774478435516357,
"step": 3225,
"valid_targets_mean": 6155.4,
"valid_targets_min": 1769
},
{
"epoch": 5.1269841269841265,
"grad_norm": 0.4621791306803943,
"learning_rate": 8.120412194453442e-06,
"loss": 0.1297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13131381571292877,
"step": 3230,
"valid_targets_mean": 5662.6,
"valid_targets_min": 1704
},
{
"epoch": 5.134920634920635,
"grad_norm": 0.47477190317994294,
"learning_rate": 8.056828165944282e-06,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11765207350254059,
"step": 3235,
"valid_targets_mean": 4793.4,
"valid_targets_min": 556
},
{
"epoch": 5.142857142857143,
"grad_norm": 0.4211817590749248,
"learning_rate": 7.993431204214883e-06,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.140112042427063,
"step": 3240,
"valid_targets_mean": 6042.8,
"valid_targets_min": 2069
},
{
"epoch": 5.150793650793651,
"grad_norm": 0.4100200812051378,
"learning_rate": 7.93022230225652e-06,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1306135654449463,
"step": 3245,
"valid_targets_mean": 5446.9,
"valid_targets_min": 1408
},
{
"epoch": 5.158730158730159,
"grad_norm": 0.4654477832902761,
"learning_rate": 7.867202450114892e-06,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1470104455947876,
"step": 3250,
"valid_targets_mean": 4906.9,
"valid_targets_min": 483
},
{
"epoch": 5.166666666666667,
"grad_norm": 0.523468892447528,
"learning_rate": 7.804372634874582e-06,
"loss": 0.1356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13795553147792816,
"step": 3255,
"valid_targets_mean": 4284.5,
"valid_targets_min": 1195
},
{
"epoch": 5.174603174603175,
"grad_norm": 0.6078996381505655,
"learning_rate": 7.74173384064359e-06,
"loss": 0.1355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1462775468826294,
"step": 3260,
"valid_targets_mean": 5041.4,
"valid_targets_min": 1305
},
{
"epoch": 5.182539682539683,
"grad_norm": 0.4607675067323951,
"learning_rate": 7.679287048537987e-06,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1391090750694275,
"step": 3265,
"valid_targets_mean": 5745.2,
"valid_targets_min": 336
},
{
"epoch": 5.190476190476191,
"grad_norm": 0.4923341770949091,
"learning_rate": 7.617033236666469e-06,
"loss": 0.1331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1512683480978012,
"step": 3270,
"valid_targets_mean": 4856.6,
"valid_targets_min": 860
},
{
"epoch": 5.198412698412699,
"grad_norm": 0.4823935955118556,
"learning_rate": 7.55497338011506e-06,
"loss": 0.133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12928101420402527,
"step": 3275,
"valid_targets_mean": 5083.1,
"valid_targets_min": 674
},
{
"epoch": 5.2063492063492065,
"grad_norm": 0.4571859304803118,
"learning_rate": 7.493108450931879e-06,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.147546648979187,
"step": 3280,
"valid_targets_mean": 5298.1,
"valid_targets_min": 584
},
{
"epoch": 5.214285714285714,
"grad_norm": 0.4656323081387472,
"learning_rate": 7.4314394181118636e-06,
"loss": 0.1455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13368697464466095,
"step": 3285,
"valid_targets_mean": 5323.8,
"valid_targets_min": 1007
},
{
"epoch": 5.222222222222222,
"grad_norm": 0.47778320363976773,
"learning_rate": 7.369967247581611e-06,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14050470292568207,
"step": 3290,
"valid_targets_mean": 4988.6,
"valid_targets_min": 1255
},
{
"epoch": 5.23015873015873,
"grad_norm": 0.47185902185121587,
"learning_rate": 7.3086929021842575e-06,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14221060276031494,
"step": 3295,
"valid_targets_mean": 4921.3,
"valid_targets_min": 778
},
{
"epoch": 5.238095238095238,
"grad_norm": 0.40677949622794063,
"learning_rate": 7.247617341664384e-06,
"loss": 0.141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15191778540611267,
"step": 3300,
"valid_targets_mean": 6783.2,
"valid_targets_min": 2108
},
{
"epoch": 5.246031746031746,
"grad_norm": 0.5597275095189963,
"learning_rate": 7.186741522652994e-06,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1412215381860733,
"step": 3305,
"valid_targets_mean": 5306.6,
"valid_targets_min": 1796
},
{
"epoch": 5.253968253968254,
"grad_norm": 0.4136667615907917,
"learning_rate": 7.12606639865252e-06,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13404718041419983,
"step": 3310,
"valid_targets_mean": 5412.3,
"valid_targets_min": 838
},
{
"epoch": 5.261904761904762,
"grad_norm": 0.5072282174178516,
"learning_rate": 7.065592920021893e-06,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1653522104024887,
"step": 3315,
"valid_targets_mean": 5170.6,
"valid_targets_min": 1293
},
{
"epoch": 5.26984126984127,
"grad_norm": 0.43649425013960674,
"learning_rate": 7.005322033961679e-06,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14359837770462036,
"step": 3320,
"valid_targets_mean": 5731.9,
"valid_targets_min": 2041
},
{
"epoch": 5.277777777777778,
"grad_norm": 0.4609844808793299,
"learning_rate": 6.945254684499185e-06,
"loss": 0.1388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14887037873268127,
"step": 3325,
"valid_targets_mean": 5072.8,
"valid_targets_min": 565
},
{
"epoch": 5.285714285714286,
"grad_norm": 0.4423681058460165,
"learning_rate": 6.8853918124737274e-06,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1400473713874817,
"step": 3330,
"valid_targets_mean": 5419.5,
"valid_targets_min": 461
},
{
"epoch": 5.2936507936507935,
"grad_norm": 0.4833740463102983,
"learning_rate": 6.825734355521898e-06,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1373916119337082,
"step": 3335,
"valid_targets_mean": 5413.9,
"valid_targets_min": 285
},
{
"epoch": 5.301587301587301,
"grad_norm": 0.46607539050074326,
"learning_rate": 6.766283248062817e-06,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14503991603851318,
"step": 3340,
"valid_targets_mean": 5005.1,
"valid_targets_min": 1372
},
{
"epoch": 5.309523809523809,
"grad_norm": 0.46602580090763035,
"learning_rate": 6.707039421283559e-06,
"loss": 0.1362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1407843828201294,
"step": 3345,
"valid_targets_mean": 4867.7,
"valid_targets_min": 279
},
{
"epoch": 5.317460317460317,
"grad_norm": 0.4977380166852099,
"learning_rate": 6.648003803124559e-06,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18442052602767944,
"step": 3350,
"valid_targets_mean": 4517.1,
"valid_targets_min": 528
},
{
"epoch": 5.325396825396825,
"grad_norm": 0.45300213871690015,
"learning_rate": 6.589177318265047e-06,
"loss": 0.133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13406887650489807,
"step": 3355,
"valid_targets_mean": 5391.9,
"valid_targets_min": 501
},
{
"epoch": 5.333333333333333,
"grad_norm": 0.4255524573366613,
"learning_rate": 6.53056088810857e-06,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14955641329288483,
"step": 3360,
"valid_targets_mean": 5542.8,
"valid_targets_min": 2458
},
{
"epoch": 5.341269841269841,
"grad_norm": 0.5534775234199173,
"learning_rate": 6.472155430768608e-06,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12088638544082642,
"step": 3365,
"valid_targets_mean": 6366.4,
"valid_targets_min": 1428
},
{
"epoch": 5.349206349206349,
"grad_norm": 0.4364437395513567,
"learning_rate": 6.413961861054132e-06,
"loss": 0.1329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15652699768543243,
"step": 3370,
"valid_targets_mean": 5471.2,
"valid_targets_min": 591
},
{
"epoch": 5.357142857142857,
"grad_norm": 0.45770813360412227,
"learning_rate": 6.3559810904553095e-06,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14036116003990173,
"step": 3375,
"valid_targets_mean": 5520.9,
"valid_targets_min": 256
},
{
"epoch": 5.365079365079365,
"grad_norm": 0.4153555346953972,
"learning_rate": 6.298214027129219e-06,
"loss": 0.1341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13151246309280396,
"step": 3380,
"valid_targets_mean": 6010.9,
"valid_targets_min": 263
},
{
"epoch": 5.3730158730158735,
"grad_norm": 0.4451350722143499,
"learning_rate": 6.240661575885629e-06,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1685609072446823,
"step": 3385,
"valid_targets_mean": 5214.2,
"valid_targets_min": 763
},
{
"epoch": 5.380952380952381,
"grad_norm": 0.46292596088927307,
"learning_rate": 6.183324638172819e-06,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15203514695167542,
"step": 3390,
"valid_targets_mean": 5266.0,
"valid_targets_min": 861
},
{
"epoch": 5.388888888888889,
"grad_norm": 0.4676464235157195,
"learning_rate": 6.126204112063463e-06,
"loss": 0.1353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13088193535804749,
"step": 3395,
"valid_targets_mean": 4737.1,
"valid_targets_min": 1121
},
{
"epoch": 5.396825396825397,
"grad_norm": 0.6797962177962652,
"learning_rate": 6.069300892240564e-06,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16591420769691467,
"step": 3400,
"valid_targets_mean": 4606.3,
"valid_targets_min": 377
},
{
"epoch": 5.404761904761905,
"grad_norm": 0.47267093685643496,
"learning_rate": 6.0126158699834625e-06,
"loss": 0.146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13353607058525085,
"step": 3405,
"valid_targets_mean": 5052.6,
"valid_targets_min": 2020
},
{
"epoch": 5.412698412698413,
"grad_norm": 0.428442687908954,
"learning_rate": 5.956149933153816e-06,
"loss": 0.1318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12273760139942169,
"step": 3410,
"valid_targets_mean": 5588.0,
"valid_targets_min": 2053
},
{
"epoch": 5.420634920634921,
"grad_norm": 0.4412367255518039,
"learning_rate": 5.899903966181751e-06,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14523178339004517,
"step": 3415,
"valid_targets_mean": 5505.2,
"valid_targets_min": 2042
},
{
"epoch": 5.428571428571429,
"grad_norm": 0.43781568976305363,
"learning_rate": 5.843878850052007e-06,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14099499583244324,
"step": 3420,
"valid_targets_mean": 5586.9,
"valid_targets_min": 839
},
{
"epoch": 5.436507936507937,
"grad_norm": 0.46059817758019467,
"learning_rate": 5.788075462290084e-06,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1432957500219345,
"step": 3425,
"valid_targets_mean": 4740.2,
"valid_targets_min": 705
},
{
"epoch": 5.444444444444445,
"grad_norm": 0.415134511085044,
"learning_rate": 5.732494676948554e-06,
"loss": 0.1303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12942150235176086,
"step": 3430,
"valid_targets_mean": 6054.6,
"valid_targets_min": 608
},
{
"epoch": 5.4523809523809526,
"grad_norm": 0.41001838037825894,
"learning_rate": 5.677137364593363e-06,
"loss": 0.1379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14375941455364227,
"step": 3435,
"valid_targets_mean": 5782.4,
"valid_targets_min": 2362
},
{
"epoch": 5.4603174603174605,
"grad_norm": 0.4462203270648477,
"learning_rate": 5.622004392290163e-06,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13974609971046448,
"step": 3440,
"valid_targets_mean": 5166.1,
"valid_targets_min": 1105
},
{
"epoch": 5.468253968253968,
"grad_norm": 0.5621286314149347,
"learning_rate": 5.567096623590758e-06,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14251437783241272,
"step": 3445,
"valid_targets_mean": 5521.8,
"valid_targets_min": 1822
},
{
"epoch": 5.476190476190476,
"grad_norm": 0.3951253389087575,
"learning_rate": 5.512414918519573e-06,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.138666570186615,
"step": 3450,
"valid_targets_mean": 6410.9,
"valid_targets_min": 2903
},
{
"epoch": 5.484126984126984,
"grad_norm": 0.42978600879401685,
"learning_rate": 5.457960133560179e-06,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13873498141765594,
"step": 3455,
"valid_targets_mean": 5563.0,
"valid_targets_min": 2443
},
{
"epoch": 5.492063492063492,
"grad_norm": 0.4763755663272107,
"learning_rate": 5.403733121641883e-06,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14260432124137878,
"step": 3460,
"valid_targets_mean": 5387.6,
"valid_targets_min": 1680
},
{
"epoch": 5.5,
"grad_norm": 0.45865214891995293,
"learning_rate": 5.349734732126366e-06,
"loss": 0.1299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15055881440639496,
"step": 3465,
"valid_targets_mean": 5297.8,
"valid_targets_min": 247
},
{
"epoch": 5.507936507936508,
"grad_norm": 0.4739801326379873,
"learning_rate": 5.295965810794376e-06,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1341158002614975,
"step": 3470,
"valid_targets_mean": 4671.8,
"valid_targets_min": 1946
},
{
"epoch": 5.515873015873016,
"grad_norm": 0.4054624348563083,
"learning_rate": 5.2424271998324895e-06,
"loss": 0.1305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13239628076553345,
"step": 3475,
"valid_targets_mean": 5538.2,
"valid_targets_min": 2317
},
{
"epoch": 5.523809523809524,
"grad_norm": 0.47822327586671515,
"learning_rate": 5.189119737819912e-06,
"loss": 0.1359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13307338953018188,
"step": 3480,
"valid_targets_mean": 5326.6,
"valid_targets_min": 1927
},
{
"epoch": 5.531746031746032,
"grad_norm": 0.45640673731159975,
"learning_rate": 5.136044259715342e-06,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1569247543811798,
"step": 3485,
"valid_targets_mean": 5192.1,
"valid_targets_min": 1402
},
{
"epoch": 5.5396825396825395,
"grad_norm": 0.47606206142121826,
"learning_rate": 5.083201596843905e-06,
"loss": 0.1301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13270564377307892,
"step": 3490,
"valid_targets_mean": 5579.8,
"valid_targets_min": 1802
},
{
"epoch": 5.5476190476190474,
"grad_norm": 0.48207429223420034,
"learning_rate": 5.030592576884117e-06,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1469019204378128,
"step": 3495,
"valid_targets_mean": 5300.8,
"valid_targets_min": 578
},
{
"epoch": 5.555555555555555,
"grad_norm": 0.46920831785621236,
"learning_rate": 4.978218023854928e-06,
"loss": 0.1355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14404523372650146,
"step": 3500,
"valid_targets_mean": 4518.9,
"valid_targets_min": 229
},
{
"epoch": 5.563492063492063,
"grad_norm": 0.42912173167963297,
"learning_rate": 4.926078758102834e-06,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1521531045436859,
"step": 3505,
"valid_targets_mean": 5723.4,
"valid_targets_min": 1020
},
{
"epoch": 5.571428571428571,
"grad_norm": 0.503182430334019,
"learning_rate": 4.87417559628897e-06,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13956725597381592,
"step": 3510,
"valid_targets_mean": 5755.2,
"valid_targets_min": 342
},
{
"epoch": 5.579365079365079,
"grad_norm": 0.483615956667945,
"learning_rate": 4.822509351376399e-06,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15917867422103882,
"step": 3515,
"valid_targets_mean": 4745.8,
"valid_targets_min": 871
},
{
"epoch": 5.587301587301587,
"grad_norm": 0.44843746346045477,
"learning_rate": 4.7710808326173115e-06,
"loss": 0.1376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14553232491016388,
"step": 3520,
"valid_targets_mean": 5322.7,
"valid_targets_min": 949
},
{
"epoch": 5.595238095238095,
"grad_norm": 0.4446428825967545,
"learning_rate": 4.719890845540385e-06,
"loss": 0.1414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1446400284767151,
"step": 3525,
"valid_targets_mean": 5464.6,
"valid_targets_min": 1876
},
{
"epoch": 5.603174603174603,
"grad_norm": 0.44461133087445714,
"learning_rate": 4.668940191938156e-06,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12743496894836426,
"step": 3530,
"valid_targets_mean": 5617.1,
"valid_targets_min": 867
},
{
"epoch": 5.611111111111111,
"grad_norm": 0.46893046808084937,
"learning_rate": 4.618229669854464e-06,
"loss": 0.1357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1406087577342987,
"step": 3535,
"valid_targets_mean": 5965.8,
"valid_targets_min": 2904
},
{
"epoch": 5.619047619047619,
"grad_norm": 0.49547441030459144,
"learning_rate": 4.567760073571947e-06,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14891457557678223,
"step": 3540,
"valid_targets_mean": 4223.9,
"valid_targets_min": 1503
},
{
"epoch": 5.6269841269841265,
"grad_norm": 0.48451923979691575,
"learning_rate": 4.51753219359961e-06,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14008775353431702,
"step": 3545,
"valid_targets_mean": 5037.8,
"valid_targets_min": 2496
},
{
"epoch": 5.634920634920634,
"grad_norm": 0.4290885471458542,
"learning_rate": 4.467546816660433e-06,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1463758647441864,
"step": 3550,
"valid_targets_mean": 6069.6,
"valid_targets_min": 2782
},
{
"epoch": 5.642857142857143,
"grad_norm": 0.4422867985916354,
"learning_rate": 4.417804725679058e-06,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1522657573223114,
"step": 3555,
"valid_targets_mean": 7388.6,
"valid_targets_min": 2410
},
{
"epoch": 5.650793650793651,
"grad_norm": 0.4326771572943575,
"learning_rate": 4.368306699769518e-06,
"loss": 0.1362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13901498913764954,
"step": 3560,
"valid_targets_mean": 5687.3,
"valid_targets_min": 930
},
{
"epoch": 5.658730158730159,
"grad_norm": 0.5184808560608285,
"learning_rate": 4.319053514223033e-06,
"loss": 0.1301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12393245846033096,
"step": 3565,
"valid_targets_mean": 4805.2,
"valid_targets_min": 277
},
{
"epoch": 5.666666666666667,
"grad_norm": 0.4747228961326593,
"learning_rate": 4.270045940495879e-06,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1519310176372528,
"step": 3570,
"valid_targets_mean": 4909.6,
"valid_targets_min": 525
},
{
"epoch": 5.674603174603175,
"grad_norm": 0.4817480251050087,
"learning_rate": 4.221284746197292e-06,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14879171550273895,
"step": 3575,
"valid_targets_mean": 5205.3,
"valid_targets_min": 512
},
{
"epoch": 5.682539682539683,
"grad_norm": 0.5206783763038453,
"learning_rate": 4.172770695077437e-06,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16022273898124695,
"step": 3580,
"valid_targets_mean": 4187.7,
"valid_targets_min": 754
},
{
"epoch": 5.690476190476191,
"grad_norm": 0.42530942051464743,
"learning_rate": 4.124504547015487e-06,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1300957351922989,
"step": 3585,
"valid_targets_mean": 6382.3,
"valid_targets_min": 2232
},
{
"epoch": 5.698412698412699,
"grad_norm": 0.4773846019671863,
"learning_rate": 4.0764870580076675e-06,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17422491312026978,
"step": 3590,
"valid_targets_mean": 5224.0,
"valid_targets_min": 1170
},
{
"epoch": 5.7063492063492065,
"grad_norm": 0.3861656168881239,
"learning_rate": 4.0287189801554304e-06,
"loss": 0.1436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12745806574821472,
"step": 3595,
"valid_targets_mean": 6368.2,
"valid_targets_min": 1124
},
{
"epoch": 5.714285714285714,
"grad_norm": 0.41849044348707654,
"learning_rate": 3.98120106165371e-06,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13698044419288635,
"step": 3600,
"valid_targets_mean": 5723.8,
"valid_targets_min": 2689
},
{
"epoch": 5.722222222222222,
"grad_norm": 0.5006534631008478,
"learning_rate": 3.933934046779164e-06,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15041181445121765,
"step": 3605,
"valid_targets_mean": 4726.2,
"valid_targets_min": 625
},
{
"epoch": 5.73015873015873,
"grad_norm": 0.5390021957931794,
"learning_rate": 3.886918675878513e-06,
"loss": 0.1352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15215769410133362,
"step": 3610,
"valid_targets_mean": 5078.9,
"valid_targets_min": 355
},
{
"epoch": 5.738095238095238,
"grad_norm": 0.4242218655638763,
"learning_rate": 3.840155685356983e-06,
"loss": 0.1313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12816202640533447,
"step": 3615,
"valid_targets_mean": 5724.1,
"valid_targets_min": 2290
},
{
"epoch": 5.746031746031746,
"grad_norm": 0.40905901981368425,
"learning_rate": 3.793645807666735e-06,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12471656501293182,
"step": 3620,
"valid_targets_mean": 6163.4,
"valid_targets_min": 447
},
{
"epoch": 5.753968253968254,
"grad_norm": 0.5134066612062572,
"learning_rate": 3.747389771295411e-06,
"loss": 0.1316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13810807466506958,
"step": 3625,
"valid_targets_mean": 5215.5,
"valid_targets_min": 320
},
{
"epoch": 5.761904761904762,
"grad_norm": 0.44176531273164726,
"learning_rate": 3.701388300754709e-06,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15570278465747833,
"step": 3630,
"valid_targets_mean": 5831.4,
"valid_targets_min": 1928
},
{
"epoch": 5.76984126984127,
"grad_norm": 0.4552213038987976,
"learning_rate": 3.6556421165690516e-06,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13112439215183258,
"step": 3635,
"valid_targets_mean": 5127.6,
"valid_targets_min": 1412
},
{
"epoch": 5.777777777777778,
"grad_norm": 0.5475459293945621,
"learning_rate": 3.610151935264288e-06,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13923147320747375,
"step": 3640,
"valid_targets_mean": 5058.1,
"valid_targets_min": 1271
},
{
"epoch": 5.785714285714286,
"grad_norm": 0.4062383720325422,
"learning_rate": 3.5649184693564797e-06,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12178117781877518,
"step": 3645,
"valid_targets_mean": 6188.1,
"valid_targets_min": 2820
},
{
"epoch": 5.7936507936507935,
"grad_norm": 0.41210477208428037,
"learning_rate": 3.5199424273407277e-06,
"loss": 0.1329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11573171615600586,
"step": 3650,
"valid_targets_mean": 5608.1,
"valid_targets_min": 291
},
{
"epoch": 5.801587301587301,
"grad_norm": 0.39026902409095005,
"learning_rate": 3.4752245136801065e-06,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11422628164291382,
"step": 3655,
"valid_targets_mean": 6121.1,
"valid_targets_min": 919
},
{
"epoch": 5.809523809523809,
"grad_norm": 0.44136839976284375,
"learning_rate": 3.430765428794569e-06,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15087169408798218,
"step": 3660,
"valid_targets_mean": 5458.3,
"valid_targets_min": 663
},
{
"epoch": 5.817460317460317,
"grad_norm": 0.47272488901004456,
"learning_rate": 3.3865658690500424e-06,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12730719149112701,
"step": 3665,
"valid_targets_mean": 5489.8,
"valid_targets_min": 266
},
{
"epoch": 5.825396825396825,
"grad_norm": 0.4286583074647361,
"learning_rate": 3.34262652674749e-06,
"loss": 0.1399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13272640109062195,
"step": 3670,
"valid_targets_mean": 5855.3,
"valid_targets_min": 3739
},
{
"epoch": 5.833333333333333,
"grad_norm": 0.4961674424548416,
"learning_rate": 3.2989480901120684e-06,
"loss": 0.1305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14517953991889954,
"step": 3675,
"valid_targets_mean": 5103.6,
"valid_targets_min": 629
},
{
"epoch": 5.841269841269841,
"grad_norm": 0.5038921133963972,
"learning_rate": 3.2555312432823283e-06,
"loss": 0.1381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14607466757297516,
"step": 3680,
"valid_targets_mean": 4695.1,
"valid_targets_min": 2224
},
{
"epoch": 5.849206349206349,
"grad_norm": 0.4516355692524723,
"learning_rate": 3.2123766662995572e-06,
"loss": 0.1382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13942056894302368,
"step": 3685,
"valid_targets_mean": 5577.4,
"valid_targets_min": 1295
},
{
"epoch": 5.857142857142857,
"grad_norm": 0.43990400419076664,
"learning_rate": 3.1694850350970686e-06,
"loss": 0.1373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14388282597064972,
"step": 3690,
"valid_targets_mean": 5896.1,
"valid_targets_min": 1277
},
{
"epoch": 5.865079365079366,
"grad_norm": 0.4430961156309604,
"learning_rate": 3.1268570214896265e-06,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16903355717658997,
"step": 3695,
"valid_targets_mean": 5768.0,
"valid_targets_min": 309
},
{
"epoch": 5.8730158730158735,
"grad_norm": 0.4687413821050724,
"learning_rate": 3.0844932931629602e-06,
"loss": 0.1389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12664330005645752,
"step": 3700,
"valid_targets_mean": 5469.9,
"valid_targets_min": 582
},
{
"epoch": 5.880952380952381,
"grad_norm": 0.4251478406093825,
"learning_rate": 3.0423945136632626e-06,
"loss": 0.1371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14676138758659363,
"step": 3705,
"valid_targets_mean": 6292.8,
"valid_targets_min": 1166
},
{
"epoch": 5.888888888888889,
"grad_norm": 0.4418913815124218,
"learning_rate": 3.000561342386814e-06,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1596686840057373,
"step": 3710,
"valid_targets_mean": 5276.0,
"valid_targets_min": 656
},
{
"epoch": 5.896825396825397,
"grad_norm": 0.46832139188754646,
"learning_rate": 2.9589944345696596e-06,
"loss": 0.1346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12101615965366364,
"step": 3715,
"valid_targets_mean": 4913.4,
"valid_targets_min": 343
},
{
"epoch": 5.904761904761905,
"grad_norm": 0.4657929056680499,
"learning_rate": 2.9176944412773322e-06,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17338143289089203,
"step": 3720,
"valid_targets_mean": 5412.4,
"valid_targets_min": 554
},
{
"epoch": 5.912698412698413,
"grad_norm": 0.4449595143164407,
"learning_rate": 2.876662009394673e-06,
"loss": 0.1346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15727762877941132,
"step": 3725,
"valid_targets_mean": 5328.9,
"valid_targets_min": 643
},
{
"epoch": 5.920634920634921,
"grad_norm": 0.39696814679103,
"learning_rate": 2.8358977816156796e-06,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11638738214969635,
"step": 3730,
"valid_targets_mean": 6867.2,
"valid_targets_min": 3676
},
{
"epoch": 5.928571428571429,
"grad_norm": 0.47195292364800606,
"learning_rate": 2.7954023964334485e-06,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1505923867225647,
"step": 3735,
"valid_targets_mean": 5757.2,
"valid_targets_min": 704
},
{
"epoch": 5.936507936507937,
"grad_norm": 0.4486759780229958,
"learning_rate": 2.7551764881301955e-06,
"loss": 0.1246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13487672805786133,
"step": 3740,
"valid_targets_mean": 5926.0,
"valid_targets_min": 1024
},
{
"epoch": 5.944444444444445,
"grad_norm": 0.45150456684299833,
"learning_rate": 2.715220686767268e-06,
"loss": 0.1325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13316667079925537,
"step": 3745,
"valid_targets_mean": 5609.4,
"valid_targets_min": 2528
},
{
"epoch": 5.9523809523809526,
"grad_norm": 0.4612924420161714,
"learning_rate": 2.6755356181753247e-06,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17791566252708435,
"step": 3750,
"valid_targets_mean": 5493.9,
"valid_targets_min": 600
},
{
"epoch": 5.9603174603174605,
"grad_norm": 0.4466679622369211,
"learning_rate": 2.6361219039445328e-06,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1417991816997528,
"step": 3755,
"valid_targets_mean": 5531.8,
"valid_targets_min": 3560
},
{
"epoch": 5.968253968253968,
"grad_norm": 0.46290951572004435,
"learning_rate": 2.5969801614147838e-06,
"loss": 0.1455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1562907099723816,
"step": 3760,
"valid_targets_mean": 5726.4,
"valid_targets_min": 325
},
{
"epoch": 5.976190476190476,
"grad_norm": 0.41130105503656605,
"learning_rate": 2.558111003666075e-06,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13213077187538147,
"step": 3765,
"valid_targets_mean": 5965.7,
"valid_targets_min": 1546
},
{
"epoch": 5.984126984126984,
"grad_norm": 0.4305429547314029,
"learning_rate": 2.519515039508893e-06,
"loss": 0.1328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11605265736579895,
"step": 3770,
"valid_targets_mean": 5509.0,
"valid_targets_min": 290
},
{
"epoch": 5.992063492063492,
"grad_norm": 0.43615187162481,
"learning_rate": 2.481192873474667e-06,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13950824737548828,
"step": 3775,
"valid_targets_mean": 5780.9,
"valid_targets_min": 1479
},
{
"epoch": 6.0,
"grad_norm": 0.39743183112610925,
"learning_rate": 2.4431451058062928e-06,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1134757548570633,
"step": 3780,
"valid_targets_mean": 5882.9,
"valid_targets_min": 2457
},
{
"epoch": 6.007936507936508,
"grad_norm": 0.4320579605085731,
"learning_rate": 2.4053723324487677e-06,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12739768624305725,
"step": 3785,
"valid_targets_mean": 4568.0,
"valid_targets_min": 652
},
{
"epoch": 6.015873015873016,
"grad_norm": 0.45806291042546377,
"learning_rate": 2.3678751450398196e-06,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1493530422449112,
"step": 3790,
"valid_targets_mean": 5264.6,
"valid_targets_min": 901
},
{
"epoch": 6.023809523809524,
"grad_norm": 0.4440865317653884,
"learning_rate": 2.330654130900656e-06,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13022762537002563,
"step": 3795,
"valid_targets_mean": 4942.4,
"valid_targets_min": 2199
},
{
"epoch": 6.031746031746032,
"grad_norm": 0.4289001750038118,
"learning_rate": 2.2937098730267572e-06,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11798284202814102,
"step": 3800,
"valid_targets_mean": 5962.4,
"valid_targets_min": 656
},
{
"epoch": 6.0396825396825395,
"grad_norm": 0.4804416865960379,
"learning_rate": 2.2570429500787604e-06,
"loss": 0.1359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13769641518592834,
"step": 3805,
"valid_targets_mean": 4876.4,
"valid_targets_min": 2078
},
{
"epoch": 6.0476190476190474,
"grad_norm": 0.4248137219988032,
"learning_rate": 2.2206539363733738e-06,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09792445600032806,
"step": 3810,
"valid_targets_mean": 6735.6,
"valid_targets_min": 2875
},
{
"epoch": 6.055555555555555,
"grad_norm": 0.4458277839797382,
"learning_rate": 2.1845434018744038e-06,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13032405078411102,
"step": 3815,
"valid_targets_mean": 5100.5,
"valid_targets_min": 1711
},
{
"epoch": 6.063492063492063,
"grad_norm": 0.46870997489479654,
"learning_rate": 2.148711912183803e-06,
"loss": 0.1349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1340586543083191,
"step": 3820,
"valid_targets_mean": 6257.2,
"valid_targets_min": 3713
},
{
"epoch": 6.071428571428571,
"grad_norm": 0.43220936389411174,
"learning_rate": 2.1131600285328458e-06,
"loss": 0.1372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13491111993789673,
"step": 3825,
"valid_targets_mean": 5652.9,
"valid_targets_min": 2291
},
{
"epoch": 6.079365079365079,
"grad_norm": 0.4938619349035986,
"learning_rate": 2.0778883077732903e-06,
"loss": 0.1221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12590594589710236,
"step": 3830,
"valid_targets_mean": 5837.1,
"valid_targets_min": 1277
},
{
"epoch": 6.087301587301587,
"grad_norm": 0.4461842204628299,
"learning_rate": 2.0428973023686983e-06,
"loss": 0.1301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12995757162570953,
"step": 3835,
"valid_targets_mean": 5839.1,
"valid_targets_min": 2495
},
{
"epoch": 6.095238095238095,
"grad_norm": 0.4514403709392358,
"learning_rate": 2.0081875603857726e-06,
"loss": 0.1271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11519353836774826,
"step": 3840,
"valid_targets_mean": 5285.4,
"valid_targets_min": 1198
},
{
"epoch": 6.103174603174603,
"grad_norm": 0.5872250143318944,
"learning_rate": 1.973759625485743e-06,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12013471126556396,
"step": 3845,
"valid_targets_mean": 3976.3,
"valid_targets_min": 1509
},
{
"epoch": 6.111111111111111,
"grad_norm": 0.5053201570927205,
"learning_rate": 1.9396140369159e-06,
"loss": 0.1314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14312024414539337,
"step": 3850,
"valid_targets_mean": 5034.4,
"valid_targets_min": 712
},
{
"epoch": 6.119047619047619,
"grad_norm": 0.4254491047353564,
"learning_rate": 1.9057513295011087e-06,
"loss": 0.1249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11980589479207993,
"step": 3855,
"valid_targets_mean": 5230.5,
"valid_targets_min": 618
},
{
"epoch": 6.1269841269841265,
"grad_norm": 0.45350019220553667,
"learning_rate": 1.8721720336354487e-06,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1343933343887329,
"step": 3860,
"valid_targets_mean": 5310.0,
"valid_targets_min": 861
},
{
"epoch": 6.134920634920635,
"grad_norm": 0.44908680436264514,
"learning_rate": 1.8388766752739017e-06,
"loss": 0.1298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13214536011219025,
"step": 3865,
"valid_targets_mean": 4819.6,
"valid_targets_min": 360
},
{
"epoch": 6.142857142857143,
"grad_norm": 0.43728782320626974,
"learning_rate": 1.805865775924116e-06,
"loss": 0.137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12990088760852814,
"step": 3870,
"valid_targets_mean": 5668.4,
"valid_targets_min": 2900
},
{
"epoch": 6.150793650793651,
"grad_norm": 0.46855550237931853,
"learning_rate": 1.7731398526382416e-06,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11653086543083191,
"step": 3875,
"valid_targets_mean": 5082.9,
"valid_targets_min": 278
},
{
"epoch": 6.158730158730159,
"grad_norm": 0.4633118493365201,
"learning_rate": 1.7406994180048231e-06,
"loss": 0.1302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1214178055524826,
"step": 3880,
"valid_targets_mean": 5079.4,
"valid_targets_min": 596
},
{
"epoch": 6.166666666666667,
"grad_norm": 0.4324845887042187,
"learning_rate": 1.7085449801407783e-06,
"loss": 0.1242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11891638487577438,
"step": 3885,
"valid_targets_mean": 5482.2,
"valid_targets_min": 630
},
{
"epoch": 6.174603174603175,
"grad_norm": 0.4593597812117515,
"learning_rate": 1.67667704268343e-06,
"loss": 0.1302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12844383716583252,
"step": 3890,
"valid_targets_mean": 5304.3,
"valid_targets_min": 968
},
{
"epoch": 6.182539682539683,
"grad_norm": 1.0409294151451973,
"learning_rate": 1.6450961047826353e-06,
"loss": 0.127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14141665399074554,
"step": 3895,
"valid_targets_mean": 4083.4,
"valid_targets_min": 287
},
{
"epoch": 6.190476190476191,
"grad_norm": 0.4147176475336051,
"learning_rate": 1.6138026610929446e-06,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12204622477293015,
"step": 3900,
"valid_targets_mean": 6026.9,
"valid_targets_min": 1789
},
{
"epoch": 6.198412698412699,
"grad_norm": 0.7688468165385852,
"learning_rate": 1.5827972017658732e-06,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14009518921375275,
"step": 3905,
"valid_targets_mean": 5232.4,
"valid_targets_min": 609
},
{
"epoch": 6.2063492063492065,
"grad_norm": 0.5742634408323547,
"learning_rate": 1.5520802124422108e-06,
"loss": 0.1284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11271405220031738,
"step": 3910,
"valid_targets_mean": 5412.1,
"valid_targets_min": 677
},
{
"epoch": 6.214285714285714,
"grad_norm": 0.4434637011482024,
"learning_rate": 1.5216521742444236e-06,
"loss": 0.1266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15959657728672028,
"step": 3915,
"valid_targets_mean": 5545.5,
"valid_targets_min": 366
},
{
"epoch": 6.222222222222222,
"grad_norm": 0.4473257762920866,
"learning_rate": 1.491513563769118e-06,
"loss": 0.1277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13596297800540924,
"step": 3920,
"valid_targets_mean": 6079.2,
"valid_targets_min": 1352
},
{
"epoch": 6.23015873015873,
"grad_norm": 0.40218956890406166,
"learning_rate": 1.4616648530795673e-06,
"loss": 0.1367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13123834133148193,
"step": 3925,
"valid_targets_mean": 6588.4,
"valid_targets_min": 1264
},
{
"epoch": 6.238095238095238,
"grad_norm": 0.4665917089898694,
"learning_rate": 1.432106509698319e-06,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14458967745304108,
"step": 3930,
"valid_targets_mean": 5620.0,
"valid_targets_min": 2860
},
{
"epoch": 6.246031746031746,
"grad_norm": 0.4804278259544632,
"learning_rate": 1.4028389965998867e-06,
"loss": 0.1322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13646945357322693,
"step": 3935,
"valid_targets_mean": 4918.8,
"valid_targets_min": 2109
},
{
"epoch": 6.253968253968254,
"grad_norm": 0.4573452936493578,
"learning_rate": 1.3738627722034848e-06,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12479956448078156,
"step": 3940,
"valid_targets_mean": 5664.0,
"valid_targets_min": 890
},
{
"epoch": 6.261904761904762,
"grad_norm": 0.4112194821979111,
"learning_rate": 1.345178290365845e-06,
"loss": 0.1303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12601318955421448,
"step": 3945,
"valid_targets_mean": 5897.8,
"valid_targets_min": 2441
},
{
"epoch": 6.26984126984127,
"grad_norm": 0.43770788181094994,
"learning_rate": 1.3167860003741218e-06,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13687068223953247,
"step": 3950,
"valid_targets_mean": 5294.8,
"valid_targets_min": 872
},
{
"epoch": 6.277777777777778,
"grad_norm": 0.43651984734406524,
"learning_rate": 1.2886863469388389e-06,
"loss": 0.1357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13095057010650635,
"step": 3955,
"valid_targets_mean": 5041.6,
"valid_targets_min": 946
},
{
"epoch": 6.285714285714286,
"grad_norm": 0.4407006248372022,
"learning_rate": 1.2608797701869425e-06,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13327287137508392,
"step": 3960,
"valid_targets_mean": 5152.8,
"valid_targets_min": 968
},
{
"epoch": 6.2936507936507935,
"grad_norm": 0.4830750093647113,
"learning_rate": 1.2333667056548881e-06,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12351542711257935,
"step": 3965,
"valid_targets_mean": 4494.3,
"valid_targets_min": 299
},
{
"epoch": 6.301587301587301,
"grad_norm": 0.4721717415354756,
"learning_rate": 1.2061475842818337e-06,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15659388899803162,
"step": 3970,
"valid_targets_mean": 5026.2,
"valid_targets_min": 1775
},
{
"epoch": 6.309523809523809,
"grad_norm": 0.42311493337432965,
"learning_rate": 1.1792228324028776e-06,
"loss": 0.1289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15567630529403687,
"step": 3975,
"valid_targets_mean": 5791.2,
"valid_targets_min": 3515
},
{
"epoch": 6.317460317460317,
"grad_norm": 1.4585742478929205,
"learning_rate": 1.152592871742395e-06,
"loss": 0.133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13825181126594543,
"step": 3980,
"valid_targets_mean": 5244.9,
"valid_targets_min": 558
},
{
"epoch": 6.325396825396825,
"grad_norm": 0.461117951811656,
"learning_rate": 1.1262581194074152e-06,
"loss": 0.131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11796639859676361,
"step": 3985,
"valid_targets_mean": 5554.2,
"valid_targets_min": 2245
},
{
"epoch": 6.333333333333333,
"grad_norm": 0.47633924217416224,
"learning_rate": 1.100218987881112e-06,
"loss": 0.1325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12955845892429352,
"step": 3990,
"valid_targets_mean": 6029.9,
"valid_targets_min": 2670
},
{
"epoch": 6.341269841269841,
"grad_norm": 0.45154703338066743,
"learning_rate": 1.0744758850163085e-06,
"loss": 0.1408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13291522860527039,
"step": 3995,
"valid_targets_mean": 5422.9,
"valid_targets_min": 539
},
{
"epoch": 6.349206349206349,
"grad_norm": 0.5119900863580499,
"learning_rate": 1.0490292140291247e-06,
"loss": 0.1382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13096119463443756,
"step": 4000,
"valid_targets_mean": 5480.8,
"valid_targets_min": 291
},
{
"epoch": 6.357142857142857,
"grad_norm": 0.5126206204332201,
"learning_rate": 1.0238793734926467e-06,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14911425113677979,
"step": 4005,
"valid_targets_mean": 4797.0,
"valid_targets_min": 1266
},
{
"epoch": 6.365079365079365,
"grad_norm": 0.4880357246785836,
"learning_rate": 9.990267573306745e-07,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1387421041727066,
"step": 4010,
"valid_targets_mean": 4544.9,
"valid_targets_min": 690
},
{
"epoch": 6.3730158730158735,
"grad_norm": 0.40558138018757806,
"learning_rate": 9.744717548115613e-07,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12570391595363617,
"step": 4015,
"valid_targets_mean": 6268.6,
"valid_targets_min": 3291
},
{
"epoch": 6.380952380952381,
"grad_norm": 0.41810620070165866,
"learning_rate": 9.502147505421244e-07,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1270408034324646,
"step": 4020,
"valid_targets_mean": 6078.6,
"valid_targets_min": 797
},
{
"epoch": 6.388888888888889,
"grad_norm": 0.4496644146071595,
"learning_rate": 9.262561244616108e-07,
"loss": 0.133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14739742875099182,
"step": 4025,
"valid_targets_mean": 5835.8,
"valid_targets_min": 783
},
{
"epoch": 6.396825396825397,
"grad_norm": 0.45373871441149133,
"learning_rate": 9.025962518357323e-07,
"loss": 0.1241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11742935329675674,
"step": 4030,
"valid_targets_mean": 4566.4,
"valid_targets_min": 290
},
{
"epoch": 6.404761904761905,
"grad_norm": 0.4617395683182264,
"learning_rate": 8.792355032508282e-07,
"loss": 0.1362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12306074798107147,
"step": 4035,
"valid_targets_mean": 5038.2,
"valid_targets_min": 626
},
{
"epoch": 6.412698412698413,
"grad_norm": 0.4644079416505595,
"learning_rate": 8.561742446080168e-07,
"loss": 0.1282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1280827522277832,
"step": 4040,
"valid_targets_mean": 5057.6,
"valid_targets_min": 663
},
{
"epoch": 6.420634920634921,
"grad_norm": 0.425213082782362,
"learning_rate": 8.334128371174955e-07,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14657798409461975,
"step": 4045,
"valid_targets_mean": 6001.6,
"valid_targets_min": 582
},
{
"epoch": 6.428571428571429,
"grad_norm": 0.428425934530618,
"learning_rate": 8.109516372928605e-07,
"loss": 0.1309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13139371573925018,
"step": 4050,
"valid_targets_mean": 5651.9,
"valid_targets_min": 2298
},
{
"epoch": 6.436507936507937,
"grad_norm": 0.4405821827658464,
"learning_rate": 7.887909969455366e-07,
"loss": 0.1326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12469398230314255,
"step": 4055,
"valid_targets_mean": 5376.2,
"valid_targets_min": 267
},
{
"epoch": 6.444444444444445,
"grad_norm": 0.5057128403035726,
"learning_rate": 7.669312631792758e-07,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14254549145698547,
"step": 4060,
"valid_targets_mean": 5674.9,
"valid_targets_min": 2241
},
{
"epoch": 6.4523809523809526,
"grad_norm": 0.615770615958985,
"learning_rate": 7.453727783846876e-07,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1313585788011551,
"step": 4065,
"valid_targets_mean": 5325.8,
"valid_targets_min": 1267
},
{
"epoch": 6.4603174603174605,
"grad_norm": 0.4640004582080486,
"learning_rate": 7.241158802339065e-07,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14738494157791138,
"step": 4070,
"valid_targets_mean": 5742.9,
"valid_targets_min": 297
},
{
"epoch": 6.468253968253968,
"grad_norm": 0.44707812759358856,
"learning_rate": 7.031609016753016e-07,
"loss": 0.1372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1283096969127655,
"step": 4075,
"valid_targets_mean": 5941.6,
"valid_targets_min": 2715
},
{
"epoch": 6.476190476190476,
"grad_norm": 0.5025741831025621,
"learning_rate": 6.825081709282377e-07,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14924189448356628,
"step": 4080,
"valid_targets_mean": 5481.9,
"valid_targets_min": 673
},
{
"epoch": 6.484126984126984,
"grad_norm": 0.4928322290987037,
"learning_rate": 6.62158011477958e-07,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14254453778266907,
"step": 4085,
"valid_targets_mean": 5396.4,
"valid_targets_min": 1013
},
{
"epoch": 6.492063492063492,
"grad_norm": 0.4463090392869717,
"learning_rate": 6.421107420705097e-07,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1291046142578125,
"step": 4090,
"valid_targets_mean": 5304.8,
"valid_targets_min": 1268
},
{
"epoch": 6.5,
"grad_norm": 0.41940627052314144,
"learning_rate": 6.223666767077508e-07,
"loss": 0.1369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1368085891008377,
"step": 4095,
"valid_targets_mean": 5791.9,
"valid_targets_min": 824
},
{
"epoch": 6.507936507936508,
"grad_norm": 0.38633976220944566,
"learning_rate": 6.029261246424267e-07,
"loss": 0.1254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11674937605857849,
"step": 4100,
"valid_targets_mean": 7173.1,
"valid_targets_min": 3321
},
{
"epoch": 6.515873015873016,
"grad_norm": 0.5710755866104514,
"learning_rate": 5.837893903733394e-07,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14703723788261414,
"step": 4105,
"valid_targets_mean": 4992.6,
"valid_targets_min": 251
},
{
"epoch": 6.523809523809524,
"grad_norm": 0.42790485901259206,
"learning_rate": 5.649567736405681e-07,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11689166724681854,
"step": 4110,
"valid_targets_mean": 5996.3,
"valid_targets_min": 3073
},
{
"epoch": 6.531746031746032,
"grad_norm": 0.3978542753238711,
"learning_rate": 5.464285694207672e-07,
"loss": 0.1299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12328889966011047,
"step": 4115,
"valid_targets_mean": 6366.9,
"valid_targets_min": 2921
},
{
"epoch": 6.5396825396825395,
"grad_norm": 0.4803261314786915,
"learning_rate": 5.282050679225714e-07,
"loss": 0.1332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13136357069015503,
"step": 4120,
"valid_targets_mean": 5456.8,
"valid_targets_min": 1746
},
{
"epoch": 6.5476190476190474,
"grad_norm": 0.3906973340150284,
"learning_rate": 5.102865545820245e-07,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12256291508674622,
"step": 4125,
"valid_targets_mean": 6359.6,
"valid_targets_min": 2305
},
{
"epoch": 6.555555555555555,
"grad_norm": 0.4059594097865994,
"learning_rate": 4.926733100581182e-07,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11908716708421707,
"step": 4130,
"valid_targets_mean": 6355.2,
"valid_targets_min": 325
},
{
"epoch": 6.563492063492063,
"grad_norm": 0.5832130007483879,
"learning_rate": 4.7536561022840213e-07,
"loss": 0.1346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13830284774303436,
"step": 4135,
"valid_targets_mean": 4896.4,
"valid_targets_min": 1408
},
{
"epoch": 6.571428571428571,
"grad_norm": 0.4059800621113446,
"learning_rate": 4.5836372618464964e-07,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12423016875982285,
"step": 4140,
"valid_targets_mean": 6594.7,
"valid_targets_min": 3811
},
{
"epoch": 6.579365079365079,
"grad_norm": 0.4185374589094962,
"learning_rate": 4.416679242286215e-07,
"loss": 0.1279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13419991731643677,
"step": 4145,
"valid_targets_mean": 6087.1,
"valid_targets_min": 2433
},
{
"epoch": 6.587301587301587,
"grad_norm": 0.5103870835544566,
"learning_rate": 4.2527846586789547e-07,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14000031352043152,
"step": 4150,
"valid_targets_mean": 4625.3,
"valid_targets_min": 221
},
{
"epoch": 6.595238095238095,
"grad_norm": 0.5765993905041488,
"learning_rate": 4.0919560781176317e-07,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13032563030719757,
"step": 4155,
"valid_targets_mean": 5195.4,
"valid_targets_min": 1443
},
{
"epoch": 6.603174603174603,
"grad_norm": 0.48593436180980204,
"learning_rate": 3.934196019672176e-07,
"loss": 0.1267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13097088038921356,
"step": 4160,
"valid_targets_mean": 4735.8,
"valid_targets_min": 1686
},
{
"epoch": 6.611111111111111,
"grad_norm": 0.4395609496182445,
"learning_rate": 3.779506954349965e-07,
"loss": 0.1357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12398695945739746,
"step": 4165,
"valid_targets_mean": 6392.1,
"valid_targets_min": 2819
},
{
"epoch": 6.619047619047619,
"grad_norm": 0.47600560032316025,
"learning_rate": 3.6278913050572076e-07,
"loss": 0.1377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1410660743713379,
"step": 4170,
"valid_targets_mean": 4714.9,
"valid_targets_min": 921
},
{
"epoch": 6.6269841269841265,
"grad_norm": 0.4626328635010138,
"learning_rate": 3.4793514465610414e-07,
"loss": 0.1227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12245401740074158,
"step": 4175,
"valid_targets_mean": 5662.9,
"valid_targets_min": 1293
},
{
"epoch": 6.634920634920634,
"grad_norm": 0.4856477089680751,
"learning_rate": 3.3338897054521205e-07,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12981770932674408,
"step": 4180,
"valid_targets_mean": 6161.9,
"valid_targets_min": 1672
},
{
"epoch": 6.642857142857143,
"grad_norm": 0.4382225877662096,
"learning_rate": 3.191508360108464e-07,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12940582633018494,
"step": 4185,
"valid_targets_mean": 5541.3,
"valid_targets_min": 525
},
{
"epoch": 6.650793650793651,
"grad_norm": 0.4467797690671947,
"learning_rate": 3.0522096406595536e-07,
"loss": 0.1249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12461797893047333,
"step": 4190,
"valid_targets_mean": 5350.9,
"valid_targets_min": 1531
},
{
"epoch": 6.658730158730159,
"grad_norm": 0.4315640371338101,
"learning_rate": 2.9159957289514926e-07,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1185673251748085,
"step": 4195,
"valid_targets_mean": 5560.6,
"valid_targets_min": 2700
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.48404703695546003,
"learning_rate": 2.782868758512791e-07,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13700520992279053,
"step": 4200,
"valid_targets_mean": 5088.4,
"valid_targets_min": 708
},
{
"epoch": 6.674603174603175,
"grad_norm": 0.4561326307439442,
"learning_rate": 2.6528308145210125e-07,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14443397521972656,
"step": 4205,
"valid_targets_mean": 5388.9,
"valid_targets_min": 987
},
{
"epoch": 6.682539682539683,
"grad_norm": 0.4432184683642521,
"learning_rate": 2.525883933770046e-07,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13129255175590515,
"step": 4210,
"valid_targets_mean": 6560.8,
"valid_targets_min": 2872
},
{
"epoch": 6.690476190476191,
"grad_norm": 0.4428498025907347,
"learning_rate": 2.402030104638198e-07,
"loss": 0.1281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1193118616938591,
"step": 4215,
"valid_targets_mean": 5178.1,
"valid_targets_min": 1066
},
{
"epoch": 6.698412698412699,
"grad_norm": 0.4342898053436231,
"learning_rate": 2.2812712670571502e-07,
"loss": 0.1307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13040482997894287,
"step": 4220,
"valid_targets_mean": 5622.1,
"valid_targets_min": 2496
},
{
"epoch": 6.7063492063492065,
"grad_norm": 2.0764732196910196,
"learning_rate": 2.1636093124814738e-07,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12159843742847443,
"step": 4225,
"valid_targets_mean": 5518.6,
"valid_targets_min": 1795
},
{
"epoch": 6.714285714285714,
"grad_norm": 0.4586433877189939,
"learning_rate": 2.0490460838589855e-07,
"loss": 0.1337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12682956457138062,
"step": 4230,
"valid_targets_mean": 4948.1,
"valid_targets_min": 1032
},
{
"epoch": 6.722222222222222,
"grad_norm": 0.47132990810816733,
"learning_rate": 1.9375833756019923e-07,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15487657487392426,
"step": 4235,
"valid_targets_mean": 4774.9,
"valid_targets_min": 1168
},
{
"epoch": 6.73015873015873,
"grad_norm": 0.4124840094163903,
"learning_rate": 1.8292229335590716e-07,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11652678996324539,
"step": 4240,
"valid_targets_mean": 6393.1,
"valid_targets_min": 3197
},
{
"epoch": 6.738095238095238,
"grad_norm": 0.4350958770760526,
"learning_rate": 1.7239664549878688e-07,
"loss": 0.1297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1278618425130844,
"step": 4245,
"valid_targets_mean": 5711.4,
"valid_targets_min": 307
},
{
"epoch": 6.746031746031746,
"grad_norm": 0.4380389060922931,
"learning_rate": 1.6218155885283192e-07,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1238991990685463,
"step": 4250,
"valid_targets_mean": 5243.3,
"valid_targets_min": 1150
},
{
"epoch": 6.753968253968254,
"grad_norm": 0.45207585431063574,
"learning_rate": 1.5227719341769364e-07,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12772828340530396,
"step": 4255,
"valid_targets_mean": 6135.6,
"valid_targets_min": 2455
},
{
"epoch": 6.761904761904762,
"grad_norm": 0.48236608264345426,
"learning_rate": 1.4268370432618306e-07,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14505012333393097,
"step": 4260,
"valid_targets_mean": 4687.0,
"valid_targets_min": 764
},
{
"epoch": 6.76984126984127,
"grad_norm": 0.4233867675421516,
"learning_rate": 1.3340124184182178e-07,
"loss": 0.1289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12908919155597687,
"step": 4265,
"valid_targets_mean": 6025.6,
"valid_targets_min": 2257
},
{
"epoch": 6.777777777777778,
"grad_norm": 0.4877416792035469,
"learning_rate": 1.2442995135650393e-07,
"loss": 0.1296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15760302543640137,
"step": 4270,
"valid_targets_mean": 4828.7,
"valid_targets_min": 268
},
{
"epoch": 6.785714285714286,
"grad_norm": 0.6506490177567913,
"learning_rate": 1.1576997338821339e-07,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13028597831726074,
"step": 4275,
"valid_targets_mean": 5155.9,
"valid_targets_min": 845
},
{
"epoch": 6.7936507936507935,
"grad_norm": 0.4477970591498348,
"learning_rate": 1.0742144357882567e-07,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1585049331188202,
"step": 4280,
"valid_targets_mean": 5534.2,
"valid_targets_min": 310
},
{
"epoch": 6.801587301587301,
"grad_norm": 0.49507868999640176,
"learning_rate": 9.938449269197181e-08,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1410304307937622,
"step": 4285,
"valid_targets_mean": 4884.3,
"valid_targets_min": 447
},
{
"epoch": 6.809523809523809,
"grad_norm": 0.4842993936056907,
"learning_rate": 9.165924661100889e-08,
"loss": 0.1347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12479911744594574,
"step": 4290,
"valid_targets_mean": 5132.9,
"valid_targets_min": 397
},
{
"epoch": 6.817460317460317,
"grad_norm": 0.43326494078340105,
"learning_rate": 8.424582633703493e-08,
"loss": 0.1291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13402575254440308,
"step": 4295,
"valid_targets_mean": 5267.1,
"valid_targets_min": 1121
},
{
"epoch": 6.825396825396825,
"grad_norm": 0.39800154553874223,
"learning_rate": 7.714434798699933e-08,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12014246731996536,
"step": 4300,
"valid_targets_mean": 6144.5,
"valid_targets_min": 2815
},
{
"epoch": 6.833333333333333,
"grad_norm": 0.42208852936776803,
"learning_rate": 7.035492279187538e-08,
"loss": 0.1331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12092911452054977,
"step": 4305,
"valid_targets_mean": 5618.4,
"valid_targets_min": 855
},
{
"epoch": 6.841269841269841,
"grad_norm": 0.5061623759467122,
"learning_rate": 6.387765709493288e-08,
"loss": 0.1362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13144025206565857,
"step": 4310,
"valid_targets_mean": 5299.0,
"valid_targets_min": 737
},
{
"epoch": 6.849206349206349,
"grad_norm": 0.4703474965866674,
"learning_rate": 5.7712652350061515e-08,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14938583970069885,
"step": 4315,
"valid_targets_mean": 4459.2,
"valid_targets_min": 229
},
{
"epoch": 6.857142857142857,
"grad_norm": 0.4544153706399285,
"learning_rate": 5.186000512018341e-08,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13210490345954895,
"step": 4320,
"valid_targets_mean": 5968.1,
"valid_targets_min": 1966
},
{
"epoch": 6.865079365079366,
"grad_norm": 0.3951693224390717,
"learning_rate": 4.631980707574535e-08,
"loss": 0.1222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10764377564191818,
"step": 4325,
"valid_targets_mean": 6102.2,
"valid_targets_min": 281
},
{
"epoch": 6.8730158730158735,
"grad_norm": 0.47764153403255666,
"learning_rate": 4.10921449932733e-08,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13427546620368958,
"step": 4330,
"valid_targets_mean": 4686.6,
"valid_targets_min": 1301
},
{
"epoch": 6.880952380952381,
"grad_norm": 0.4686718928282114,
"learning_rate": 3.61771007540268e-08,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12770965695381165,
"step": 4335,
"valid_targets_mean": 5458.8,
"valid_targets_min": 632
},
{
"epoch": 6.888888888888889,
"grad_norm": 0.45215811836727576,
"learning_rate": 3.157475134270227e-08,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14995113015174866,
"step": 4340,
"valid_targets_mean": 5664.1,
"valid_targets_min": 3600
},
{
"epoch": 6.896825396825397,
"grad_norm": 0.49008507070012214,
"learning_rate": 2.728516884624277e-08,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13054564595222473,
"step": 4345,
"valid_targets_mean": 5089.6,
"valid_targets_min": 637
},
{
"epoch": 6.904761904761905,
"grad_norm": 0.48404319287292985,
"learning_rate": 2.3308420452690106e-08,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13617941737174988,
"step": 4350,
"valid_targets_mean": 4722.2,
"valid_targets_min": 1597
},
{
"epoch": 6.912698412698413,
"grad_norm": 0.40638533094484175,
"learning_rate": 1.9644568450147837e-08,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14109522104263306,
"step": 4355,
"valid_targets_mean": 6445.0,
"valid_targets_min": 3553
},
{
"epoch": 6.920634920634921,
"grad_norm": 0.4629617085369057,
"learning_rate": 1.6293670225799864e-08,
"loss": 0.1253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1260548233985901,
"step": 4360,
"valid_targets_mean": 5373.1,
"valid_targets_min": 543
},
{
"epoch": 6.928571428571429,
"grad_norm": 0.45402888146937276,
"learning_rate": 1.3255778265013342e-08,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14494284987449646,
"step": 4365,
"valid_targets_mean": 5725.3,
"valid_targets_min": 1550
},
{
"epoch": 6.936507936507937,
"grad_norm": 0.4086709277572136,
"learning_rate": 1.0530940150512703e-08,
"loss": 0.1352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1179996132850647,
"step": 4370,
"valid_targets_mean": 5990.4,
"valid_targets_min": 361
},
{
"epoch": 6.944444444444445,
"grad_norm": 0.42662410297325026,
"learning_rate": 8.119198561638009e-09,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14371398091316223,
"step": 4375,
"valid_targets_mean": 5997.8,
"valid_targets_min": 3437
},
{
"epoch": 6.9523809523809526,
"grad_norm": 0.42639557312324744,
"learning_rate": 6.020591273674381e-09,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1339547336101532,
"step": 4380,
"valid_targets_mean": 6416.2,
"valid_targets_min": 609
},
{
"epoch": 6.9603174603174605,
"grad_norm": 0.4092765044556627,
"learning_rate": 4.2351511572635835e-09,
"loss": 0.1359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10867651551961899,
"step": 4385,
"valid_targets_mean": 6632.2,
"valid_targets_min": 1370
},
{
"epoch": 6.968253968253968,
"grad_norm": 0.4951156195990528,
"learning_rate": 2.7629061778866597e-09,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1670551598072052,
"step": 4390,
"valid_targets_mean": 5063.4,
"valid_targets_min": 949
},
{
"epoch": 6.976190476190476,
"grad_norm": 0.5279789366650457,
"learning_rate": 1.603879395422059e-09,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14463752508163452,
"step": 4395,
"valid_targets_mean": 4726.2,
"valid_targets_min": 638
},
{
"epoch": 6.984126984126984,
"grad_norm": 0.43870727411718197,
"learning_rate": 7.580889637925914e-10,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14193710684776306,
"step": 4400,
"valid_targets_mean": 5203.9,
"valid_targets_min": 767
},
{
"epoch": 6.992063492063492,
"grad_norm": 0.4604903629839532,
"learning_rate": 2.2554813067676705e-10,
"loss": 0.1268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1437646746635437,
"step": 4405,
"valid_targets_mean": 5522.9,
"valid_targets_min": 809
},
{
"epoch": 7.0,
"grad_norm": 0.4923560486700678,
"learning_rate": 6.265237300073778e-12,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15846839547157288,
"step": 4410,
"valid_targets_mean": 5295.1,
"valid_targets_min": 1258
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15846839547157288,
"step": 4410,
"total_flos": 1765744004825088.0,
"train_loss": 0.17469855595608147,
"train_runtime": 27741.8701,
"train_samples_per_second": 2.541,
"train_steps_per_second": 0.159,
"valid_targets_mean": 5295.1,
"valid_targets_min": 1258
}
],
"logging_steps": 5,
"max_steps": 4410,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1765744004825088.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}