{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4158, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.015822784810126583, "grad_norm": 19.635326284997042, "learning_rate": 7.207207207207208e-07, "loss": 0.8894, "loss_nan_ranks": 0, "loss_rank_avg": 0.8479753136634827, "step": 5, "valid_targets_mean": 6356.2, "valid_targets_min": 4626 }, { "epoch": 0.03164556962025317, "grad_norm": 16.13080891734784, "learning_rate": 1.6216216216216219e-06, "loss": 0.8811, "loss_nan_ranks": 0, "loss_rank_avg": 0.8280214071273804, "step": 10, "valid_targets_mean": 5469.8, "valid_targets_min": 1984 }, { "epoch": 0.04746835443037975, "grad_norm": 11.991696300533674, "learning_rate": 2.5225225225225225e-06, "loss": 0.8509, "loss_nan_ranks": 0, "loss_rank_avg": 0.8600161075592041, "step": 15, "valid_targets_mean": 4922.1, "valid_targets_min": 963 }, { "epoch": 0.06329113924050633, "grad_norm": 5.138935831764275, "learning_rate": 3.423423423423424e-06, "loss": 0.7628, "loss_nan_ranks": 0, "loss_rank_avg": 0.730722188949585, "step": 20, "valid_targets_mean": 5286.3, "valid_targets_min": 2311 }, { "epoch": 0.07911392405063292, "grad_norm": 2.5378388792138282, "learning_rate": 4.324324324324325e-06, "loss": 0.7133, "loss_nan_ranks": 0, "loss_rank_avg": 0.7108891010284424, "step": 25, "valid_targets_mean": 6008.8, "valid_targets_min": 2554 }, { "epoch": 0.0949367088607595, "grad_norm": 1.7389619679720372, "learning_rate": 5.225225225225226e-06, "loss": 0.6769, "loss_nan_ranks": 0, "loss_rank_avg": 0.6590981483459473, "step": 30, "valid_targets_mean": 5323.6, "valid_targets_min": 738 }, { "epoch": 0.11075949367088607, "grad_norm": 1.3640080618334556, "learning_rate": 6.126126126126126e-06, "loss": 0.6836, "loss_nan_ranks": 0, "loss_rank_avg": 0.618993878364563, "step": 35, "valid_targets_mean": 6272.8, "valid_targets_min": 4170 }, { "epoch": 0.12658227848101267, "grad_norm": 1.1186375634687915, "learning_rate": 7.027027027027028e-06, "loss": 0.6246, "loss_nan_ranks": 0, "loss_rank_avg": 0.6017647981643677, "step": 40, "valid_targets_mean": 5764.1, "valid_targets_min": 4916 }, { "epoch": 0.14240506329113925, "grad_norm": 0.9386209237716225, "learning_rate": 7.927927927927929e-06, "loss": 0.6045, "loss_nan_ranks": 0, "loss_rank_avg": 0.59061598777771, "step": 45, "valid_targets_mean": 5393.1, "valid_targets_min": 2068 }, { "epoch": 0.15822784810126583, "grad_norm": 0.8597710318195954, "learning_rate": 8.82882882882883e-06, "loss": 0.587, "loss_nan_ranks": 0, "loss_rank_avg": 0.5794469714164734, "step": 50, "valid_targets_mean": 5057.8, "valid_targets_min": 529 }, { "epoch": 0.17405063291139242, "grad_norm": 0.7380078972896661, "learning_rate": 9.729729729729732e-06, "loss": 0.5877, "loss_nan_ranks": 0, "loss_rank_avg": 0.5776603817939758, "step": 55, "valid_targets_mean": 5990.2, "valid_targets_min": 2501 }, { "epoch": 0.189873417721519, "grad_norm": 0.7385128432786578, "learning_rate": 1.0630630630630632e-05, "loss": 0.5414, "loss_nan_ranks": 0, "loss_rank_avg": 0.5155864357948303, "step": 60, "valid_targets_mean": 5768.9, "valid_targets_min": 2221 }, { "epoch": 0.20569620253164558, "grad_norm": 0.6209730262155323, "learning_rate": 1.1531531531531532e-05, "loss": 0.5315, "loss_nan_ranks": 0, "loss_rank_avg": 0.5242434740066528, "step": 65, "valid_targets_mean": 5509.4, "valid_targets_min": 936 }, { "epoch": 0.22151898734177214, "grad_norm": 0.6528264506538175, "learning_rate": 1.2432432432432433e-05, "loss": 0.512, "loss_nan_ranks": 0, "loss_rank_avg": 0.4938278794288635, "step": 70, "valid_targets_mean": 5477.1, "valid_targets_min": 706 }, { "epoch": 0.23734177215189872, "grad_norm": 0.5670440656251462, "learning_rate": 1.3333333333333333e-05, "loss": 0.4835, "loss_nan_ranks": 0, "loss_rank_avg": 0.490886926651001, "step": 75, "valid_targets_mean": 6629.6, "valid_targets_min": 2375 }, { "epoch": 0.25316455696202533, "grad_norm": 0.5622722280452882, "learning_rate": 1.4234234234234234e-05, "loss": 0.466, "loss_nan_ranks": 0, "loss_rank_avg": 0.45689529180526733, "step": 80, "valid_targets_mean": 5843.8, "valid_targets_min": 3654 }, { "epoch": 0.2689873417721519, "grad_norm": 0.605023842930082, "learning_rate": 1.5135135135135138e-05, "loss": 0.4579, "loss_nan_ranks": 0, "loss_rank_avg": 0.4165900945663452, "step": 85, "valid_targets_mean": 5597.8, "valid_targets_min": 1965 }, { "epoch": 0.2848101265822785, "grad_norm": 0.5554544705328142, "learning_rate": 1.6036036036036036e-05, "loss": 0.4421, "loss_nan_ranks": 0, "loss_rank_avg": 0.46295350790023804, "step": 90, "valid_targets_mean": 5449.9, "valid_targets_min": 572 }, { "epoch": 0.30063291139240506, "grad_norm": 0.6041342893699451, "learning_rate": 1.693693693693694e-05, "loss": 0.4352, "loss_nan_ranks": 0, "loss_rank_avg": 0.44789403676986694, "step": 95, "valid_targets_mean": 5553.9, "valid_targets_min": 607 }, { "epoch": 0.31645569620253167, "grad_norm": 0.7659279709674273, "learning_rate": 1.783783783783784e-05, "loss": 0.4242, "loss_nan_ranks": 0, "loss_rank_avg": 0.4142349660396576, "step": 100, "valid_targets_mean": 5741.9, "valid_targets_min": 1930 }, { "epoch": 0.3322784810126582, "grad_norm": 0.6209067476802824, "learning_rate": 1.873873873873874e-05, "loss": 0.4183, "loss_nan_ranks": 0, "loss_rank_avg": 0.4335191547870636, "step": 105, "valid_targets_mean": 6375.3, "valid_targets_min": 4533 }, { "epoch": 0.34810126582278483, "grad_norm": 0.581107613504689, "learning_rate": 1.963963963963964e-05, "loss": 0.4175, "loss_nan_ranks": 0, "loss_rank_avg": 0.41051313281059265, "step": 110, "valid_targets_mean": 5599.6, "valid_targets_min": 1732 }, { "epoch": 0.3639240506329114, "grad_norm": 0.6038416216295759, "learning_rate": 2.054054054054054e-05, "loss": 0.3992, "loss_nan_ranks": 0, "loss_rank_avg": 0.4384707808494568, "step": 115, "valid_targets_mean": 5761.0, "valid_targets_min": 809 }, { "epoch": 0.379746835443038, "grad_norm": 0.5907567666475526, "learning_rate": 2.1441441441441442e-05, "loss": 0.3927, "loss_nan_ranks": 0, "loss_rank_avg": 0.40794870257377625, "step": 120, "valid_targets_mean": 5991.1, "valid_targets_min": 710 }, { "epoch": 0.39556962025316456, "grad_norm": 0.5764381955083145, "learning_rate": 2.234234234234234e-05, "loss": 0.4041, "loss_nan_ranks": 0, "loss_rank_avg": 0.4018586277961731, "step": 125, "valid_targets_mean": 5456.4, "valid_targets_min": 1555 }, { "epoch": 0.41139240506329117, "grad_norm": 0.5755518106976973, "learning_rate": 2.3243243243243243e-05, "loss": 0.3897, "loss_nan_ranks": 0, "loss_rank_avg": 0.3841174840927124, "step": 130, "valid_targets_mean": 5648.2, "valid_targets_min": 3331 }, { "epoch": 0.4272151898734177, "grad_norm": 0.7549254910637737, "learning_rate": 2.414414414414415e-05, "loss": 0.3976, "loss_nan_ranks": 0, "loss_rank_avg": 0.36377841234207153, "step": 135, "valid_targets_mean": 4960.0, "valid_targets_min": 685 }, { "epoch": 0.4430379746835443, "grad_norm": 0.646228878541494, "learning_rate": 2.5045045045045047e-05, "loss": 0.39, "loss_nan_ranks": 0, "loss_rank_avg": 0.3614453077316284, "step": 140, "valid_targets_mean": 6316.5, "valid_targets_min": 3461 }, { "epoch": 0.4588607594936709, "grad_norm": 0.6223647658352607, "learning_rate": 2.594594594594595e-05, "loss": 0.3932, "loss_nan_ranks": 0, "loss_rank_avg": 0.3782048523426056, "step": 145, "valid_targets_mean": 5925.8, "valid_targets_min": 962 }, { "epoch": 0.47468354430379744, "grad_norm": 0.5319538222768427, "learning_rate": 2.6846846846846852e-05, "loss": 0.3691, "loss_nan_ranks": 0, "loss_rank_avg": 0.35863935947418213, "step": 150, "valid_targets_mean": 6230.6, "valid_targets_min": 4410 }, { "epoch": 0.49050632911392406, "grad_norm": 0.5959100850015796, "learning_rate": 2.774774774774775e-05, "loss": 0.3906, "loss_nan_ranks": 0, "loss_rank_avg": 0.4075894355773926, "step": 155, "valid_targets_mean": 5685.1, "valid_targets_min": 2217 }, { "epoch": 0.5063291139240507, "grad_norm": 0.6104000907758355, "learning_rate": 2.8648648648648653e-05, "loss": 0.3632, "loss_nan_ranks": 0, "loss_rank_avg": 0.3834109902381897, "step": 160, "valid_targets_mean": 5372.4, "valid_targets_min": 2488 }, { "epoch": 0.5221518987341772, "grad_norm": 0.5943597918399458, "learning_rate": 2.954954954954955e-05, "loss": 0.3611, "loss_nan_ranks": 0, "loss_rank_avg": 0.34721097350120544, "step": 165, "valid_targets_mean": 6153.5, "valid_targets_min": 3625 }, { "epoch": 0.5379746835443038, "grad_norm": 0.8779668397824408, "learning_rate": 3.0450450450450454e-05, "loss": 0.3584, "loss_nan_ranks": 0, "loss_rank_avg": 0.3657713830471039, "step": 170, "valid_targets_mean": 6067.9, "valid_targets_min": 2587 }, { "epoch": 0.5537974683544303, "grad_norm": 0.6223661471412824, "learning_rate": 3.135135135135135e-05, "loss": 0.3584, "loss_nan_ranks": 0, "loss_rank_avg": 0.3509843051433563, "step": 175, "valid_targets_mean": 5559.8, "valid_targets_min": 2152 }, { "epoch": 0.569620253164557, "grad_norm": 0.6222537770299622, "learning_rate": 3.225225225225225e-05, "loss": 0.3558, "loss_nan_ranks": 0, "loss_rank_avg": 0.3183259963989258, "step": 180, "valid_targets_mean": 5944.1, "valid_targets_min": 806 }, { "epoch": 0.5854430379746836, "grad_norm": 0.6005449566296928, "learning_rate": 3.3153153153153157e-05, "loss": 0.3585, "loss_nan_ranks": 0, "loss_rank_avg": 0.35840126872062683, "step": 185, "valid_targets_mean": 5495.9, "valid_targets_min": 3212 }, { "epoch": 0.6012658227848101, "grad_norm": 0.6023686554503512, "learning_rate": 3.4054054054054055e-05, "loss": 0.361, "loss_nan_ranks": 0, "loss_rank_avg": 0.3845367431640625, "step": 190, "valid_targets_mean": 6150.2, "valid_targets_min": 4223 }, { "epoch": 0.6170886075949367, "grad_norm": 0.5614758195645654, "learning_rate": 3.4954954954954954e-05, "loss": 0.3677, "loss_nan_ranks": 0, "loss_rank_avg": 0.35003113746643066, "step": 195, "valid_targets_mean": 6085.7, "valid_targets_min": 648 }, { "epoch": 0.6329113924050633, "grad_norm": 0.5669477947277907, "learning_rate": 3.585585585585586e-05, "loss": 0.3482, "loss_nan_ranks": 0, "loss_rank_avg": 0.3124888241291046, "step": 200, "valid_targets_mean": 5489.0, "valid_targets_min": 3469 }, { "epoch": 0.6487341772151899, "grad_norm": 0.5792807141463496, "learning_rate": 3.6756756756756765e-05, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.3375263214111328, "step": 205, "valid_targets_mean": 6183.4, "valid_targets_min": 1949 }, { "epoch": 0.6645569620253164, "grad_norm": 0.5605895836940232, "learning_rate": 3.7657657657657664e-05, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.3439105153083801, "step": 210, "valid_targets_mean": 6067.1, "valid_targets_min": 3691 }, { "epoch": 0.680379746835443, "grad_norm": 0.5409677012753102, "learning_rate": 3.855855855855856e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.32987433671951294, "step": 215, "valid_targets_mean": 5943.6, "valid_targets_min": 2565 }, { "epoch": 0.6962025316455697, "grad_norm": 0.5651963802609234, "learning_rate": 3.945945945945946e-05, "loss": 0.3547, "loss_nan_ranks": 0, "loss_rank_avg": 0.3495904207229614, "step": 220, "valid_targets_mean": 5503.1, "valid_targets_min": 769 }, { "epoch": 0.7120253164556962, "grad_norm": 0.6159705821271058, "learning_rate": 3.999990030962651e-05, "loss": 0.3513, "loss_nan_ranks": 0, "loss_rank_avg": 0.3498522639274597, "step": 225, "valid_targets_mean": 5073.9, "valid_targets_min": 916 }, { "epoch": 0.7278481012658228, "grad_norm": 0.5769256804710682, "learning_rate": 3.9998778804338035e-05, "loss": 0.3352, "loss_nan_ranks": 0, "loss_rank_avg": 0.3386867046356201, "step": 230, "valid_targets_mean": 5822.4, "valid_targets_min": 823 }, { "epoch": 0.7436708860759493, "grad_norm": 0.5997266023641833, "learning_rate": 3.9996411250903884e-05, "loss": 0.338, "loss_nan_ranks": 0, "loss_rank_avg": 0.32479092478752136, "step": 235, "valid_targets_mean": 5829.8, "valid_targets_min": 2857 }, { "epoch": 0.759493670886076, "grad_norm": 0.5809144885862758, "learning_rate": 3.9992797796837354e-05, "loss": 0.3587, "loss_nan_ranks": 0, "loss_rank_avg": 0.3352227807044983, "step": 240, "valid_targets_mean": 5659.2, "valid_targets_min": 1761 }, { "epoch": 0.7753164556962026, "grad_norm": 0.5987836701077235, "learning_rate": 3.9987938667279065e-05, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.33761051297187805, "step": 245, "valid_targets_mean": 6031.9, "valid_targets_min": 650 }, { "epoch": 0.7911392405063291, "grad_norm": 0.5120036432889168, "learning_rate": 3.998183416498299e-05, "loss": 0.3385, "loss_nan_ranks": 0, "loss_rank_avg": 0.32812052965164185, "step": 250, "valid_targets_mean": 6019.6, "valid_targets_min": 3347 }, { "epoch": 0.8069620253164557, "grad_norm": 0.5533906259307175, "learning_rate": 3.9974484670297515e-05, "loss": 0.3453, "loss_nan_ranks": 0, "loss_rank_avg": 0.33938735723495483, "step": 255, "valid_targets_mean": 6177.3, "valid_targets_min": 2736 }, { "epoch": 0.8227848101265823, "grad_norm": 0.5463218213680792, "learning_rate": 3.996589064114183e-05, "loss": 0.3388, "loss_nan_ranks": 0, "loss_rank_avg": 0.33829447627067566, "step": 260, "valid_targets_mean": 5798.7, "valid_targets_min": 2076 }, { "epoch": 0.8386075949367089, "grad_norm": 0.5858802651211497, "learning_rate": 3.995605261297733e-05, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.32265397906303406, "step": 265, "valid_targets_mean": 5114.2, "valid_targets_min": 669 }, { "epoch": 0.8544303797468354, "grad_norm": 0.5957957307763452, "learning_rate": 3.994497119877429e-05, "loss": 0.3462, "loss_nan_ranks": 0, "loss_rank_avg": 0.36409419775009155, "step": 270, "valid_targets_mean": 5744.9, "valid_targets_min": 2013 }, { "epoch": 0.870253164556962, "grad_norm": 0.5392854104650391, "learning_rate": 3.9932647088973635e-05, "loss": 0.3229, "loss_nan_ranks": 0, "loss_rank_avg": 0.3287871181964874, "step": 275, "valid_targets_mean": 5633.2, "valid_targets_min": 1960 }, { "epoch": 0.8860759493670886, "grad_norm": 0.544848398408457, "learning_rate": 3.9919081051443974e-05, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.3490983247756958, "step": 280, "valid_targets_mean": 6091.4, "valid_targets_min": 2448 }, { "epoch": 0.9018987341772152, "grad_norm": 0.5207114070396386, "learning_rate": 3.990427393143369e-05, "loss": 0.337, "loss_nan_ranks": 0, "loss_rank_avg": 0.3348560333251953, "step": 285, "valid_targets_mean": 5576.4, "valid_targets_min": 886 }, { "epoch": 0.9177215189873418, "grad_norm": 0.5913839083299426, "learning_rate": 3.988822665151836e-05, "loss": 0.3334, "loss_nan_ranks": 0, "loss_rank_avg": 0.35333555936813354, "step": 290, "valid_targets_mean": 5589.2, "valid_targets_min": 766 }, { "epoch": 0.9335443037974683, "grad_norm": 0.6143720688184718, "learning_rate": 3.987094021154319e-05, "loss": 0.3388, "loss_nan_ranks": 0, "loss_rank_avg": 0.3340070843696594, "step": 295, "valid_targets_mean": 5667.8, "valid_targets_min": 2662 }, { "epoch": 0.9493670886075949, "grad_norm": 0.5592248016927946, "learning_rate": 3.985241568856077e-05, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.30103063583374023, "step": 300, "valid_targets_mean": 5012.6, "valid_targets_min": 2048 }, { "epoch": 0.9651898734177216, "grad_norm": 0.5453255678206526, "learning_rate": 3.983265423676396e-05, "loss": 0.3393, "loss_nan_ranks": 0, "loss_rank_avg": 0.29531943798065186, "step": 305, "valid_targets_mean": 5888.4, "valid_targets_min": 1837 }, { "epoch": 0.9810126582278481, "grad_norm": 0.5365359931030111, "learning_rate": 3.9811657087413955e-05, "loss": 0.3291, "loss_nan_ranks": 0, "loss_rank_avg": 0.32722777128219604, "step": 310, "valid_targets_mean": 5922.3, "valid_targets_min": 1486 }, { "epoch": 0.9968354430379747, "grad_norm": 0.5234404324989647, "learning_rate": 3.9789425548763574e-05, "loss": 0.3202, "loss_nan_ranks": 0, "loss_rank_avg": 0.30988502502441406, "step": 315, "valid_targets_mean": 6443.0, "valid_targets_min": 3893 }, { "epoch": 1.0126582278481013, "grad_norm": 0.5183687500516394, "learning_rate": 3.976596100597579e-05, "loss": 0.3204, "loss_nan_ranks": 0, "loss_rank_avg": 0.3249934911727905, "step": 320, "valid_targets_mean": 5519.9, "valid_targets_min": 1847 }, { "epoch": 1.0284810126582278, "grad_norm": 0.5331896984808763, "learning_rate": 3.974126492103736e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.3015314042568207, "step": 325, "valid_targets_mean": 6262.5, "valid_targets_min": 2170 }, { "epoch": 1.0443037974683544, "grad_norm": 0.5855356182197418, "learning_rate": 3.971533883266778e-05, "loss": 0.3294, "loss_nan_ranks": 0, "loss_rank_avg": 0.3428266644477844, "step": 330, "valid_targets_mean": 4937.9, "valid_targets_min": 1619 }, { "epoch": 1.0601265822784811, "grad_norm": 0.5338122150976636, "learning_rate": 3.9688184356223406e-05, "loss": 0.3224, "loss_nan_ranks": 0, "loss_rank_avg": 0.31056129932403564, "step": 335, "valid_targets_mean": 5959.5, "valid_targets_min": 3731 }, { "epoch": 1.0759493670886076, "grad_norm": 0.5365587414802077, "learning_rate": 3.9659803183596794e-05, "loss": 0.3242, "loss_nan_ranks": 0, "loss_rank_avg": 0.33881163597106934, "step": 340, "valid_targets_mean": 6117.9, "valid_targets_min": 4169 }, { "epoch": 1.0917721518987342, "grad_norm": 0.5883328441611787, "learning_rate": 3.963019708311129e-05, "loss": 0.3151, "loss_nan_ranks": 0, "loss_rank_avg": 0.2953089475631714, "step": 345, "valid_targets_mean": 5483.4, "valid_targets_min": 3383 }, { "epoch": 1.1075949367088607, "grad_norm": 0.5639266443192867, "learning_rate": 3.9599367899410865e-05, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.3456162214279175, "step": 350, "valid_targets_mean": 5594.0, "valid_targets_min": 2189 }, { "epoch": 1.1234177215189873, "grad_norm": 0.4882291609214383, "learning_rate": 3.956731755334516e-05, "loss": 0.3251, "loss_nan_ranks": 0, "loss_rank_avg": 0.30995047092437744, "step": 355, "valid_targets_mean": 6331.2, "valid_targets_min": 2270 }, { "epoch": 1.139240506329114, "grad_norm": 0.5272761657710062, "learning_rate": 3.953404804184982e-05, "loss": 0.313, "loss_nan_ranks": 0, "loss_rank_avg": 0.3174111247062683, "step": 360, "valid_targets_mean": 5742.4, "valid_targets_min": 3466 }, { "epoch": 1.1550632911392404, "grad_norm": 0.5368848055456228, "learning_rate": 3.949956143782208e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.32597553730010986, "step": 365, "valid_targets_mean": 6278.2, "valid_targets_min": 809 }, { "epoch": 1.1708860759493671, "grad_norm": 0.46231267116022384, "learning_rate": 3.946385988999158e-05, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.2897875905036926, "step": 370, "valid_targets_mean": 6156.8, "valid_targets_min": 2261 }, { "epoch": 1.1867088607594938, "grad_norm": 0.5279582306080264, "learning_rate": 3.942694562278652e-05, "loss": 0.3228, "loss_nan_ranks": 0, "loss_rank_avg": 0.33394286036491394, "step": 375, "valid_targets_mean": 5678.4, "valid_targets_min": 3621 }, { "epoch": 1.2025316455696202, "grad_norm": 0.5047890297509585, "learning_rate": 3.938882093619505e-05, "loss": 0.3206, "loss_nan_ranks": 0, "loss_rank_avg": 0.32703208923339844, "step": 380, "valid_targets_mean": 5641.8, "valid_targets_min": 677 }, { "epoch": 1.2183544303797469, "grad_norm": 0.5044680379524039, "learning_rate": 3.934948820562196e-05, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.3180423676967621, "step": 385, "valid_targets_mean": 6107.4, "valid_targets_min": 4917 }, { "epoch": 1.2341772151898733, "grad_norm": 0.5054464486878625, "learning_rate": 3.9308949881740684e-05, "loss": 0.3133, "loss_nan_ranks": 0, "loss_rank_avg": 0.3271169662475586, "step": 390, "valid_targets_mean": 5758.1, "valid_targets_min": 693 }, { "epoch": 1.25, "grad_norm": 0.4722764193174416, "learning_rate": 3.926720849034062e-05, "loss": 0.308, "loss_nan_ranks": 0, "loss_rank_avg": 0.2783935070037842, "step": 395, "valid_targets_mean": 5941.9, "valid_targets_min": 4132 }, { "epoch": 1.2658227848101267, "grad_norm": 0.5869772158307476, "learning_rate": 3.922426663216973e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.31632736325263977, "step": 400, "valid_targets_mean": 5153.4, "valid_targets_min": 806 }, { "epoch": 1.2816455696202531, "grad_norm": 0.4936808719044175, "learning_rate": 3.9180126982772524e-05, "loss": 0.313, "loss_nan_ranks": 0, "loss_rank_avg": 0.32065725326538086, "step": 405, "valid_targets_mean": 5738.6, "valid_targets_min": 3262 }, { "epoch": 1.2974683544303798, "grad_norm": 0.49156656318553427, "learning_rate": 3.9134792292323343e-05, "loss": 0.3147, "loss_nan_ranks": 0, "loss_rank_avg": 0.2900536060333252, "step": 410, "valid_targets_mean": 6236.5, "valid_targets_min": 2029 }, { "epoch": 1.3132911392405062, "grad_norm": 0.48351243867680455, "learning_rate": 3.9088265385454995e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.2834135591983795, "step": 415, "valid_targets_mean": 5412.0, "valid_targets_min": 753 }, { "epoch": 1.3291139240506329, "grad_norm": 0.5149369616768734, "learning_rate": 3.9040549161082804e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.3001251220703125, "step": 420, "valid_targets_mean": 6026.9, "valid_targets_min": 4356 }, { "epoch": 1.3449367088607596, "grad_norm": 0.5056930922739988, "learning_rate": 3.8991646592223936e-05, "loss": 0.3226, "loss_nan_ranks": 0, "loss_rank_avg": 0.32380956411361694, "step": 425, "valid_targets_mean": 6292.7, "valid_targets_min": 5079 }, { "epoch": 1.360759493670886, "grad_norm": 0.4975035489093388, "learning_rate": 3.8941560725812196e-05, "loss": 0.316, "loss_nan_ranks": 0, "loss_rank_avg": 0.3131970167160034, "step": 430, "valid_targets_mean": 6082.8, "valid_targets_min": 4291 }, { "epoch": 1.3765822784810127, "grad_norm": 0.5135806794137311, "learning_rate": 3.889029468250819e-05, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.31978845596313477, "step": 435, "valid_targets_mean": 5666.0, "valid_targets_min": 3586 }, { "epoch": 1.3924050632911391, "grad_norm": 0.517191652020098, "learning_rate": 3.883785165650486e-05, "loss": 0.3227, "loss_nan_ranks": 0, "loss_rank_avg": 0.34643927216529846, "step": 440, "valid_targets_mean": 6099.8, "valid_targets_min": 4447 }, { "epoch": 1.4082278481012658, "grad_norm": 0.46886883431653514, "learning_rate": 3.878423491532848e-05, "loss": 0.3221, "loss_nan_ranks": 0, "loss_rank_avg": 0.29647165536880493, "step": 445, "valid_targets_mean": 5554.6, "valid_targets_min": 2158 }, { "epoch": 1.4240506329113924, "grad_norm": 0.5009776650584222, "learning_rate": 3.872944779963508e-05, "loss": 0.3069, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930678725242615, "step": 450, "valid_targets_mean": 5905.5, "valid_targets_min": 4156 }, { "epoch": 1.439873417721519, "grad_norm": 0.5581179183711339, "learning_rate": 3.8673493723002295e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.3513834476470947, "step": 455, "valid_targets_mean": 4625.1, "valid_targets_min": 628 }, { "epoch": 1.4556962025316456, "grad_norm": 0.4973056639296272, "learning_rate": 3.861637617171666e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.3165348172187805, "step": 460, "valid_targets_mean": 6393.6, "valid_targets_min": 842 }, { "epoch": 1.4715189873417722, "grad_norm": 0.5759427318216085, "learning_rate": 3.855809870455642e-05, "loss": 0.323, "loss_nan_ranks": 0, "loss_rank_avg": 0.3243919014930725, "step": 465, "valid_targets_mean": 5460.6, "valid_targets_min": 771 }, { "epoch": 1.4873417721518987, "grad_norm": 0.4546482939790815, "learning_rate": 3.8498664952569776e-05, "loss": 0.3156, "loss_nan_ranks": 0, "loss_rank_avg": 0.31235501170158386, "step": 470, "valid_targets_mean": 6463.9, "valid_targets_min": 3142 }, { "epoch": 1.5031645569620253, "grad_norm": 0.6343641310574493, "learning_rate": 3.843807861884866e-05, "loss": 0.3175, "loss_nan_ranks": 0, "loss_rank_avg": 0.2982757091522217, "step": 475, "valid_targets_mean": 4136.8, "valid_targets_min": 648 }, { "epoch": 1.518987341772152, "grad_norm": 0.5069046822030032, "learning_rate": 3.8376343478298016e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.29897549748420715, "step": 480, "valid_targets_mean": 6222.6, "valid_targets_min": 5441 }, { "epoch": 1.5348101265822784, "grad_norm": 0.5330238248658747, "learning_rate": 3.831346337740057e-05, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.31486159563064575, "step": 485, "valid_targets_mean": 5535.6, "valid_targets_min": 514 }, { "epoch": 1.5506329113924051, "grad_norm": 0.48002428336966424, "learning_rate": 3.824944223397721e-05, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.32473498582839966, "step": 490, "valid_targets_mean": 5520.2, "valid_targets_min": 806 }, { "epoch": 1.5664556962025316, "grad_norm": 0.46876258971251733, "learning_rate": 3.818428403694283e-05, "loss": 0.3074, "loss_nan_ranks": 0, "loss_rank_avg": 0.3067629933357239, "step": 495, "valid_targets_mean": 6308.1, "valid_targets_min": 4391 }, { "epoch": 1.5822784810126582, "grad_norm": 0.5196291770297198, "learning_rate": 3.811799284605787e-05, "loss": 0.3081, "loss_nan_ranks": 0, "loss_rank_avg": 0.3322131633758545, "step": 500, "valid_targets_mean": 5697.0, "valid_targets_min": 799 }, { "epoch": 1.5981012658227849, "grad_norm": 0.523916980014032, "learning_rate": 3.805057279167529e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.3147963881492615, "step": 505, "valid_targets_mean": 5464.8, "valid_targets_min": 744 }, { "epoch": 1.6139240506329116, "grad_norm": 0.5145689742215844, "learning_rate": 3.798202807448328e-05, "loss": 0.3121, "loss_nan_ranks": 0, "loss_rank_avg": 0.3126614987850189, "step": 510, "valid_targets_mean": 5357.8, "valid_targets_min": 2133 }, { "epoch": 1.629746835443038, "grad_norm": 0.522545617708332, "learning_rate": 3.791236296524349e-05, "loss": 0.3017, "loss_nan_ranks": 0, "loss_rank_avg": 0.31563282012939453, "step": 515, "valid_targets_mean": 6165.4, "valid_targets_min": 4172 }, { "epoch": 1.6455696202531644, "grad_norm": 0.4587360075244091, "learning_rate": 3.7841581804524966e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.3099702298641205, "step": 520, "valid_targets_mean": 6268.2, "valid_targets_min": 5153 }, { "epoch": 1.6613924050632911, "grad_norm": 0.48285835961523327, "learning_rate": 3.776968900243369e-05, "loss": 0.3118, "loss_nan_ranks": 0, "loss_rank_avg": 0.3159397840499878, "step": 525, "valid_targets_mean": 6025.0, "valid_targets_min": 882 }, { "epoch": 1.6772151898734178, "grad_norm": 0.5027822640943034, "learning_rate": 3.7696689038337807e-05, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.3112294673919678, "step": 530, "valid_targets_mean": 6107.8, "valid_targets_min": 3057 }, { "epoch": 1.6930379746835444, "grad_norm": 0.49706927167370746, "learning_rate": 3.762258646058854e-05, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.2948613166809082, "step": 535, "valid_targets_mean": 5631.9, "valid_targets_min": 2175 }, { "epoch": 1.7088607594936709, "grad_norm": 0.5035384651568894, "learning_rate": 3.754738588623679e-05, "loss": 0.3039, "loss_nan_ranks": 0, "loss_rank_avg": 0.3071019649505615, "step": 540, "valid_targets_mean": 6088.6, "valid_targets_min": 2811 }, { "epoch": 1.7246835443037973, "grad_norm": 0.5147424772974462, "learning_rate": 3.747109200074544e-05, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.2903684973716736, "step": 545, "valid_targets_mean": 5766.8, "valid_targets_min": 1985 }, { "epoch": 1.740506329113924, "grad_norm": 0.5282616133475547, "learning_rate": 3.739370955769748e-05, "loss": 0.3054, "loss_nan_ranks": 0, "loss_rank_avg": 0.305397093296051, "step": 550, "valid_targets_mean": 5689.4, "valid_targets_min": 2557 }, { "epoch": 1.7563291139240507, "grad_norm": 0.4682192117249516, "learning_rate": 3.73152433784998e-05, "loss": 0.2931, "loss_nan_ranks": 0, "loss_rank_avg": 0.3013456165790558, "step": 555, "valid_targets_mean": 5368.7, "valid_targets_min": 1986 }, { "epoch": 1.7721518987341773, "grad_norm": 0.44057671857937225, "learning_rate": 3.723569835208276e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.2914057672023773, "step": 560, "valid_targets_mean": 6597.2, "valid_targets_min": 5193 }, { "epoch": 1.7879746835443038, "grad_norm": 0.4796159961996015, "learning_rate": 3.715507943459561e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.2853228449821472, "step": 565, "valid_targets_mean": 5998.0, "valid_targets_min": 3590 }, { "epoch": 1.8037974683544302, "grad_norm": 0.4610958393107323, "learning_rate": 3.70733916490977e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.2611140012741089, "step": 570, "valid_targets_mean": 5264.6, "valid_targets_min": 2780 }, { "epoch": 1.8196202531645569, "grad_norm": 0.49037791791585045, "learning_rate": 3.699064008524548e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.32969820499420166, "step": 575, "valid_targets_mean": 5529.9, "valid_targets_min": 2026 }, { "epoch": 1.8354430379746836, "grad_norm": 0.4797430506584315, "learning_rate": 3.690682989897539e-05, "loss": 0.2992, "loss_nan_ranks": 0, "loss_rank_avg": 0.2864863872528076, "step": 580, "valid_targets_mean": 5474.2, "valid_targets_min": 2469 }, { "epoch": 1.8512658227848102, "grad_norm": 0.49388198180056775, "learning_rate": 3.682196631218267e-05, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.3122454881668091, "step": 585, "valid_targets_mean": 5575.6, "valid_targets_min": 2994 }, { "epoch": 1.8670886075949367, "grad_norm": 0.45749314010557557, "learning_rate": 3.67360546123959e-05, "loss": 0.3121, "loss_nan_ranks": 0, "loss_rank_avg": 0.2997322082519531, "step": 590, "valid_targets_mean": 5467.4, "valid_targets_min": 767 }, { "epoch": 1.8829113924050633, "grad_norm": 0.45411543089255624, "learning_rate": 3.6649100152447636e-05, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.30825352668762207, "step": 595, "valid_targets_mean": 6071.1, "valid_targets_min": 3451 }, { "epoch": 1.8987341772151898, "grad_norm": 0.44164946101678815, "learning_rate": 3.6561108350140876e-05, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.2762806713581085, "step": 600, "valid_targets_mean": 6110.0, "valid_targets_min": 4094 }, { "epoch": 1.9145569620253164, "grad_norm": 0.4843182843398918, "learning_rate": 3.647208468791147e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.3104550838470459, "step": 605, "valid_targets_mean": 5450.8, "valid_targets_min": 2042 }, { "epoch": 1.9303797468354431, "grad_norm": 0.5246679183938616, "learning_rate": 3.638203471248656e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.311735063791275, "step": 610, "valid_targets_mean": 6342.0, "valid_targets_min": 4203 }, { "epoch": 1.9462025316455698, "grad_norm": 0.4739098308477039, "learning_rate": 3.6290964034539e-05, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.2983429729938507, "step": 615, "valid_targets_mean": 6205.6, "valid_targets_min": 805 }, { "epoch": 1.9620253164556962, "grad_norm": 0.43160749249022473, "learning_rate": 3.61988783283377e-05, "loss": 0.3155, "loss_nan_ranks": 0, "loss_rank_avg": 0.31190475821495056, "step": 620, "valid_targets_mean": 6585.2, "valid_targets_min": 3950 }, { "epoch": 1.9778481012658227, "grad_norm": 0.48372069468120066, "learning_rate": 3.610578333139418e-05, "loss": 0.2993, "loss_nan_ranks": 0, "loss_rank_avg": 0.30041295289993286, "step": 625, "valid_targets_mean": 5826.0, "valid_targets_min": 2238 }, { "epoch": 1.9936708860759493, "grad_norm": 0.5074154638338687, "learning_rate": 3.601168484410503e-05, "loss": 0.2986, "loss_nan_ranks": 0, "loss_rank_avg": 0.29460474848747253, "step": 630, "valid_targets_mean": 5909.8, "valid_targets_min": 3580 }, { "epoch": 2.009493670886076, "grad_norm": 0.4582513785903484, "learning_rate": 3.591658872939051e-05, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.2935415804386139, "step": 635, "valid_targets_mean": 6060.9, "valid_targets_min": 685 }, { "epoch": 2.0253164556962027, "grad_norm": 0.4865535063786641, "learning_rate": 3.582050091232927e-05, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.30103033781051636, "step": 640, "valid_targets_mean": 5298.8, "valid_targets_min": 2244 }, { "epoch": 2.041139240506329, "grad_norm": 0.4899472148100494, "learning_rate": 3.572342737978919e-05, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.2633832097053528, "step": 645, "valid_targets_mean": 5349.4, "valid_targets_min": 1965 }, { "epoch": 2.0569620253164556, "grad_norm": 0.4592971443361485, "learning_rate": 3.562537418005433e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.26928383111953735, "step": 650, "valid_targets_mean": 5509.2, "valid_targets_min": 767 }, { "epoch": 2.0727848101265822, "grad_norm": 0.45093775520530355, "learning_rate": 3.5526347422448115e-05, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.30223190784454346, "step": 655, "valid_targets_mean": 5825.9, "valid_targets_min": 3179 }, { "epoch": 2.088607594936709, "grad_norm": 0.46619156750938906, "learning_rate": 3.5426353276952664e-05, "loss": 0.297, "loss_nan_ranks": 0, "loss_rank_avg": 0.31004923582077026, "step": 660, "valid_targets_mean": 6050.8, "valid_targets_min": 836 }, { "epoch": 2.1044303797468356, "grad_norm": 0.5198681015561224, "learning_rate": 3.532539797382438e-05, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.30181536078453064, "step": 665, "valid_targets_mean": 5796.1, "valid_targets_min": 2469 }, { "epoch": 2.1202531645569622, "grad_norm": 0.48495786428109977, "learning_rate": 3.5223487803205745e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.28098708391189575, "step": 670, "valid_targets_mean": 5556.3, "valid_targets_min": 3519 }, { "epoch": 2.1360759493670884, "grad_norm": 0.4697953936662229, "learning_rate": 3.512062911473342e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.2885569930076599, "step": 675, "valid_targets_mean": 5751.8, "valid_targets_min": 3446 }, { "epoch": 2.151898734177215, "grad_norm": 0.4778592999393128, "learning_rate": 3.501682831714263e-05, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.2793217897415161, "step": 680, "valid_targets_mean": 6121.1, "valid_targets_min": 5274 }, { "epoch": 2.1677215189873418, "grad_norm": 0.49097382184697463, "learning_rate": 3.491209187786784e-05, "loss": 0.2908, "loss_nan_ranks": 0, "loss_rank_avg": 0.2594742774963379, "step": 685, "valid_targets_mean": 5144.1, "valid_targets_min": 1753 }, { "epoch": 2.1835443037974684, "grad_norm": 0.48053227810239074, "learning_rate": 3.480642632263981e-05, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.3140348792076111, "step": 690, "valid_targets_mean": 5762.4, "valid_targets_min": 1713 }, { "epoch": 2.199367088607595, "grad_norm": 0.4554353384848606, "learning_rate": 3.469983823507898e-05, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.29892221093177795, "step": 695, "valid_targets_mean": 5548.7, "valid_targets_min": 642 }, { "epoch": 2.2151898734177213, "grad_norm": 0.47227747671392983, "learning_rate": 3.4592334256285306e-05, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.2790769338607788, "step": 700, "valid_targets_mean": 5659.8, "valid_targets_min": 2595 }, { "epoch": 2.231012658227848, "grad_norm": 0.46014971292294476, "learning_rate": 3.4483921084424446e-05, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.2855474352836609, "step": 705, "valid_targets_mean": 5672.0, "valid_targets_min": 2942 }, { "epoch": 2.2468354430379747, "grad_norm": 0.45834270629586105, "learning_rate": 3.437460547431044e-05, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.2855965793132782, "step": 710, "valid_targets_mean": 6076.5, "valid_targets_min": 2378 }, { "epoch": 2.2626582278481013, "grad_norm": 0.4760222160081626, "learning_rate": 3.426439423698483e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.30656492710113525, "step": 715, "valid_targets_mean": 6437.0, "valid_targets_min": 4826 }, { "epoch": 2.278481012658228, "grad_norm": 0.46990296888744815, "learning_rate": 3.41532942392923e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.3031311333179474, "step": 720, "valid_targets_mean": 6133.1, "valid_targets_min": 3111 }, { "epoch": 2.2943037974683547, "grad_norm": 0.4571705839965309, "learning_rate": 3.404131240345281e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.29287195205688477, "step": 725, "valid_targets_mean": 6849.6, "valid_targets_min": 5307 }, { "epoch": 2.310126582278481, "grad_norm": 0.45070130004909464, "learning_rate": 3.3928455706630354e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.29879462718963623, "step": 730, "valid_targets_mean": 6255.3, "valid_targets_min": 4712 }, { "epoch": 2.3259493670886076, "grad_norm": 0.46137028628139504, "learning_rate": 3.3814731180498166e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.2994469702243805, "step": 735, "valid_targets_mean": 6294.0, "valid_targets_min": 3962 }, { "epoch": 2.3417721518987342, "grad_norm": 0.46762059401539763, "learning_rate": 3.370014591080064e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.26314711570739746, "step": 740, "valid_targets_mean": 5497.4, "valid_targets_min": 2189 }, { "epoch": 2.357594936708861, "grad_norm": 0.4572706524806831, "learning_rate": 3.358470703691184e-05, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.28679436445236206, "step": 745, "valid_targets_mean": 5952.6, "valid_targets_min": 3586 }, { "epoch": 2.3734177215189876, "grad_norm": 0.4595477740780959, "learning_rate": 3.34684217513907e-05, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.2892051041126251, "step": 750, "valid_targets_mean": 5905.7, "valid_targets_min": 2447 }, { "epoch": 2.3892405063291138, "grad_norm": 0.46680713190521667, "learning_rate": 3.335129729953282e-05, "loss": 0.2934, "loss_nan_ranks": 0, "loss_rank_avg": 0.31123167276382446, "step": 755, "valid_targets_mean": 6154.4, "valid_targets_min": 4720 }, { "epoch": 2.4050632911392404, "grad_norm": 0.486405918820402, "learning_rate": 3.323334097891908e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.2746376097202301, "step": 760, "valid_targets_mean": 5427.4, "valid_targets_min": 2031 }, { "epoch": 2.420886075949367, "grad_norm": 0.48586284114044387, "learning_rate": 3.311456013896099e-05, "loss": 0.2919, "loss_nan_ranks": 0, "loss_rank_avg": 0.3024941384792328, "step": 765, "valid_targets_mean": 5223.7, "valid_targets_min": 778 }, { "epoch": 2.4367088607594938, "grad_norm": 0.5025764682649462, "learning_rate": 3.299496218044269e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.315251886844635, "step": 770, "valid_targets_mean": 4921.6, "valid_targets_min": 596 }, { "epoch": 2.4525316455696204, "grad_norm": 0.4549092472858824, "learning_rate": 3.287455455505991e-05, "loss": 0.2828, "loss_nan_ranks": 0, "loss_rank_avg": 0.293832927942276, "step": 775, "valid_targets_mean": 6210.0, "valid_targets_min": 775 }, { "epoch": 2.4683544303797467, "grad_norm": 0.5687625275372207, "learning_rate": 3.275334476495564e-05, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.25202175974845886, "step": 780, "valid_targets_mean": 5337.6, "valid_targets_min": 2448 }, { "epoch": 2.4841772151898733, "grad_norm": 0.5152415549279067, "learning_rate": 3.2631340362252725e-05, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.29954302310943604, "step": 785, "valid_targets_mean": 4789.7, "valid_targets_min": 743 }, { "epoch": 2.5, "grad_norm": 0.4500139404772333, "learning_rate": 3.25085489485833e-05, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.3050997257232666, "step": 790, "valid_targets_mean": 6118.1, "valid_targets_min": 5123 }, { "epoch": 2.5158227848101267, "grad_norm": 0.4158348076851014, "learning_rate": 3.238497817461519e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.27680695056915283, "step": 795, "valid_targets_mean": 6113.9, "valid_targets_min": 3881 }, { "epoch": 2.5316455696202533, "grad_norm": 0.4603920238857949, "learning_rate": 3.226063573957518e-05, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.30450594425201416, "step": 800, "valid_targets_mean": 5632.4, "valid_targets_min": 2030 }, { "epoch": 2.5474683544303796, "grad_norm": 0.42817337943378414, "learning_rate": 3.2135529390769364e-05, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.30379846692085266, "step": 805, "valid_targets_mean": 6379.4, "valid_targets_min": 2224 }, { "epoch": 2.5632911392405062, "grad_norm": 0.4610425941332099, "learning_rate": 3.200966692310038e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.2888951599597931, "step": 810, "valid_targets_mean": 6147.2, "valid_targets_min": 2198 }, { "epoch": 2.579113924050633, "grad_norm": 0.4942290487075236, "learning_rate": 3.1883056178581806e-05, "loss": 0.282, "loss_nan_ranks": 0, "loss_rank_avg": 0.28200429677963257, "step": 815, "valid_targets_mean": 5177.9, "valid_targets_min": 685 }, { "epoch": 2.5949367088607596, "grad_norm": 0.4388572833069293, "learning_rate": 3.1755705045849465e-05, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.3148422837257385, "step": 820, "valid_targets_mean": 6577.1, "valid_targets_min": 3687 }, { "epoch": 2.6107594936708862, "grad_norm": 0.4512748381822771, "learning_rate": 3.162762145967001e-05, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.28762495517730713, "step": 825, "valid_targets_mean": 5885.2, "valid_targets_min": 2707 }, { "epoch": 2.6265822784810124, "grad_norm": 0.4612075125257181, "learning_rate": 3.149881340044646e-05, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.2912214398384094, "step": 830, "valid_targets_mean": 5434.2, "valid_targets_min": 766 }, { "epoch": 2.642405063291139, "grad_norm": 0.4802794790594333, "learning_rate": 3.1369288893721036e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.3072575628757477, "step": 835, "valid_targets_mean": 5911.4, "valid_targets_min": 1609 }, { "epoch": 2.6582278481012658, "grad_norm": 0.44392324432819513, "learning_rate": 3.123905600967506e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.2849636971950531, "step": 840, "valid_targets_mean": 5639.6, "valid_targets_min": 2609 }, { "epoch": 2.6740506329113924, "grad_norm": 0.4632523986474561, "learning_rate": 3.110812286262618e-05, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.2830730974674225, "step": 845, "valid_targets_mean": 5890.8, "valid_targets_min": 3121 }, { "epoch": 2.689873417721519, "grad_norm": 0.4501317007069297, "learning_rate": 3.097649761052278e-05, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.3051697313785553, "step": 850, "valid_targets_mean": 5598.3, "valid_targets_min": 2592 }, { "epoch": 2.7056962025316453, "grad_norm": 0.46325393649233176, "learning_rate": 3.084418845443566e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.28344061970710754, "step": 855, "valid_targets_mean": 5272.2, "valid_targets_min": 570 }, { "epoch": 2.721518987341772, "grad_norm": 0.43355255805031406, "learning_rate": 3.0711203638047124e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.280727356672287, "step": 860, "valid_targets_mean": 6016.7, "valid_targets_min": 3875 }, { "epoch": 2.7373417721518987, "grad_norm": 0.5243573469765044, "learning_rate": 3.05775514471373e-05, "loss": 0.2819, "loss_nan_ranks": 0, "loss_rank_avg": 0.2778775095939636, "step": 865, "valid_targets_mean": 5218.6, "valid_targets_min": 805 }, { "epoch": 2.7531645569620253, "grad_norm": 0.45747491693031095, "learning_rate": 3.0443240209067863e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.25808537006378174, "step": 870, "valid_targets_mean": 5862.0, "valid_targets_min": 2501 }, { "epoch": 2.768987341772152, "grad_norm": 0.49891165828308487, "learning_rate": 3.0308278292263266e-05, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.29467886686325073, "step": 875, "valid_targets_mean": 5912.4, "valid_targets_min": 3287 }, { "epoch": 2.7848101265822782, "grad_norm": 0.48235098411869953, "learning_rate": 3.0172674105689256e-05, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.31870269775390625, "step": 880, "valid_targets_mean": 5790.2, "valid_targets_min": 642 }, { "epoch": 2.8006329113924053, "grad_norm": 0.41869426026137824, "learning_rate": 3.003643609832899e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.27100610733032227, "step": 885, "valid_targets_mean": 5882.7, "valid_targets_min": 2918 }, { "epoch": 2.8164556962025316, "grad_norm": 0.49003311128203797, "learning_rate": 2.98995727586566e-05, "loss": 0.2965, "loss_nan_ranks": 0, "loss_rank_avg": 0.28583741188049316, "step": 890, "valid_targets_mean": 5098.6, "valid_targets_min": 1482 }, { "epoch": 2.8322784810126582, "grad_norm": 0.4911196460814385, "learning_rate": 2.9762092614108288e-05, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.2707781195640564, "step": 895, "valid_targets_mean": 5186.9, "valid_targets_min": 2133 }, { "epoch": 2.848101265822785, "grad_norm": 0.4509284368354034, "learning_rate": 2.9624004230551056e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.2792275547981262, "step": 900, "valid_targets_mean": 6446.4, "valid_targets_min": 4394 }, { "epoch": 2.8639240506329116, "grad_norm": 0.4697430774538071, "learning_rate": 2.9485316211748947e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.2734847664833069, "step": 905, "valid_targets_mean": 5766.9, "valid_targets_min": 3057 }, { "epoch": 2.879746835443038, "grad_norm": 0.4562524053984699, "learning_rate": 2.934603719882703e-05, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.3326224684715271, "step": 910, "valid_targets_mean": 5974.5, "valid_targets_min": 465 }, { "epoch": 2.8955696202531644, "grad_norm": 0.45011259088694505, "learning_rate": 2.920617586973297e-05, "loss": 0.2885, "loss_nan_ranks": 0, "loss_rank_avg": 0.2704487442970276, "step": 915, "valid_targets_mean": 5862.4, "valid_targets_min": 2292 }, { "epoch": 2.911392405063291, "grad_norm": 0.4772485229953272, "learning_rate": 2.9065740938696333e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.2805355191230774, "step": 920, "valid_targets_mean": 5758.2, "valid_targets_min": 3948 }, { "epoch": 2.9272151898734178, "grad_norm": 0.4727148738831468, "learning_rate": 2.8924741155685675e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.30549630522727966, "step": 925, "valid_targets_mean": 6252.5, "valid_targets_min": 1967 }, { "epoch": 2.9430379746835444, "grad_norm": 0.45775895170790065, "learning_rate": 2.8783185305863307e-05, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.2964749336242676, "step": 930, "valid_targets_mean": 5598.0, "valid_targets_min": 834 }, { "epoch": 2.958860759493671, "grad_norm": 0.4337416998396072, "learning_rate": 2.8641082209037984e-05, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.2781994938850403, "step": 935, "valid_targets_mean": 6104.6, "valid_targets_min": 2587 }, { "epoch": 2.9746835443037973, "grad_norm": 0.43295170811481387, "learning_rate": 2.8498440719115344e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.29673928022384644, "step": 940, "valid_targets_mean": 6292.1, "valid_targets_min": 1984 }, { "epoch": 2.990506329113924, "grad_norm": 0.44789535466180536, "learning_rate": 2.8355269723546234e-05, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.27013325691223145, "step": 945, "valid_targets_mean": 5349.1, "valid_targets_min": 1760 }, { "epoch": 3.0063291139240507, "grad_norm": 0.42162207814788233, "learning_rate": 2.821157814277304e-05, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.27115151286125183, "step": 950, "valid_targets_mean": 5983.3, "valid_targets_min": 3679 }, { "epoch": 3.0221518987341773, "grad_norm": 0.4416759250384479, "learning_rate": 2.806737492967378e-05, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.2797127366065979, "step": 955, "valid_targets_mean": 6223.0, "valid_targets_min": 3355 }, { "epoch": 3.037974683544304, "grad_norm": 0.4679293009398521, "learning_rate": 2.7922669069004394e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.27050942182540894, "step": 960, "valid_targets_mean": 5775.5, "valid_targets_min": 2546 }, { "epoch": 3.0537974683544302, "grad_norm": 0.41810285637714373, "learning_rate": 2.7777469576838868e-05, "loss": 0.2876, "loss_nan_ranks": 0, "loss_rank_avg": 0.2595946192741394, "step": 965, "valid_targets_mean": 5585.8, "valid_targets_min": 2470 }, { "epoch": 3.069620253164557, "grad_norm": 0.41670836098856057, "learning_rate": 2.76317855000075e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.26501375436782837, "step": 970, "valid_targets_mean": 6174.8, "valid_targets_min": 3179 }, { "epoch": 3.0854430379746836, "grad_norm": 0.4176187275484247, "learning_rate": 2.7485625915533215e-05, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.2671218514442444, "step": 975, "valid_targets_mean": 6132.2, "valid_targets_min": 2633 }, { "epoch": 3.1012658227848102, "grad_norm": 0.46082577065514035, "learning_rate": 2.7338999930066016e-05, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930499315261841, "step": 980, "valid_targets_mean": 5562.1, "valid_targets_min": 809 }, { "epoch": 3.117088607594937, "grad_norm": 0.42281633576231314, "learning_rate": 2.719191667931561e-05, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.26106882095336914, "step": 985, "valid_targets_mean": 5840.2, "valid_targets_min": 900 }, { "epoch": 3.132911392405063, "grad_norm": 0.47392007897126087, "learning_rate": 2.7044385327482135e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.29251885414123535, "step": 990, "valid_targets_mean": 5295.4, "valid_targets_min": 548 }, { "epoch": 3.1487341772151898, "grad_norm": 0.47021600771641175, "learning_rate": 2.689641506668525e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.290133535861969, "step": 995, "valid_targets_mean": 5718.2, "valid_targets_min": 849 }, { "epoch": 3.1645569620253164, "grad_norm": 0.45553216877342095, "learning_rate": 2.674801511639133e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.2877347767353058, "step": 1000, "valid_targets_mean": 6502.6, "valid_targets_min": 5276 }, { "epoch": 3.180379746835443, "grad_norm": 0.4491892439143873, "learning_rate": 2.6599194722839097e-05, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.28108590841293335, "step": 1005, "valid_targets_mean": 5940.3, "valid_targets_min": 1960 }, { "epoch": 3.1962025316455698, "grad_norm": 0.4448846946970026, "learning_rate": 2.64499631584635e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.2802794575691223, "step": 1010, "valid_targets_mean": 5671.4, "valid_targets_min": 2455 }, { "epoch": 3.212025316455696, "grad_norm": 0.4484367055515372, "learning_rate": 2.6300329721317973e-05, "loss": 0.2813, "loss_nan_ranks": 0, "loss_rank_avg": 0.26574909687042236, "step": 1015, "valid_targets_mean": 5304.2, "valid_targets_min": 789 }, { "epoch": 3.2278481012658227, "grad_norm": 0.43854176405636597, "learning_rate": 2.6150303734495138e-05, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.2753145694732666, "step": 1020, "valid_targets_mean": 5756.1, "valid_targets_min": 823 }, { "epoch": 3.2436708860759493, "grad_norm": 0.42425115614897546, "learning_rate": 2.599989454554587e-05, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.2607611417770386, "step": 1025, "valid_targets_mean": 5802.4, "valid_targets_min": 3111 }, { "epoch": 3.259493670886076, "grad_norm": 0.4504789142568739, "learning_rate": 2.584911152589695e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.28150200843811035, "step": 1030, "valid_targets_mean": 5944.2, "valid_targets_min": 650 }, { "epoch": 3.2753164556962027, "grad_norm": 0.4525200916510691, "learning_rate": 2.569796407026711e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.27071693539619446, "step": 1035, "valid_targets_mean": 5265.6, "valid_targets_min": 1782 }, { "epoch": 3.291139240506329, "grad_norm": 0.4478586364611807, "learning_rate": 2.5546461596081727e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.28119248151779175, "step": 1040, "valid_targets_mean": 5817.7, "valid_targets_min": 771 }, { "epoch": 3.3069620253164556, "grad_norm": 0.4994557894280622, "learning_rate": 2.539461354288602e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.2649917006492615, "step": 1045, "valid_targets_mean": 5387.4, "valid_targets_min": 2027 }, { "epoch": 3.3227848101265822, "grad_norm": 0.4212634476803461, "learning_rate": 2.5242429371756936e-05, "loss": 0.2861, "loss_nan_ranks": 0, "loss_rank_avg": 0.2844800353050232, "step": 1050, "valid_targets_mean": 6229.3, "valid_targets_min": 3601 }, { "epoch": 3.338607594936709, "grad_norm": 0.47147792069734795, "learning_rate": 2.508991856471366e-05, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.2720435559749603, "step": 1055, "valid_targets_mean": 5872.4, "valid_targets_min": 4683 }, { "epoch": 3.3544303797468356, "grad_norm": 0.45341683692445545, "learning_rate": 2.493709062412682e-05, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.2766611576080322, "step": 1060, "valid_targets_mean": 6110.9, "valid_targets_min": 4224 }, { "epoch": 3.370253164556962, "grad_norm": 0.42859174931725985, "learning_rate": 2.4783955072126436e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.2609805166721344, "step": 1065, "valid_targets_mean": 6118.9, "valid_targets_min": 4341 }, { "epoch": 3.3860759493670884, "grad_norm": 0.40346214436942013, "learning_rate": 2.463052145000863e-05, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.26767057180404663, "step": 1070, "valid_targets_mean": 6161.4, "valid_targets_min": 3469 }, { "epoch": 3.401898734177215, "grad_norm": 0.46918080352369473, "learning_rate": 2.4476799317641126e-05, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.30101579427719116, "step": 1075, "valid_targets_mean": 5820.3, "valid_targets_min": 685 }, { "epoch": 3.4177215189873418, "grad_norm": 0.4695439709744784, "learning_rate": 2.432279825286766e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.2902735769748688, "step": 1080, "valid_targets_mean": 5656.1, "valid_targets_min": 2328 }, { "epoch": 3.4335443037974684, "grad_norm": 0.4464240769598974, "learning_rate": 2.4168527850911167e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.27806729078292847, "step": 1085, "valid_targets_mean": 5907.1, "valid_targets_min": 1952 }, { "epoch": 3.449367088607595, "grad_norm": 0.45916771177387666, "learning_rate": 2.401399772377597e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.26612377166748047, "step": 1090, "valid_targets_mean": 5740.3, "valid_targets_min": 2251 }, { "epoch": 3.4651898734177213, "grad_norm": 0.43614438276566764, "learning_rate": 2.3859217499648893e-05, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.2967340052127838, "step": 1095, "valid_targets_mean": 5992.1, "valid_targets_min": 767 }, { "epoch": 3.481012658227848, "grad_norm": 0.42047467518959086, "learning_rate": 2.3704196822299322e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.25916093587875366, "step": 1100, "valid_targets_mean": 5764.1, "valid_targets_min": 1060 }, { "epoch": 3.4968354430379747, "grad_norm": 0.4842338297714059, "learning_rate": 2.3548945350478416e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.32087451219558716, "step": 1105, "valid_targets_mean": 5177.1, "valid_targets_min": 753 }, { "epoch": 3.5126582278481013, "grad_norm": 0.46656590339014214, "learning_rate": 2.3393472757317236e-05, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.295026957988739, "step": 1110, "valid_targets_mean": 5936.8, "valid_targets_min": 3333 }, { "epoch": 3.528481012658228, "grad_norm": 0.4972487400584799, "learning_rate": 2.323778872972408e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.2944778501987457, "step": 1115, "valid_targets_mean": 4811.2, "valid_targets_min": 877 }, { "epoch": 3.5443037974683547, "grad_norm": 0.45881784037617374, "learning_rate": 2.3081902967780935e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.2754046618938446, "step": 1120, "valid_targets_mean": 5554.3, "valid_targets_min": 2591 }, { "epoch": 3.560126582278481, "grad_norm": 0.43038062477562644, "learning_rate": 2.292582518413908e-05, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.2747959792613983, "step": 1125, "valid_targets_mean": 5968.6, "valid_targets_min": 3979 }, { "epoch": 3.5759493670886076, "grad_norm": 0.4607696578365557, "learning_rate": 2.2769565103413935e-05, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.25683754682540894, "step": 1130, "valid_targets_mean": 5161.8, "valid_targets_min": 1842 }, { "epoch": 3.5917721518987342, "grad_norm": 0.47711868798365914, "learning_rate": 2.2613132461579186e-05, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.28505629301071167, "step": 1135, "valid_targets_mean": 5645.9, "valid_targets_min": 706 }, { "epoch": 3.607594936708861, "grad_norm": 0.4546045209649017, "learning_rate": 2.2456537005360105e-05, "loss": 0.2861, "loss_nan_ranks": 0, "loss_rank_avg": 0.2820706069469452, "step": 1140, "valid_targets_mean": 6324.2, "valid_targets_min": 4468 }, { "epoch": 3.6234177215189876, "grad_norm": 0.4540725645210422, "learning_rate": 2.2299788491626362e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.30551356077194214, "step": 1145, "valid_targets_mean": 6043.6, "valid_targets_min": 1900 }, { "epoch": 3.6392405063291138, "grad_norm": 0.4607470691585838, "learning_rate": 2.2142896686784017e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.3159760534763336, "step": 1150, "valid_targets_mean": 5909.0, "valid_targets_min": 669 }, { "epoch": 3.6550632911392404, "grad_norm": 0.485657713940311, "learning_rate": 2.198587136616708e-05, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.2861446440219879, "step": 1155, "valid_targets_mean": 5887.2, "valid_targets_min": 1033 }, { "epoch": 3.670886075949367, "grad_norm": 0.44431348288850725, "learning_rate": 2.1828722313428425e-05, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.2906510829925537, "step": 1160, "valid_targets_mean": 6221.4, "valid_targets_min": 4137 }, { "epoch": 3.6867088607594938, "grad_norm": 0.43442541085036207, "learning_rate": 2.167145931993019e-05, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.2862897515296936, "step": 1165, "valid_targets_mean": 6012.8, "valid_targets_min": 2815 }, { "epoch": 3.7025316455696204, "grad_norm": 0.38176947662087063, "learning_rate": 2.151409218413374e-05, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.2606070041656494, "step": 1170, "valid_targets_mean": 6584.1, "valid_targets_min": 4706 }, { "epoch": 3.7183544303797467, "grad_norm": 0.4536298731246358, "learning_rate": 2.135663071098915e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.2756196856498718, "step": 1175, "valid_targets_mean": 5809.6, "valid_targets_min": 2501 }, { "epoch": 3.7341772151898733, "grad_norm": 0.44313775169197916, "learning_rate": 2.1199084711324298e-05, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.2668633759021759, "step": 1180, "valid_targets_mean": 5518.7, "valid_targets_min": 2497 }, { "epoch": 3.75, "grad_norm": 0.4299516471156008, "learning_rate": 2.1041464001233595e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.2561643719673157, "step": 1185, "valid_targets_mean": 5885.6, "valid_targets_min": 3359 }, { "epoch": 3.7658227848101267, "grad_norm": 0.4478929646947557, "learning_rate": 2.0883778401466364e-05, "loss": 0.279, "loss_nan_ranks": 0, "loss_rank_avg": 0.2736479341983795, "step": 1190, "valid_targets_mean": 5109.4, "valid_targets_min": 1954 }, { "epoch": 3.7816455696202533, "grad_norm": 0.41061449931460264, "learning_rate": 2.0726037736814963e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.2618325352668762, "step": 1195, "valid_targets_mean": 6287.6, "valid_targets_min": 4065 }, { "epoch": 3.7974683544303796, "grad_norm": 0.4605604729306755, "learning_rate": 2.0568251835502647e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.26115620136260986, "step": 1200, "valid_targets_mean": 5568.8, "valid_targets_min": 2346 }, { "epoch": 3.8132911392405062, "grad_norm": 0.45057688611815, "learning_rate": 2.0410430528571174e-05, "loss": 0.2714, "loss_nan_ranks": 0, "loss_rank_avg": 0.2877865433692932, "step": 1205, "valid_targets_mean": 6449.9, "valid_targets_min": 3503 }, { "epoch": 3.829113924050633, "grad_norm": 0.5086771269895078, "learning_rate": 2.02525836492683e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.3087032437324524, "step": 1210, "valid_targets_mean": 5531.9, "valid_targets_min": 3800 }, { "epoch": 3.8449367088607596, "grad_norm": 0.4452489781308896, "learning_rate": 2.009472103243511e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.3064022660255432, "step": 1215, "valid_targets_mean": 5917.0, "valid_targets_min": 4748 }, { "epoch": 3.8607594936708862, "grad_norm": 0.4863342707710525, "learning_rate": 1.993685251389322e-05, "loss": 0.2745, "loss_nan_ranks": 0, "loss_rank_avg": 0.2625889182090759, "step": 1220, "valid_targets_mean": 5559.6, "valid_targets_min": 2258 }, { "epoch": 3.8765822784810124, "grad_norm": 0.4290653882064235, "learning_rate": 1.9778987929831972e-05, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.29007023572921753, "step": 1225, "valid_targets_mean": 6616.1, "valid_targets_min": 5869 }, { "epoch": 3.892405063291139, "grad_norm": 0.4296040763825853, "learning_rate": 1.9621137116195548e-05, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.2632428705692291, "step": 1230, "valid_targets_mean": 5761.6, "valid_targets_min": 3731 }, { "epoch": 3.9082278481012658, "grad_norm": 0.623945942618191, "learning_rate": 1.9463309908070164e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.26622751355171204, "step": 1235, "valid_targets_mean": 6114.1, "valid_targets_min": 4962 }, { "epoch": 3.9240506329113924, "grad_norm": 0.4793044781966833, "learning_rate": 1.9305516139071264e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.2645919919013977, "step": 1240, "valid_targets_mean": 5016.1, "valid_targets_min": 740 }, { "epoch": 3.939873417721519, "grad_norm": 0.45305985353592, "learning_rate": 1.9147765640730803e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.2768091559410095, "step": 1245, "valid_targets_mean": 5664.0, "valid_targets_min": 3534 }, { "epoch": 3.9556962025316453, "grad_norm": 0.4605421239088336, "learning_rate": 1.8990068241884748e-05, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.2963486313819885, "step": 1250, "valid_targets_mean": 5677.1, "valid_targets_min": 570 }, { "epoch": 3.971518987341772, "grad_norm": 0.4597763295363824, "learning_rate": 1.88324337680606e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.2958153486251831, "step": 1255, "valid_targets_mean": 5865.9, "valid_targets_min": 2303 }, { "epoch": 3.9873417721518987, "grad_norm": 0.47799649075734507, "learning_rate": 1.8674872040865264e-05, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.3197573125362396, "step": 1260, "valid_targets_mean": 5307.5, "valid_targets_min": 599 }, { "epoch": 4.003164556962025, "grad_norm": 0.43937378661184534, "learning_rate": 1.8517392877373062e-05, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.25840771198272705, "step": 1265, "valid_targets_mean": 5393.1, "valid_targets_min": 1782 }, { "epoch": 4.018987341772152, "grad_norm": 0.4766511193828852, "learning_rate": 1.8360006089514083e-05, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.2725266218185425, "step": 1270, "valid_targets_mean": 5521.6, "valid_targets_min": 3121 }, { "epoch": 4.034810126582278, "grad_norm": 0.4148691145081977, "learning_rate": 1.8202721483462864e-05, "loss": 0.2706, "loss_nan_ranks": 0, "loss_rank_avg": 0.29157158732414246, "step": 1275, "valid_targets_mean": 6168.4, "valid_targets_min": 2189 }, { "epoch": 4.050632911392405, "grad_norm": 0.4270401645062619, "learning_rate": 1.8045548859027354e-05, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.2323746681213379, "step": 1280, "valid_targets_mean": 5276.9, "valid_targets_min": 599 }, { "epoch": 4.0664556962025316, "grad_norm": 0.4282844537809516, "learning_rate": 1.7888498009038368e-05, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.2751336097717285, "step": 1285, "valid_targets_mean": 5892.6, "valid_targets_min": 2244 }, { "epoch": 4.082278481012658, "grad_norm": 0.47316582639020416, "learning_rate": 1.7731578718739414e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.30304911732673645, "step": 1290, "valid_targets_mean": 6108.2, "valid_targets_min": 2388 }, { "epoch": 4.098101265822785, "grad_norm": 0.4803746298155582, "learning_rate": 1.7574800765176994e-05, "loss": 0.2809, "loss_nan_ranks": 0, "loss_rank_avg": 0.2848498225212097, "step": 1295, "valid_targets_mean": 4842.9, "valid_targets_min": 465 }, { "epoch": 4.113924050632911, "grad_norm": 0.4312417867244571, "learning_rate": 1.741817391659149e-05, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.26076751947402954, "step": 1300, "valid_targets_mean": 5613.5, "valid_targets_min": 2346 }, { "epoch": 4.129746835443038, "grad_norm": 0.4307261808714215, "learning_rate": 1.726170793180848e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.28067219257354736, "step": 1305, "valid_targets_mean": 6023.4, "valid_targets_min": 1905 }, { "epoch": 4.1455696202531644, "grad_norm": 0.4568416978649484, "learning_rate": 1.7105412559630735e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.27373552322387695, "step": 1310, "valid_targets_mean": 6107.5, "valid_targets_min": 2019 }, { "epoch": 4.1613924050632916, "grad_norm": 0.4500355857613447, "learning_rate": 1.6949297538230792e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.27843713760375977, "step": 1315, "valid_targets_mean": 5768.1, "valid_targets_min": 2215 }, { "epoch": 4.177215189873418, "grad_norm": 0.4388953953436056, "learning_rate": 1.6793372594544224e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.27434033155441284, "step": 1320, "valid_targets_mean": 5503.1, "valid_targets_min": 900 }, { "epoch": 4.193037974683544, "grad_norm": 0.4576763460557553, "learning_rate": 1.6637647443663593e-05, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.2750262916088104, "step": 1325, "valid_targets_mean": 6009.2, "valid_targets_min": 4215 }, { "epoch": 4.208860759493671, "grad_norm": 0.46329839465044464, "learning_rate": 1.6482131788233097e-05, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.28142502903938293, "step": 1330, "valid_targets_mean": 5375.4, "valid_targets_min": 767 }, { "epoch": 4.224683544303797, "grad_norm": 0.4434699499274513, "learning_rate": 1.6326835317844096e-05, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.2833135724067688, "step": 1335, "valid_targets_mean": 5825.7, "valid_targets_min": 3592 }, { "epoch": 4.2405063291139244, "grad_norm": 0.44275524559779117, "learning_rate": 1.6171767708431343e-05, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.24540019035339355, "step": 1340, "valid_targets_mean": 5436.6, "valid_targets_min": 973 }, { "epoch": 4.256329113924051, "grad_norm": 0.4253187110223974, "learning_rate": 1.601693862167013e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.27130672335624695, "step": 1345, "valid_targets_mean": 6132.4, "valid_targets_min": 3411 }, { "epoch": 4.272151898734177, "grad_norm": 0.44888455434609287, "learning_rate": 1.5862357704374328e-05, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.29880720376968384, "step": 1350, "valid_targets_mean": 5640.2, "valid_targets_min": 577 }, { "epoch": 4.287974683544304, "grad_norm": 0.4447433594075796, "learning_rate": 1.5708034587895278e-05, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.2827964425086975, "step": 1355, "valid_targets_mean": 5510.6, "valid_targets_min": 1400 }, { "epoch": 4.30379746835443, "grad_norm": 0.5005058691286197, "learning_rate": 1.5553978887521756e-05, "loss": 0.2661, "loss_nan_ranks": 0, "loss_rank_avg": 0.24379396438598633, "step": 1360, "valid_targets_mean": 5517.3, "valid_targets_min": 1860 }, { "epoch": 4.319620253164557, "grad_norm": 0.4277824202684447, "learning_rate": 1.5400200201880832e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.2706229090690613, "step": 1365, "valid_targets_mean": 6064.0, "valid_targets_min": 3083 }, { "epoch": 4.3354430379746836, "grad_norm": 0.42891831640248634, "learning_rate": 1.5246708112339841e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.2757185697555542, "step": 1370, "valid_targets_mean": 6370.2, "valid_targets_min": 3108 }, { "epoch": 4.35126582278481, "grad_norm": 0.5680716223524007, "learning_rate": 1.5093512182409426e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.27294766902923584, "step": 1375, "valid_targets_mean": 5403.8, "valid_targets_min": 2218 }, { "epoch": 4.367088607594937, "grad_norm": 0.43343129168281397, "learning_rate": 1.4940621957147604e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.2662773132324219, "step": 1380, "valid_targets_mean": 5882.5, "valid_targets_min": 4166 }, { "epoch": 4.382911392405063, "grad_norm": 0.41494002682269865, "learning_rate": 1.4788046962565137e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.2607043981552124, "step": 1385, "valid_targets_mean": 6177.9, "valid_targets_min": 2455 }, { "epoch": 4.39873417721519, "grad_norm": 0.43843034588316787, "learning_rate": 1.4635796705031921e-05, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.27472174167633057, "step": 1390, "valid_targets_mean": 6159.9, "valid_targets_min": 3177 }, { "epoch": 4.4145569620253164, "grad_norm": 0.44829735270254406, "learning_rate": 1.4483880670684734e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.2803511619567871, "step": 1395, "valid_targets_mean": 6351.8, "valid_targets_min": 3409 }, { "epoch": 4.430379746835443, "grad_norm": 0.43784463660660367, "learning_rate": 1.4332308324836175e-05, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.2583090662956238, "step": 1400, "valid_targets_mean": 5574.8, "valid_targets_min": 851 }, { "epoch": 4.44620253164557, "grad_norm": 0.41049241534830344, "learning_rate": 1.4181089111384897e-05, "loss": 0.2687, "loss_nan_ranks": 0, "loss_rank_avg": 0.2622532248497009, "step": 1405, "valid_targets_mean": 6493.8, "valid_targets_min": 5483 }, { "epoch": 4.462025316455696, "grad_norm": 0.4438465909763393, "learning_rate": 1.4030232452227247e-05, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.2785758376121521, "step": 1410, "valid_targets_mean": 5877.3, "valid_targets_min": 3379 }, { "epoch": 4.477848101265823, "grad_norm": 0.45409808589805667, "learning_rate": 1.3879747746670153e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.28627505898475647, "step": 1415, "valid_targets_mean": 5778.6, "valid_targets_min": 1930 }, { "epoch": 4.493670886075949, "grad_norm": 0.44565153269075114, "learning_rate": 1.3729644370845527e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.2990872263908386, "step": 1420, "valid_targets_mean": 6347.4, "valid_targets_min": 886 }, { "epoch": 4.509493670886076, "grad_norm": 0.4867505301206323, "learning_rate": 1.3579931677126095e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.2777697443962097, "step": 1425, "valid_targets_mean": 5492.8, "valid_targets_min": 963 }, { "epoch": 4.525316455696203, "grad_norm": 0.46892411857600824, "learning_rate": 1.3430618993542624e-05, "loss": 0.2706, "loss_nan_ranks": 0, "loss_rank_avg": 0.27069422602653503, "step": 1430, "valid_targets_mean": 4925.8, "valid_targets_min": 514 }, { "epoch": 4.541139240506329, "grad_norm": 0.4258887412808488, "learning_rate": 1.3281715623202805e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.25205692648887634, "step": 1435, "valid_targets_mean": 6138.2, "valid_targets_min": 1828 }, { "epoch": 4.556962025316456, "grad_norm": 0.43025376755770534, "learning_rate": 1.3133230843711542e-05, "loss": 0.2753, "loss_nan_ranks": 0, "loss_rank_avg": 0.2578020989894867, "step": 1440, "valid_targets_mean": 5396.9, "valid_targets_min": 648 }, { "epoch": 4.572784810126582, "grad_norm": 0.4121061717464447, "learning_rate": 1.2985173906592938e-05, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.2575612962245941, "step": 1445, "valid_targets_mean": 6095.8, "valid_targets_min": 3363 }, { "epoch": 4.588607594936709, "grad_norm": 0.4455401669257146, "learning_rate": 1.283755403671386e-05, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.2595190107822418, "step": 1450, "valid_targets_mean": 5895.9, "valid_targets_min": 765 }, { "epoch": 4.6044303797468356, "grad_norm": 0.47995584984074363, "learning_rate": 1.2690380431709164e-05, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.25681594014167786, "step": 1455, "valid_targets_mean": 5262.5, "valid_targets_min": 896 }, { "epoch": 4.620253164556962, "grad_norm": 0.44625916208811905, "learning_rate": 1.2543662261408651e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.26975834369659424, "step": 1460, "valid_targets_mean": 5787.6, "valid_targets_min": 3012 }, { "epoch": 4.636075949367089, "grad_norm": 0.45780589523131776, "learning_rate": 1.239740866726569e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.2560340166091919, "step": 1465, "valid_targets_mean": 5298.8, "valid_targets_min": 2302 }, { "epoch": 4.651898734177215, "grad_norm": 0.4374203751318027, "learning_rate": 1.2251628761787676e-05, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.269504189491272, "step": 1470, "valid_targets_mean": 5891.4, "valid_targets_min": 976 }, { "epoch": 4.667721518987342, "grad_norm": 0.48912556917169475, "learning_rate": 1.2106331627968268e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.2673969268798828, "step": 1475, "valid_targets_mean": 5466.0, "valid_targets_min": 628 }, { "epoch": 4.6835443037974684, "grad_norm": 0.44150795560819456, "learning_rate": 1.1961526318721429e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.28151217103004456, "step": 1480, "valid_targets_mean": 5715.2, "valid_targets_min": 963 }, { "epoch": 4.699367088607595, "grad_norm": 0.42332732047910177, "learning_rate": 1.1817221856317426e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.2617891728878021, "step": 1485, "valid_targets_mean": 5987.8, "valid_targets_min": 3898 }, { "epoch": 4.715189873417722, "grad_norm": 0.4331817000713787, "learning_rate": 1.1673427231820637e-05, "loss": 0.2699, "loss_nan_ranks": 0, "loss_rank_avg": 0.26096978783607483, "step": 1490, "valid_targets_mean": 6009.0, "valid_targets_min": 753 }, { "epoch": 4.731012658227848, "grad_norm": 0.43190281742549974, "learning_rate": 1.1530151404529362e-05, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.3024364113807678, "step": 1495, "valid_targets_mean": 6329.8, "valid_targets_min": 4300 }, { "epoch": 4.746835443037975, "grad_norm": 0.4270377021411673, "learning_rate": 1.1387403301417645e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.2895660400390625, "step": 1500, "valid_targets_mean": 5815.9, "valid_targets_min": 2026 }, { "epoch": 2.5336700336700337, "grad_norm": 0.47175833690416435, "learning_rate": 3.222069246473091e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.2578871548175812, "step": 1505, "valid_targets_mean": 5995.9, "valid_targets_min": 514 }, { "epoch": 2.542087542087542, "grad_norm": 0.4988144120109162, "learning_rate": 3.2154125959136395e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.26715636253356934, "step": 1510, "valid_targets_mean": 5125.2, "valid_targets_min": 809 }, { "epoch": 2.5505050505050506, "grad_norm": 0.49561294420836705, "learning_rate": 3.208734528519581e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.27658218145370483, "step": 1515, "valid_targets_mean": 5416.2, "valid_targets_min": 524 }, { "epoch": 2.558922558922559, "grad_norm": 0.4909723100319413, "learning_rate": 3.20203516196541e-05, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.2683098316192627, "step": 1520, "valid_targets_mean": 5724.5, "valid_targets_min": 3716 }, { "epoch": 2.5673400673400675, "grad_norm": 0.46049058044117985, "learning_rate": 3.1953146143009367e-05, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.28621405363082886, "step": 1525, "valid_targets_mean": 6398.9, "valid_targets_min": 5081 }, { "epoch": 2.5757575757575757, "grad_norm": 0.5068485562732447, "learning_rate": 3.188573003949203e-05, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.2784101963043213, "step": 1530, "valid_targets_mean": 5874.6, "valid_targets_min": 1807 }, { "epoch": 2.584175084175084, "grad_norm": 0.49170049168708563, "learning_rate": 3.181810449704399e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.2548806071281433, "step": 1535, "valid_targets_mean": 5808.4, "valid_targets_min": 2488 }, { "epoch": 2.5925925925925926, "grad_norm": 0.46857660364859843, "learning_rate": 3.175027070729768e-05, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.27297866344451904, "step": 1540, "valid_targets_mean": 5892.1, "valid_targets_min": 1373 }, { "epoch": 2.601010101010101, "grad_norm": 0.4623443280958736, "learning_rate": 3.168222986555504e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.25697314739227295, "step": 1545, "valid_targets_mean": 5303.7, "valid_targets_min": 1735 }, { "epoch": 2.6094276094276094, "grad_norm": 0.4793035936728254, "learning_rate": 3.161398317076652e-05, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.2764521837234497, "step": 1550, "valid_targets_mean": 5819.5, "valid_targets_min": 765 }, { "epoch": 2.6178451178451176, "grad_norm": 0.4668860860510128, "learning_rate": 3.154553182550986e-05, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.26006996631622314, "step": 1555, "valid_targets_mean": 5489.5, "valid_targets_min": 3047 }, { "epoch": 2.6262626262626263, "grad_norm": 0.47796110140270853, "learning_rate": 3.1476877035969024e-05, "loss": 0.2765, "loss_nan_ranks": 0, "loss_rank_avg": 0.27874821424484253, "step": 1560, "valid_targets_mean": 5781.8, "valid_targets_min": 963 }, { "epoch": 2.634680134680135, "grad_norm": 0.4581773426950499, "learning_rate": 3.140802001191283e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.237541064620018, "step": 1565, "valid_targets_mean": 6255.6, "valid_targets_min": 3544 }, { "epoch": 2.643097643097643, "grad_norm": 0.48335835010448197, "learning_rate": 3.133896196667369e-05, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.29038745164871216, "step": 1570, "valid_targets_mean": 5953.4, "valid_targets_min": 3524 }, { "epoch": 2.6515151515151514, "grad_norm": 0.5426689425154643, "learning_rate": 3.1269704117126206e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.2984479069709778, "step": 1575, "valid_targets_mean": 5832.0, "valid_targets_min": 886 }, { "epoch": 2.65993265993266, "grad_norm": 0.45988998500840067, "learning_rate": 3.120024768366576e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.2751707434654236, "step": 1580, "valid_targets_mean": 5657.8, "valid_targets_min": 744 }, { "epoch": 2.6683501683501682, "grad_norm": 0.4792673772983562, "learning_rate": 3.113059389018699e-05, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.2405269742012024, "step": 1585, "valid_targets_mean": 5396.2, "valid_targets_min": 1555 }, { "epoch": 2.676767676767677, "grad_norm": 0.5103650573018135, "learning_rate": 3.1060743964062194e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.23580007255077362, "step": 1590, "valid_targets_mean": 6230.6, "valid_targets_min": 4426 }, { "epoch": 2.685185185185185, "grad_norm": 0.4756410298275338, "learning_rate": 3.099069913611977e-05, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.28566116094589233, "step": 1595, "valid_targets_mean": 5506.6, "valid_targets_min": 775 }, { "epoch": 2.6936026936026938, "grad_norm": 0.4745602293201921, "learning_rate": 3.0920460640622464e-05, "loss": 0.2891, "loss_nan_ranks": 0, "loss_rank_avg": 0.2973249554634094, "step": 1600, "valid_targets_mean": 6110.0, "valid_targets_min": 3333 }, { "epoch": 2.702020202020202, "grad_norm": 0.43970970369378504, "learning_rate": 3.085002971524564e-05, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.26657000184059143, "step": 1605, "valid_targets_mean": 6084.0, "valid_targets_min": 5257 }, { "epoch": 2.71043771043771, "grad_norm": 0.4464368757498652, "learning_rate": 3.077940760105551e-05, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.22137847542762756, "step": 1610, "valid_targets_mean": 6026.0, "valid_targets_min": 3654 }, { "epoch": 2.718855218855219, "grad_norm": 0.4996610996027433, "learning_rate": 3.070859554248719e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.26007986068725586, "step": 1615, "valid_targets_mean": 4993.4, "valid_targets_min": 1273 }, { "epoch": 2.7272727272727275, "grad_norm": 0.4658302368436588, "learning_rate": 3.063759478732284e-05, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.25886788964271545, "step": 1620, "valid_targets_mean": 5908.8, "valid_targets_min": 1880 }, { "epoch": 2.7356902356902357, "grad_norm": 0.4881933303892004, "learning_rate": 3.056640658666965e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.2800159454345703, "step": 1625, "valid_targets_mean": 5548.6, "valid_targets_min": 3026 }, { "epoch": 2.744107744107744, "grad_norm": 0.4622627848229377, "learning_rate": 3.0495032194937785e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.29500848054885864, "step": 1630, "valid_targets_mean": 6286.5, "valid_targets_min": 1868 }, { "epoch": 2.7525252525252526, "grad_norm": 0.5224900072775827, "learning_rate": 3.042347286981829e-05, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.26520195603370667, "step": 1635, "valid_targets_mean": 5687.2, "valid_targets_min": 767 }, { "epoch": 2.760942760942761, "grad_norm": 0.48341273547659325, "learning_rate": 3.0351729872260935e-05, "loss": 0.2699, "loss_nan_ranks": 0, "loss_rank_avg": 0.26769256591796875, "step": 1640, "valid_targets_mean": 5853.3, "valid_targets_min": 963 }, { "epoch": 2.7693602693602695, "grad_norm": 0.4759754441664444, "learning_rate": 3.0279804466451996e-05, "loss": 0.2709, "loss_nan_ranks": 0, "loss_rank_avg": 0.27780115604400635, "step": 1645, "valid_targets_mean": 5861.6, "valid_targets_min": 2244 }, { "epoch": 2.7777777777777777, "grad_norm": 0.4934818313537275, "learning_rate": 3.0207697919791953e-05, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.2537994384765625, "step": 1650, "valid_targets_mean": 5367.6, "valid_targets_min": 2169 }, { "epoch": 2.7861952861952863, "grad_norm": 0.4802875983555916, "learning_rate": 3.0135411502873188e-05, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.2672436535358429, "step": 1655, "valid_targets_mean": 5591.4, "valid_targets_min": 2148 }, { "epoch": 2.7946127946127945, "grad_norm": 0.4919537763945096, "learning_rate": 3.0062946489457588e-05, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.2736820578575134, "step": 1660, "valid_targets_mean": 5776.6, "valid_targets_min": 2095 }, { "epoch": 2.8030303030303028, "grad_norm": 0.4874244346144825, "learning_rate": 2.9990304156454088e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.24358776211738586, "step": 1665, "valid_targets_mean": 5696.8, "valid_targets_min": 2170 }, { "epoch": 2.8114478114478114, "grad_norm": 0.4736894046023768, "learning_rate": 2.9917485783896184e-05, "loss": 0.278, "loss_nan_ranks": 0, "loss_rank_avg": 0.28212714195251465, "step": 1670, "valid_targets_mean": 5973.2, "valid_targets_min": 804 }, { "epoch": 2.81986531986532, "grad_norm": 0.5180701591667134, "learning_rate": 2.984449265491937e-05, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.2965032160282135, "step": 1675, "valid_targets_mean": 5538.2, "valid_targets_min": 642 }, { "epoch": 2.8282828282828283, "grad_norm": 0.48472099517020967, "learning_rate": 2.9771326055738524e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.257454514503479, "step": 1680, "valid_targets_mean": 5996.2, "valid_targets_min": 4286 }, { "epoch": 2.8367003367003365, "grad_norm": 0.4708230007906033, "learning_rate": 2.969798727562526e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.27739977836608887, "step": 1685, "valid_targets_mean": 5786.6, "valid_targets_min": 2952 }, { "epoch": 2.845117845117845, "grad_norm": 0.49972614462585313, "learning_rate": 2.9624477606885196e-05, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.2510569989681244, "step": 1690, "valid_targets_mean": 5390.0, "valid_targets_min": 728 }, { "epoch": 2.8535353535353534, "grad_norm": 0.4488084533581549, "learning_rate": 2.9550798344835176e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.25537407398223877, "step": 1695, "valid_targets_mean": 6486.0, "valid_targets_min": 4394 }, { "epoch": 2.861952861952862, "grad_norm": 0.44624289950556423, "learning_rate": 2.947695078778047e-05, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.24400271475315094, "step": 1700, "valid_targets_mean": 5361.6, "valid_targets_min": 1273 }, { "epoch": 2.8703703703703702, "grad_norm": 0.49323369912437803, "learning_rate": 2.940293623699187e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.2662852108478546, "step": 1705, "valid_targets_mean": 5423.9, "valid_targets_min": 1761 }, { "epoch": 2.878787878787879, "grad_norm": 0.461964707436428, "learning_rate": 2.9328755996682784e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.2640298008918762, "step": 1710, "valid_targets_mean": 5557.8, "valid_targets_min": 1847 }, { "epoch": 2.887205387205387, "grad_norm": 0.4842785667166425, "learning_rate": 2.9254411373986218e-05, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.2701316475868225, "step": 1715, "valid_targets_mean": 5645.8, "valid_targets_min": 2087 }, { "epoch": 2.8956228956228958, "grad_norm": 0.4400726168230355, "learning_rate": 2.9179903678931798e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.2720245122909546, "step": 1720, "valid_targets_mean": 6178.3, "valid_targets_min": 2283 }, { "epoch": 2.904040404040404, "grad_norm": 0.5039310956644923, "learning_rate": 2.910523422442262e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.2551863193511963, "step": 1725, "valid_targets_mean": 5084.2, "valid_targets_min": 572 }, { "epoch": 2.9124579124579126, "grad_norm": 0.48130526767640697, "learning_rate": 2.903040432621218e-05, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.2813180088996887, "step": 1730, "valid_targets_mean": 5492.9, "valid_targets_min": 642 }, { "epoch": 2.920875420875421, "grad_norm": 0.4450566158621727, "learning_rate": 2.895541530288115e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.24626556038856506, "step": 1735, "valid_targets_mean": 5779.6, "valid_targets_min": 833 }, { "epoch": 2.929292929292929, "grad_norm": 0.4628884880600571, "learning_rate": 2.8880268475814132e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.2738983929157257, "step": 1740, "valid_targets_mean": 5713.9, "valid_targets_min": 2152 }, { "epoch": 2.9377104377104377, "grad_norm": 0.47146875329522886, "learning_rate": 2.880496516917642e-05, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.25897499918937683, "step": 1745, "valid_targets_mean": 5837.1, "valid_targets_min": 1954 }, { "epoch": 2.9461279461279464, "grad_norm": 0.44589205425484196, "learning_rate": 2.8729506709890645e-05, "loss": 0.2714, "loss_nan_ranks": 0, "loss_rank_avg": 0.26478633284568787, "step": 1750, "valid_targets_mean": 6132.0, "valid_targets_min": 3592 }, { "epoch": 2.9545454545454546, "grad_norm": 0.45812178416316796, "learning_rate": 2.865389442761336e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.26409947872161865, "step": 1755, "valid_targets_mean": 5849.6, "valid_targets_min": 3131 }, { "epoch": 2.962962962962963, "grad_norm": 0.4801446094642877, "learning_rate": 2.857812965471166e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.2876226603984833, "step": 1760, "valid_targets_mean": 5856.8, "valid_targets_min": 804 }, { "epoch": 2.9713804713804715, "grad_norm": 0.48367462710997594, "learning_rate": 2.8502213726239678e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.26591169834136963, "step": 1765, "valid_targets_mean": 5456.8, "valid_targets_min": 2276 }, { "epoch": 2.9797979797979797, "grad_norm": 0.4506297725367813, "learning_rate": 2.8426147979915067e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.24496473371982574, "step": 1770, "valid_targets_mean": 5691.6, "valid_targets_min": 3015 }, { "epoch": 2.9882154882154883, "grad_norm": 0.46527654760090237, "learning_rate": 2.8349933756095427e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.26362547278404236, "step": 1775, "valid_targets_mean": 6209.3, "valid_targets_min": 4577 }, { "epoch": 2.9966329966329965, "grad_norm": 0.44774308378539096, "learning_rate": 2.827357239775468e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.265911340713501, "step": 1780, "valid_targets_mean": 5725.1, "valid_targets_min": 2060 }, { "epoch": 3.005050505050505, "grad_norm": 0.4228834306946797, "learning_rate": 2.8197065250459422e-05, "loss": 0.2486, "loss_nan_ranks": 0, "loss_rank_avg": 0.24547988176345825, "step": 1785, "valid_targets_mean": 5958.1, "valid_targets_min": 2375 }, { "epoch": 3.0134680134680134, "grad_norm": 0.5040780268885077, "learning_rate": 2.81204136623452e-05, "loss": 0.2534, "loss_nan_ranks": 0, "loss_rank_avg": 0.26460325717926025, "step": 1790, "valid_targets_mean": 5342.4, "valid_targets_min": 2552 }, { "epoch": 3.021885521885522, "grad_norm": 0.44455255554024603, "learning_rate": 2.804361898409274e-05, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.250008225440979, "step": 1795, "valid_targets_mean": 6092.6, "valid_targets_min": 3132 }, { "epoch": 3.0303030303030303, "grad_norm": 0.4888540010472703, "learning_rate": 2.796668256890419e-05, "loss": 0.2601, "loss_nan_ranks": 0, "loss_rank_avg": 0.255595326423645, "step": 1800, "valid_targets_mean": 5412.1, "valid_targets_min": 599 }, { "epoch": 3.038720538720539, "grad_norm": 0.456272332197701, "learning_rate": 2.7889605772479233e-05, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.26009058952331543, "step": 1805, "valid_targets_mean": 5873.6, "valid_targets_min": 3667 }, { "epoch": 3.047138047138047, "grad_norm": 0.47526162068172445, "learning_rate": 2.7812389952991234e-05, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.2717510163784027, "step": 1810, "valid_targets_mean": 5074.5, "valid_targets_min": 465 }, { "epoch": 3.0555555555555554, "grad_norm": 0.46603159599538324, "learning_rate": 2.7735036471063265e-05, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.24621015787124634, "step": 1815, "valid_targets_mean": 5842.6, "valid_targets_min": 4595 }, { "epoch": 3.063973063973064, "grad_norm": 0.4562445024563088, "learning_rate": 2.7657546689744167e-05, "loss": 0.2554, "loss_nan_ranks": 0, "loss_rank_avg": 0.23575446009635925, "step": 1820, "valid_targets_mean": 5539.0, "valid_targets_min": 877 }, { "epoch": 3.0723905723905722, "grad_norm": 0.43940550371469234, "learning_rate": 2.7579921974484532e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.2583876848220825, "step": 1825, "valid_targets_mean": 6058.7, "valid_targets_min": 3841 }, { "epoch": 3.080808080808081, "grad_norm": 0.4757427901719824, "learning_rate": 2.7502163693112595e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.287031352519989, "step": 1830, "valid_targets_mean": 5939.2, "valid_targets_min": 1761 }, { "epoch": 3.089225589225589, "grad_norm": 0.47089901333182543, "learning_rate": 2.7424273215810192e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.25683337450027466, "step": 1835, "valid_targets_mean": 6200.4, "valid_targets_min": 4841 }, { "epoch": 3.0976430976430978, "grad_norm": 0.47079150260275704, "learning_rate": 2.7346251915088574e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.2823716402053833, "step": 1840, "valid_targets_mean": 5534.8, "valid_targets_min": 3315 }, { "epoch": 3.106060606060606, "grad_norm": 0.41384136717630904, "learning_rate": 2.7268101165764256e-05, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.24914711713790894, "step": 1845, "valid_targets_mean": 5942.4, "valid_targets_min": 495 }, { "epoch": 3.1144781144781146, "grad_norm": 0.47799928718479734, "learning_rate": 2.7189822344934746e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.2740170359611511, "step": 1850, "valid_targets_mean": 5577.8, "valid_targets_min": 754 }, { "epoch": 3.122895622895623, "grad_norm": 0.4393256529310863, "learning_rate": 2.7111416831954324e-05, "loss": 0.2745, "loss_nan_ranks": 0, "loss_rank_avg": 0.2606737017631531, "step": 1855, "valid_targets_mean": 6356.8, "valid_targets_min": 4689 }, { "epoch": 3.1313131313131315, "grad_norm": 0.49227894096611585, "learning_rate": 2.7032886008409707e-05, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.2675955891609192, "step": 1860, "valid_targets_mean": 5334.9, "valid_targets_min": 3591 }, { "epoch": 3.1397306397306397, "grad_norm": 0.44300019232744026, "learning_rate": 2.6954231258095728e-05, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.24864640831947327, "step": 1865, "valid_targets_mean": 6035.8, "valid_targets_min": 5344 }, { "epoch": 3.148148148148148, "grad_norm": 0.48096371062581594, "learning_rate": 2.6875453966990924e-05, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.24091598391532898, "step": 1870, "valid_targets_mean": 5171.2, "valid_targets_min": 896 }, { "epoch": 3.1565656565656566, "grad_norm": 0.4485606822042903, "learning_rate": 2.679655552323313e-05, "loss": 0.2631, "loss_nan_ranks": 0, "loss_rank_avg": 0.2668924927711487, "step": 1875, "valid_targets_mean": 6351.5, "valid_targets_min": 3570 }, { "epoch": 3.164983164983165, "grad_norm": 0.47490151861785507, "learning_rate": 2.671753731709503e-05, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.2609248161315918, "step": 1880, "valid_targets_mean": 6502.5, "valid_targets_min": 4606 }, { "epoch": 3.1734006734006734, "grad_norm": 0.48491249046654883, "learning_rate": 2.663840074095963e-05, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.2430686056613922, "step": 1885, "valid_targets_mean": 5501.4, "valid_targets_min": 834 }, { "epoch": 3.1818181818181817, "grad_norm": 0.48579484347272883, "learning_rate": 2.655914718929575e-05, "loss": 0.2585, "loss_nan_ranks": 0, "loss_rank_avg": 0.24881702661514282, "step": 1890, "valid_targets_mean": 5342.8, "valid_targets_min": 3266 }, { "epoch": 3.1902356902356903, "grad_norm": 0.46339440739579857, "learning_rate": 2.6479778058633426e-05, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.2772354185581207, "step": 1895, "valid_targets_mean": 6097.9, "valid_targets_min": 4994 }, { "epoch": 3.1986531986531985, "grad_norm": 0.47252401948247413, "learning_rate": 2.6400294747539338e-05, "loss": 0.2666, "loss_nan_ranks": 0, "loss_rank_avg": 0.2552820146083832, "step": 1900, "valid_targets_mean": 6086.3, "valid_targets_min": 3383 }, { "epoch": 3.207070707070707, "grad_norm": 0.4733757827268643, "learning_rate": 2.6320698656592126e-05, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.2829735279083252, "step": 1905, "valid_targets_mean": 6193.1, "valid_targets_min": 4736 }, { "epoch": 3.2154882154882154, "grad_norm": 0.4545516302082259, "learning_rate": 2.6240991188357736e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.2541789412498474, "step": 1910, "valid_targets_mean": 5517.2, "valid_targets_min": 765 }, { "epoch": 3.223905723905724, "grad_norm": 0.477035335388407, "learning_rate": 2.6161173747364694e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.29022878408432007, "step": 1915, "valid_targets_mean": 6209.6, "valid_targets_min": 1807 }, { "epoch": 3.2323232323232323, "grad_norm": 0.4721123241784799, "learning_rate": 2.6081247740079363e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.27373164892196655, "step": 1920, "valid_targets_mean": 5637.5, "valid_targets_min": 720 }, { "epoch": 3.240740740740741, "grad_norm": 0.49909640283340984, "learning_rate": 2.600121457488116e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.26537537574768066, "step": 1925, "valid_targets_mean": 4531.2, "valid_targets_min": 753 }, { "epoch": 3.249158249158249, "grad_norm": 0.4508067303088388, "learning_rate": 2.5921075662037726e-05, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.2458057701587677, "step": 1930, "valid_targets_mean": 5773.4, "valid_targets_min": 2719 }, { "epoch": 3.257575757575758, "grad_norm": 0.4986299908186157, "learning_rate": 2.5840832413680096e-05, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.255989670753479, "step": 1935, "valid_targets_mean": 5769.0, "valid_targets_min": 973 }, { "epoch": 3.265993265993266, "grad_norm": 0.4517947133476855, "learning_rate": 2.5760486243777797e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.27278995513916016, "step": 1940, "valid_targets_mean": 6153.6, "valid_targets_min": 954 }, { "epoch": 3.274410774410774, "grad_norm": 0.45871371182609605, "learning_rate": 2.5680038568113944e-05, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.2577679753303528, "step": 1945, "valid_targets_mean": 5734.0, "valid_targets_min": 3637 }, { "epoch": 3.282828282828283, "grad_norm": 0.4618326850988252, "learning_rate": 2.5599490804260305e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.27027878165245056, "step": 1950, "valid_targets_mean": 6097.2, "valid_targets_min": 2811 }, { "epoch": 3.291245791245791, "grad_norm": 0.49755407687551717, "learning_rate": 2.551884437155228e-05, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.2811235785484314, "step": 1955, "valid_targets_mean": 5254.4, "valid_targets_min": 789 }, { "epoch": 3.2996632996632997, "grad_norm": 0.457846159639027, "learning_rate": 2.5438100691063922e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.24545416235923767, "step": 1960, "valid_targets_mean": 6070.6, "valid_targets_min": 1828 }, { "epoch": 3.308080808080808, "grad_norm": 0.4758750298348739, "learning_rate": 2.5357261185582905e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.27742427587509155, "step": 1965, "valid_targets_mean": 5808.8, "valid_targets_min": 1796 }, { "epoch": 3.3164983164983166, "grad_norm": 0.46197179559249013, "learning_rate": 2.527632727958543e-05, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.2675663232803345, "step": 1970, "valid_targets_mean": 6366.4, "valid_targets_min": 5123 }, { "epoch": 3.324915824915825, "grad_norm": 0.4867263212000984, "learning_rate": 2.5195300399211137e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.2639455199241638, "step": 1975, "valid_targets_mean": 4910.4, "valid_targets_min": 634 }, { "epoch": 3.3333333333333335, "grad_norm": 0.4284195435461982, "learning_rate": 2.511418197223796e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.24187898635864258, "step": 1980, "valid_targets_mean": 5845.8, "valid_targets_min": 923 }, { "epoch": 3.3417508417508417, "grad_norm": 0.4135358228574883, "learning_rate": 2.5032973428057e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.2515963912010193, "step": 1985, "valid_targets_mean": 6830.1, "valid_targets_min": 5004 }, { "epoch": 3.3501683501683504, "grad_norm": 0.4377565753960238, "learning_rate": 2.49516761976473e-05, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.23978541791439056, "step": 1990, "valid_targets_mean": 6151.1, "valid_targets_min": 5254 }, { "epoch": 3.3585858585858586, "grad_norm": 0.4993668860572999, "learning_rate": 2.4870291713550648e-05, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.27316054701805115, "step": 1995, "valid_targets_mean": 5725.8, "valid_targets_min": 2261 }, { "epoch": 3.3670033670033668, "grad_norm": 0.46810011894975945, "learning_rate": 2.4788821409846334e-05, "loss": 0.2529, "loss_nan_ranks": 0, "loss_rank_avg": 0.24408294260501862, "step": 2000, "valid_targets_mean": 5991.2, "valid_targets_min": 3469 }, { "epoch": 3.3754208754208754, "grad_norm": 0.44354178389049237, "learning_rate": 2.4707266722125888e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.24701344966888428, "step": 2005, "valid_targets_mean": 5817.7, "valid_targets_min": 3108 }, { "epoch": 3.3838383838383836, "grad_norm": 0.4616401687442844, "learning_rate": 2.4625629087467776e-05, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.26236820220947266, "step": 2010, "valid_targets_mean": 5806.8, "valid_targets_min": 2318 }, { "epoch": 3.3922558922558923, "grad_norm": 0.46918202560215155, "learning_rate": 2.4543909944412048e-05, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.2738293409347534, "step": 2015, "valid_targets_mean": 6169.3, "valid_targets_min": 3881 }, { "epoch": 3.4006734006734005, "grad_norm": 0.45482866759373874, "learning_rate": 2.4462110732935043e-05, "loss": 0.2547, "loss_nan_ranks": 0, "loss_rank_avg": 0.25623035430908203, "step": 2020, "valid_targets_mean": 5538.8, "valid_targets_min": 710 }, { "epoch": 3.409090909090909, "grad_norm": 0.4410889962382104, "learning_rate": 2.438023289442399e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.26775211095809937, "step": 2025, "valid_targets_mean": 6071.1, "valid_targets_min": 2483 }, { "epoch": 3.4175084175084174, "grad_norm": 0.45428199396855873, "learning_rate": 2.4298277871651585e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.25729498267173767, "step": 2030, "valid_targets_mean": 6182.1, "valid_targets_min": 688 }, { "epoch": 3.425925925925926, "grad_norm": 0.4801004820149534, "learning_rate": 2.4216247108750613e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.24965059757232666, "step": 2035, "valid_targets_mean": 5397.3, "valid_targets_min": 775 }, { "epoch": 3.4343434343434343, "grad_norm": 0.4373441581395516, "learning_rate": 2.413414205118847e-05, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.2545247972011566, "step": 2040, "valid_targets_mean": 6557.8, "valid_targets_min": 4539 }, { "epoch": 3.442760942760943, "grad_norm": 0.47614455354626983, "learning_rate": 2.405196414574171e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.2595536708831787, "step": 2045, "valid_targets_mean": 6224.1, "valid_targets_min": 4957 }, { "epoch": 3.451178451178451, "grad_norm": 0.4427047407389265, "learning_rate": 2.3969714840470526e-05, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.25375697016716003, "step": 2050, "valid_targets_mean": 6163.6, "valid_targets_min": 4911 }, { "epoch": 3.45959595959596, "grad_norm": 0.4350812895960367, "learning_rate": 2.3887395584693258e-05, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.22944723069667816, "step": 2055, "valid_targets_mean": 5471.1, "valid_targets_min": 1468 }, { "epoch": 3.468013468013468, "grad_norm": 0.44240321353041623, "learning_rate": 2.3805007828960855e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.2613484263420105, "step": 2060, "valid_targets_mean": 6239.8, "valid_targets_min": 5408 }, { "epoch": 3.4764309764309766, "grad_norm": 0.44476788322817057, "learning_rate": 2.3722553025031304e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.2447347342967987, "step": 2065, "valid_targets_mean": 5525.6, "valid_targets_min": 650 }, { "epoch": 3.484848484848485, "grad_norm": 0.47337002524786304, "learning_rate": 2.364003262584403e-05, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.26840806007385254, "step": 2070, "valid_targets_mean": 6076.1, "valid_targets_min": 3742 }, { "epoch": 3.493265993265993, "grad_norm": 0.46884526171525137, "learning_rate": 2.3557448085494343e-05, "loss": 0.2585, "loss_nan_ranks": 0, "loss_rank_avg": 0.2716432511806488, "step": 2075, "valid_targets_mean": 5966.1, "valid_targets_min": 4596 }, { "epoch": 3.5016835016835017, "grad_norm": 0.4782651673999994, "learning_rate": 2.347480085920778e-05, "loss": 0.2537, "loss_nan_ranks": 0, "loss_rank_avg": 0.24839454889297485, "step": 2080, "valid_targets_mean": 5711.4, "valid_targets_min": 2042 }, { "epoch": 3.51010101010101, "grad_norm": 0.47733783992450113, "learning_rate": 2.3392092403314447e-05, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.2837388515472412, "step": 2085, "valid_targets_mean": 6067.6, "valid_targets_min": 2048 }, { "epoch": 3.5185185185185186, "grad_norm": 0.4782687051339394, "learning_rate": 2.3309324175223415e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.2605840563774109, "step": 2090, "valid_targets_mean": 5370.0, "valid_targets_min": 799 }, { "epoch": 3.526936026936027, "grad_norm": 0.4872076274161844, "learning_rate": 2.3226497633396978e-05, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.26101091504096985, "step": 2095, "valid_targets_mean": 5702.2, "valid_targets_min": 2030 }, { "epoch": 3.5353535353535355, "grad_norm": 0.47862375556228315, "learning_rate": 2.3143614237324986e-05, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.24673721194267273, "step": 2100, "valid_targets_mean": 5217.2, "valid_targets_min": 882 }, { "epoch": 3.5437710437710437, "grad_norm": 0.46837329902348335, "learning_rate": 2.3060675447499116e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.2669448256492615, "step": 2105, "valid_targets_mean": 5955.2, "valid_targets_min": 3111 }, { "epoch": 3.5521885521885523, "grad_norm": 0.5013173665418452, "learning_rate": 2.2977682725387154e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.26355600357055664, "step": 2110, "valid_targets_mean": 5380.4, "valid_targets_min": 634 }, { "epoch": 3.5606060606060606, "grad_norm": 0.4850228761732901, "learning_rate": 2.2894637533407212e-05, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.2803172469139099, "step": 2115, "valid_targets_mean": 5126.5, "valid_targets_min": 828 }, { "epoch": 3.569023569023569, "grad_norm": 0.523494145167435, "learning_rate": 2.2811541334901993e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.2550443410873413, "step": 2120, "valid_targets_mean": 5063.9, "valid_targets_min": 1239 }, { "epoch": 3.5774410774410774, "grad_norm": 0.4942692493742798, "learning_rate": 2.2728395594112965e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.2536007761955261, "step": 2125, "valid_targets_mean": 5600.1, "valid_targets_min": 1971 }, { "epoch": 3.5858585858585856, "grad_norm": 0.4616263962222559, "learning_rate": 2.264520177615461e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.2446945160627365, "step": 2130, "valid_targets_mean": 5717.0, "valid_targets_min": 710 }, { "epoch": 3.5942760942760943, "grad_norm": 0.47379121647220346, "learning_rate": 2.2561961346988553e-05, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.2528979778289795, "step": 2135, "valid_targets_mean": 5486.9, "valid_targets_min": 1782 }, { "epoch": 3.602693602693603, "grad_norm": 0.4624142451949401, "learning_rate": 2.2478675773397775e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.255023330450058, "step": 2140, "valid_targets_mean": 6134.9, "valid_targets_min": 2221 }, { "epoch": 3.611111111111111, "grad_norm": 0.4935821545925253, "learning_rate": 2.2395346522960742e-05, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.2875485420227051, "step": 2145, "valid_targets_mean": 5438.0, "valid_targets_min": 1249 }, { "epoch": 3.6195286195286194, "grad_norm": 0.4709964419857675, "learning_rate": 2.231197506402556e-05, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.2643469572067261, "step": 2150, "valid_targets_mean": 5791.2, "valid_targets_min": 916 }, { "epoch": 3.627946127946128, "grad_norm": 0.44196735316646596, "learning_rate": 2.222856286568408e-05, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.262684166431427, "step": 2155, "valid_targets_mean": 6122.8, "valid_targets_min": 4714 }, { "epoch": 3.6363636363636362, "grad_norm": 0.43497103101851703, "learning_rate": 2.2145111397746027e-05, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.26448798179626465, "step": 2160, "valid_targets_mean": 6194.3, "valid_targets_min": 2164 }, { "epoch": 3.644781144781145, "grad_norm": 0.4655861221362141, "learning_rate": 2.2061622130713097e-05, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.26554441452026367, "step": 2165, "valid_targets_mean": 5773.9, "valid_targets_min": 702 }, { "epoch": 3.653198653198653, "grad_norm": 0.44414860807418716, "learning_rate": 2.197809653575306e-05, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.247327983379364, "step": 2170, "valid_targets_mean": 5814.2, "valid_targets_min": 2019 }, { "epoch": 3.6616161616161618, "grad_norm": 0.4752089032694026, "learning_rate": 2.18945360846738e-05, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.26908397674560547, "step": 2175, "valid_targets_mean": 6000.1, "valid_targets_min": 1468 }, { "epoch": 3.67003367003367, "grad_norm": 0.4721150110395281, "learning_rate": 2.1810942249897416e-05, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.2538966238498688, "step": 2180, "valid_targets_mean": 5865.1, "valid_targets_min": 3149 }, { "epoch": 3.678451178451178, "grad_norm": 0.4513682828405357, "learning_rate": 2.172731650443425e-05, "loss": 0.2483, "loss_nan_ranks": 0, "loss_rank_avg": 0.2598488926887512, "step": 2185, "valid_targets_mean": 5767.9, "valid_targets_min": 2936 }, { "epoch": 3.686868686868687, "grad_norm": 0.4840032550986964, "learning_rate": 2.1643660321856973e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.2745859622955322, "step": 2190, "valid_targets_mean": 5705.9, "valid_targets_min": 728 }, { "epoch": 3.6952861952861955, "grad_norm": 0.4658741775575672, "learning_rate": 2.1559975176274545e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.24418890476226807, "step": 2195, "valid_targets_mean": 5492.0, "valid_targets_min": 677 }, { "epoch": 3.7037037037037037, "grad_norm": 0.4825279150558414, "learning_rate": 2.147626254230631e-05, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.28623268008232117, "step": 2200, "valid_targets_mean": 5611.0, "valid_targets_min": 627 }, { "epoch": 3.712121212121212, "grad_norm": 0.47492010284265773, "learning_rate": 2.1392523895056e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.2459857016801834, "step": 2205, "valid_targets_mean": 6181.9, "valid_targets_min": 2042 }, { "epoch": 3.7205387205387206, "grad_norm": 0.4330257446398321, "learning_rate": 2.1308760710085706e-05, "loss": 0.2605, "loss_nan_ranks": 0, "loss_rank_avg": 0.23315058648586273, "step": 2210, "valid_targets_mean": 6284.3, "valid_targets_min": 3800 }, { "epoch": 3.728956228956229, "grad_norm": 0.4590373305942424, "learning_rate": 2.1224974463389892e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.24978694319725037, "step": 2215, "valid_targets_mean": 6140.1, "valid_targets_min": 3554 }, { "epoch": 3.7373737373737375, "grad_norm": 0.48529430064128043, "learning_rate": 2.1141166631369418e-05, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.24444152414798737, "step": 2220, "valid_targets_mean": 4900.2, "valid_targets_min": 834 }, { "epoch": 3.7457912457912457, "grad_norm": 0.48562007061040907, "learning_rate": 2.1057338690805485e-05, "loss": 0.2666, "loss_nan_ranks": 0, "loss_rank_avg": 0.2763746678829193, "step": 2225, "valid_targets_mean": 5667.4, "valid_targets_min": 2152 }, { "epoch": 3.7542087542087543, "grad_norm": 0.45153067684291887, "learning_rate": 2.0973492118833633e-05, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.2593878209590912, "step": 2230, "valid_targets_mean": 5811.3, "valid_targets_min": 2868 }, { "epoch": 3.7626262626262625, "grad_norm": 0.46947043053986687, "learning_rate": 2.08896283929177e-05, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.2528648376464844, "step": 2235, "valid_targets_mean": 5667.5, "valid_targets_min": 577 }, { "epoch": 3.771043771043771, "grad_norm": 0.443062772560876, "learning_rate": 2.0805748990823808e-05, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.23090139031410217, "step": 2240, "valid_targets_mean": 5894.3, "valid_targets_min": 4097 }, { "epoch": 3.7794612794612794, "grad_norm": 0.46928488809946345, "learning_rate": 2.0721855390594294e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.23324617743492126, "step": 2245, "valid_targets_mean": 6142.8, "valid_targets_min": 3662 }, { "epoch": 3.787878787878788, "grad_norm": 0.4713367550706847, "learning_rate": 2.0637949070521688e-05, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.2696024775505066, "step": 2250, "valid_targets_mean": 6141.5, "valid_targets_min": 2133 }, { "epoch": 3.7962962962962963, "grad_norm": 0.4392650932413215, "learning_rate": 2.0554031509122656e-05, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.2330874651670456, "step": 2255, "valid_targets_mean": 5963.0, "valid_targets_min": 3554 }, { "epoch": 3.8047138047138045, "grad_norm": 0.5082714907464522, "learning_rate": 2.0470104185111946e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.24720750749111176, "step": 2260, "valid_targets_mean": 5415.8, "valid_targets_min": 1997 }, { "epoch": 3.813131313131313, "grad_norm": 0.4335382849960993, "learning_rate": 2.0386168577376346e-05, "loss": 0.26, "loss_nan_ranks": 0, "loss_rank_avg": 0.2274424135684967, "step": 2265, "valid_targets_mean": 5680.9, "valid_targets_min": 529 }, { "epoch": 3.821548821548822, "grad_norm": 0.46601152865749573, "learning_rate": 2.0302226164948592e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.2622186541557312, "step": 2270, "valid_targets_mean": 5564.1, "valid_targets_min": 1668 }, { "epoch": 3.82996632996633, "grad_norm": 0.4340781482822856, "learning_rate": 2.0218278426981332e-05, "loss": 0.2473, "loss_nan_ranks": 0, "loss_rank_avg": 0.23421743512153625, "step": 2275, "valid_targets_mean": 5899.7, "valid_targets_min": 738 }, { "epoch": 3.8383838383838382, "grad_norm": 0.4734907148873857, "learning_rate": 2.013432684272107e-05, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.2441825568675995, "step": 2280, "valid_targets_mean": 5232.0, "valid_targets_min": 572 }, { "epoch": 3.846801346801347, "grad_norm": 0.5215053718016555, "learning_rate": 2.0050372891482065e-05, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.26573556661605835, "step": 2285, "valid_targets_mean": 5406.9, "valid_targets_min": 877 }, { "epoch": 3.855218855218855, "grad_norm": 0.43539608646753364, "learning_rate": 1.99664180526203e-05, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.2478955239057541, "step": 2290, "valid_targets_mean": 6055.0, "valid_targets_min": 3749 }, { "epoch": 3.8636363636363638, "grad_norm": 0.44650430172333616, "learning_rate": 1.988246380550739e-05, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.23736608028411865, "step": 2295, "valid_targets_mean": 5916.8, "valid_targets_min": 766 }, { "epoch": 3.872053872053872, "grad_norm": 0.4753554150730085, "learning_rate": 1.9798511629504526e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.26632919907569885, "step": 2300, "valid_targets_mean": 5875.3, "valid_targets_min": 2644 }, { "epoch": 3.8804713804713806, "grad_norm": 0.663332930647706, "learning_rate": 1.9714563003936414e-05, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.28136366605758667, "step": 2305, "valid_targets_mean": 5596.1, "valid_targets_min": 851 }, { "epoch": 3.888888888888889, "grad_norm": 0.4370023219399334, "learning_rate": 1.9630619408065166e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.23587965965270996, "step": 2310, "valid_targets_mean": 5893.2, "valid_targets_min": 570 }, { "epoch": 3.897306397306397, "grad_norm": 0.46508686514621095, "learning_rate": 1.9546682321064296e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.2453293353319168, "step": 2315, "valid_targets_mean": 5837.5, "valid_targets_min": 2215 }, { "epoch": 3.9057239057239057, "grad_norm": 0.4982192014247366, "learning_rate": 1.9462753221992625e-05, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.24440611898899078, "step": 2320, "valid_targets_mean": 5267.2, "valid_targets_min": 465 }, { "epoch": 3.9141414141414144, "grad_norm": 0.4805922369728175, "learning_rate": 1.9378833589768196e-05, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.24339064955711365, "step": 2325, "valid_targets_mean": 5242.2, "valid_targets_min": 2388 }, { "epoch": 3.9225589225589226, "grad_norm": 0.451836362923565, "learning_rate": 1.9294924903142252e-05, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.2769237458705902, "step": 2330, "valid_targets_mean": 6302.6, "valid_targets_min": 2157 }, { "epoch": 3.930976430976431, "grad_norm": 0.4735168791034422, "learning_rate": 1.9211028640673173e-05, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.25596874952316284, "step": 2335, "valid_targets_mean": 5781.4, "valid_targets_min": 1809 }, { "epoch": 3.9393939393939394, "grad_norm": 0.49285584030359986, "learning_rate": 1.9127146280700384e-05, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.2413105070590973, "step": 2340, "valid_targets_mean": 5354.1, "valid_targets_min": 580 }, { "epoch": 3.9478114478114477, "grad_norm": 0.45921191146130463, "learning_rate": 1.9043279301318365e-05, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.2670944333076477, "step": 2345, "valid_targets_mean": 5593.6, "valid_targets_min": 736 }, { "epoch": 3.9562289562289563, "grad_norm": 0.46211290571675284, "learning_rate": 1.895942918035054e-05, "loss": 0.2517, "loss_nan_ranks": 0, "loss_rank_avg": 0.24511289596557617, "step": 2350, "valid_targets_mean": 5811.6, "valid_targets_min": 2208 }, { "epoch": 3.9646464646464645, "grad_norm": 0.4794002903772811, "learning_rate": 1.88755973953233e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.2600766122341156, "step": 2355, "valid_targets_mean": 5570.6, "valid_targets_min": 3574 }, { "epoch": 3.973063973063973, "grad_norm": 0.4611418225959471, "learning_rate": 1.8791785423439926e-05, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.2635408043861389, "step": 2360, "valid_targets_mean": 5771.7, "valid_targets_min": 753 }, { "epoch": 3.9814814814814814, "grad_norm": 0.4364240728827987, "learning_rate": 1.8707994741554565e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.24071215093135834, "step": 2365, "valid_targets_mean": 6022.0, "valid_targets_min": 2766 }, { "epoch": 3.98989898989899, "grad_norm": 0.4868677738278521, "learning_rate": 1.8624226826146228e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.2623073160648346, "step": 2370, "valid_targets_mean": 5395.6, "valid_targets_min": 2961 }, { "epoch": 3.9983164983164983, "grad_norm": 0.43425493407176013, "learning_rate": 1.8540483153292736e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.24014857411384583, "step": 2375, "valid_targets_mean": 6008.5, "valid_targets_min": 4815 }, { "epoch": 4.006734006734007, "grad_norm": 0.47405743239962633, "learning_rate": 1.8456765198644747e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.2570481300354004, "step": 2380, "valid_targets_mean": 5911.1, "valid_targets_min": 5134 }, { "epoch": 4.015151515151516, "grad_norm": 0.4869860772722204, "learning_rate": 1.8373074437399744e-05, "loss": 0.2455, "loss_nan_ranks": 0, "loss_rank_avg": 0.23833802342414856, "step": 2385, "valid_targets_mean": 5891.4, "valid_targets_min": 3355 }, { "epoch": 4.023569023569023, "grad_norm": 0.4846976942136745, "learning_rate": 1.8289412344276004e-05, "loss": 0.2534, "loss_nan_ranks": 0, "loss_rank_avg": 0.2526353597640991, "step": 2390, "valid_targets_mean": 5712.9, "valid_targets_min": 1880 }, { "epoch": 4.031986531986532, "grad_norm": 0.47446175331935553, "learning_rate": 1.8205780393486675e-05, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.24016064405441284, "step": 2395, "valid_targets_mean": 6065.6, "valid_targets_min": 3815 }, { "epoch": 4.040404040404041, "grad_norm": 0.5119722118605593, "learning_rate": 1.8122180058713738e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.2695065438747406, "step": 2400, "valid_targets_mean": 5231.4, "valid_targets_min": 2031 }, { "epoch": 4.048821548821548, "grad_norm": 0.4738469599038624, "learning_rate": 1.8038612813082084e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.23778414726257324, "step": 2405, "valid_targets_mean": 5650.5, "valid_targets_min": 777 }, { "epoch": 4.057239057239057, "grad_norm": 0.46284060268484284, "learning_rate": 1.7955080129133543e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.24119344353675842, "step": 2410, "valid_targets_mean": 6040.1, "valid_targets_min": 3473 }, { "epoch": 4.065656565656566, "grad_norm": 0.4970401933263894, "learning_rate": 1.7871583478800915e-05, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.24557490646839142, "step": 2415, "valid_targets_mean": 5264.2, "valid_targets_min": 1960 }, { "epoch": 4.074074074074074, "grad_norm": 0.45239648329446647, "learning_rate": 1.7788124333382064e-05, "loss": 0.2592, "loss_nan_ranks": 0, "loss_rank_avg": 0.2602667510509491, "step": 2420, "valid_targets_mean": 6043.5, "valid_targets_min": 2042 }, { "epoch": 4.082491582491582, "grad_norm": 0.4456410655388535, "learning_rate": 1.770470416351398e-05, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.234627828001976, "step": 2425, "valid_targets_mean": 5970.1, "valid_targets_min": 2800 }, { "epoch": 4.090909090909091, "grad_norm": 0.5192498075506568, "learning_rate": 1.7621324439146843e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.2598259150981903, "step": 2430, "valid_targets_mean": 5802.1, "valid_targets_min": 1828 }, { "epoch": 4.0993265993265995, "grad_norm": 0.5023479734758095, "learning_rate": 1.753798662951816e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.23720863461494446, "step": 2435, "valid_targets_mean": 5042.8, "valid_targets_min": 1555 }, { "epoch": 4.107744107744108, "grad_norm": 0.5293355450065484, "learning_rate": 1.745469220312685e-05, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.24346238374710083, "step": 2440, "valid_targets_mean": 6005.5, "valid_targets_min": 3947 }, { "epoch": 4.116161616161616, "grad_norm": 0.46485453409872673, "learning_rate": 1.7371442627707385e-05, "loss": 0.2437, "loss_nan_ranks": 0, "loss_rank_avg": 0.24842385947704315, "step": 2445, "valid_targets_mean": 6210.0, "valid_targets_min": 2189 }, { "epoch": 4.124579124579125, "grad_norm": 0.4401011838255257, "learning_rate": 1.72882393702039e-05, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.2509979009628296, "step": 2450, "valid_targets_mean": 5898.5, "valid_targets_min": 2221 }, { "epoch": 4.132996632996633, "grad_norm": 0.4977857748823478, "learning_rate": 1.7205083896744365e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.24902662634849548, "step": 2455, "valid_targets_mean": 5446.1, "valid_targets_min": 2169 }, { "epoch": 4.141414141414141, "grad_norm": 0.4736888568431637, "learning_rate": 1.712197767261476e-05, "loss": 0.247, "loss_nan_ranks": 0, "loss_rank_avg": 0.24341030418872833, "step": 2460, "valid_targets_mean": 5585.1, "valid_targets_min": 789 }, { "epoch": 4.14983164983165, "grad_norm": 0.47946329643831576, "learning_rate": 1.7038922162233224e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.23274879157543182, "step": 2465, "valid_targets_mean": 5161.8, "valid_targets_min": 1937 }, { "epoch": 4.158249158249158, "grad_norm": 0.4776304140534067, "learning_rate": 1.6955918829124252e-05, "loss": 0.2443, "loss_nan_ranks": 0, "loss_rank_avg": 0.2704820930957794, "step": 2470, "valid_targets_mean": 6214.0, "valid_targets_min": 2880 }, { "epoch": 4.166666666666667, "grad_norm": 0.48354690048207816, "learning_rate": 1.6872969135892963e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.261080801486969, "step": 2475, "valid_targets_mean": 5749.2, "valid_targets_min": 2662 }, { "epoch": 4.175084175084175, "grad_norm": 0.51929036494525, "learning_rate": 1.6790074544199257e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.2342805117368698, "step": 2480, "valid_targets_mean": 4718.4, "valid_targets_min": 596 }, { "epoch": 4.183501683501683, "grad_norm": 0.4767487596980206, "learning_rate": 1.670723651473209e-05, "loss": 0.2416, "loss_nan_ranks": 0, "loss_rank_avg": 0.2481677085161209, "step": 2485, "valid_targets_mean": 6451.2, "valid_targets_min": 3580 }, { "epoch": 4.191919191919192, "grad_norm": 0.4908992003019385, "learning_rate": 1.6624456507183735e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.2497548609972, "step": 2490, "valid_targets_mean": 5495.7, "valid_targets_min": 524 }, { "epoch": 4.200336700336701, "grad_norm": 0.464864052610427, "learning_rate": 1.654173598022407e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.23745915293693542, "step": 2495, "valid_targets_mean": 5795.8, "valid_targets_min": 744 }, { "epoch": 4.2087542087542085, "grad_norm": 0.5125678578793912, "learning_rate": 1.645907639147484e-05, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.27014249563217163, "step": 2500, "valid_targets_mean": 5685.8, "valid_targets_min": 778 }, { "epoch": 4.217171717171717, "grad_norm": 0.47049554426126494, "learning_rate": 1.6376479197484028e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.21898922324180603, "step": 2505, "valid_targets_mean": 5405.2, "valid_targets_min": 1019 }, { "epoch": 4.225589225589226, "grad_norm": 0.47870546675653486, "learning_rate": 1.629394585370011e-05, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.25341683626174927, "step": 2510, "valid_targets_mean": 6033.2, "valid_targets_min": 1807 }, { "epoch": 4.2340067340067336, "grad_norm": 0.46327108777649934, "learning_rate": 1.6211477814446498e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.25074249505996704, "step": 2515, "valid_targets_mean": 5824.4, "valid_targets_min": 2207 }, { "epoch": 4.242424242424242, "grad_norm": 0.46668716627675316, "learning_rate": 1.6129076532895853e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.23657959699630737, "step": 2520, "valid_targets_mean": 5824.7, "valid_targets_min": 2845 }, { "epoch": 4.250841750841751, "grad_norm": 0.5225102540153259, "learning_rate": 1.604674346104449e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.26022762060165405, "step": 2525, "valid_targets_mean": 4983.4, "valid_targets_min": 809 }, { "epoch": 4.2592592592592595, "grad_norm": 0.47507759485734535, "learning_rate": 1.596448004968681e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.21946153044700623, "step": 2530, "valid_targets_mean": 5204.6, "valid_targets_min": 806 }, { "epoch": 4.267676767676767, "grad_norm": 0.4691020718582385, "learning_rate": 1.5882287748389716e-05, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.2251463383436203, "step": 2535, "valid_targets_mean": 5837.6, "valid_targets_min": 3772 }, { "epoch": 4.276094276094276, "grad_norm": 0.508551212418667, "learning_rate": 1.5800168005467083e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.24717667698860168, "step": 2540, "valid_targets_mean": 5223.6, "valid_targets_min": 1273 }, { "epoch": 4.284511784511785, "grad_norm": 0.49267867623234085, "learning_rate": 1.5718122267954232e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.2596457302570343, "step": 2545, "valid_targets_mean": 5383.6, "valid_targets_min": 1619 }, { "epoch": 4.292929292929293, "grad_norm": 0.48887693296457063, "learning_rate": 1.5636151981582417e-05, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.2524750232696533, "step": 2550, "valid_targets_mean": 5214.6, "valid_targets_min": 2469 }, { "epoch": 4.301346801346801, "grad_norm": 0.47058944318885165, "learning_rate": 1.5554258590753388e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.24721063673496246, "step": 2555, "valid_targets_mean": 5628.5, "valid_targets_min": 3056 }, { "epoch": 4.30976430976431, "grad_norm": 0.4695975900983712, "learning_rate": 1.5472443538513894e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.23654913902282715, "step": 2560, "valid_targets_mean": 5601.7, "valid_targets_min": 648 }, { "epoch": 4.318181818181818, "grad_norm": 0.4853336295956766, "learning_rate": 1.5390708266530288e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.257931113243103, "step": 2565, "valid_targets_mean": 5604.9, "valid_targets_min": 706 }, { "epoch": 4.326599326599327, "grad_norm": 0.469469857279881, "learning_rate": 1.530905421506312e-05, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.25359490513801575, "step": 2570, "valid_targets_mean": 5639.9, "valid_targets_min": 1609 }, { "epoch": 4.335016835016835, "grad_norm": 0.49705236539026776, "learning_rate": 1.5227482822941725e-05, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.2658868134021759, "step": 2575, "valid_targets_mean": 5859.4, "valid_targets_min": 702 }, { "epoch": 4.343434343434343, "grad_norm": 0.5576981250686313, "learning_rate": 1.5145995527538918e-05, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.2369997501373291, "step": 2580, "valid_targets_mean": 5897.0, "valid_targets_min": 1842 }, { "epoch": 4.351851851851852, "grad_norm": 0.4688656894324779, "learning_rate": 1.506459376474564e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.24687042832374573, "step": 2585, "valid_targets_mean": 5883.9, "valid_targets_min": 3493 }, { "epoch": 4.36026936026936, "grad_norm": 0.47447175952384196, "learning_rate": 1.4983278968945638e-05, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.24589446187019348, "step": 2590, "valid_targets_mean": 6050.8, "valid_targets_min": 3455 }, { "epoch": 4.3686868686868685, "grad_norm": 0.4834177789093981, "learning_rate": 1.4902052572990236e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.2334013432264328, "step": 2595, "valid_targets_mean": 5976.0, "valid_targets_min": 4277 }, { "epoch": 4.377104377104377, "grad_norm": 0.4725416804232908, "learning_rate": 1.4820916008173039e-05, "loss": 0.2518, "loss_nan_ranks": 0, "loss_rank_avg": 0.24257586896419525, "step": 2600, "valid_targets_mean": 6083.2, "valid_targets_min": 5017 }, { "epoch": 4.385521885521886, "grad_norm": 0.4945988617073285, "learning_rate": 1.4739870704204746e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.2596173882484436, "step": 2605, "valid_targets_mean": 5484.8, "valid_targets_min": 495 }, { "epoch": 4.393939393939394, "grad_norm": 0.4455712778477704, "learning_rate": 1.4658918089187952e-05, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.2324620634317398, "step": 2610, "valid_targets_mean": 6543.8, "valid_targets_min": 5223 }, { "epoch": 4.402356902356902, "grad_norm": 0.4682972971703617, "learning_rate": 1.4578059589591953e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.24419406056404114, "step": 2615, "valid_targets_mean": 6016.2, "valid_targets_min": 3048 }, { "epoch": 4.410774410774411, "grad_norm": 0.7488896871745445, "learning_rate": 1.4497296630227658e-05, "loss": 0.2416, "loss_nan_ranks": 0, "loss_rank_avg": 0.2361116111278534, "step": 2620, "valid_targets_mean": 4575.4, "valid_targets_min": 509 }, { "epoch": 4.41919191919192, "grad_norm": 0.49298367487554073, "learning_rate": 1.4416630634222449e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.2516939043998718, "step": 2625, "valid_targets_mean": 6001.4, "valid_targets_min": 4759 }, { "epoch": 4.427609427609427, "grad_norm": 0.4773695575753377, "learning_rate": 1.4336063022995102e-05, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.2478029727935791, "step": 2630, "valid_targets_mean": 6015.2, "valid_targets_min": 1735 }, { "epoch": 4.436026936026936, "grad_norm": 0.4858496060742026, "learning_rate": 1.4255595216230753e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.2524571418762207, "step": 2635, "valid_targets_mean": 5901.1, "valid_targets_min": 4608 }, { "epoch": 4.444444444444445, "grad_norm": 0.46779566482936225, "learning_rate": 1.4175228631855902e-05, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.27151983976364136, "step": 2640, "valid_targets_mean": 6261.8, "valid_targets_min": 2048 }, { "epoch": 4.452861952861953, "grad_norm": 0.5098921296763699, "learning_rate": 1.4094964686013381e-05, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.2560115456581116, "step": 2645, "valid_targets_mean": 5527.9, "valid_targets_min": 771 }, { "epoch": 4.461279461279461, "grad_norm": 0.4963397756532333, "learning_rate": 1.4014804793037434e-05, "loss": 0.2407, "loss_nan_ranks": 0, "loss_rank_avg": 0.24187448620796204, "step": 2650, "valid_targets_mean": 5302.6, "valid_targets_min": 791 }, { "epoch": 4.46969696969697, "grad_norm": 0.4720446760534927, "learning_rate": 1.3934750365428783e-05, "loss": 0.2402, "loss_nan_ranks": 0, "loss_rank_avg": 0.24175631999969482, "step": 2655, "valid_targets_mean": 6306.9, "valid_targets_min": 3272 }, { "epoch": 4.478114478114478, "grad_norm": 0.4494062792812156, "learning_rate": 1.3854802813829744e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.23085647821426392, "step": 2660, "valid_targets_mean": 6597.3, "valid_targets_min": 5296 }, { "epoch": 4.486531986531986, "grad_norm": 0.5505872162256524, "learning_rate": 1.3774963546999364e-05, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.2597641348838806, "step": 2665, "valid_targets_mean": 4935.4, "valid_targets_min": 728 }, { "epoch": 4.494949494949495, "grad_norm": 0.4547480815464649, "learning_rate": 1.3695233971788592e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.2259209305047989, "step": 2670, "valid_targets_mean": 5772.8, "valid_targets_min": 1067 }, { "epoch": 4.5033670033670035, "grad_norm": 0.49796826408398476, "learning_rate": 1.3615615493115509e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.2491885870695114, "step": 2675, "valid_targets_mean": 5509.8, "valid_targets_min": 2095 }, { "epoch": 4.511784511784512, "grad_norm": 0.4675189339816609, "learning_rate": 1.3536109513940556e-05, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.2503166198730469, "step": 2680, "valid_targets_mean": 6271.0, "valid_targets_min": 3815 }, { "epoch": 4.52020202020202, "grad_norm": 0.4910407602321847, "learning_rate": 1.3456717435241808e-05, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.2446977198123932, "step": 2685, "valid_targets_mean": 5576.9, "valid_targets_min": 3428 }, { "epoch": 4.5286195286195285, "grad_norm": 0.4834526315851509, "learning_rate": 1.3377440655990307e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.2552727460861206, "step": 2690, "valid_targets_mean": 5595.2, "valid_targets_min": 1965 }, { "epoch": 4.537037037037037, "grad_norm": 0.501007163784396, "learning_rate": 1.3298280573125392e-05, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.22512459754943848, "step": 2695, "valid_targets_mean": 5356.6, "valid_targets_min": 2819 }, { "epoch": 4.545454545454545, "grad_norm": 0.49703879208215895, "learning_rate": 1.321923858153009e-05, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.24406014382839203, "step": 2700, "valid_targets_mean": 5361.9, "valid_targets_min": 875 }, { "epoch": 4.553872053872054, "grad_norm": 0.4660714609745113, "learning_rate": 1.3140316074006545e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.22664999961853027, "step": 2705, "valid_targets_mean": 5331.6, "valid_targets_min": 2224 }, { "epoch": 4.562289562289562, "grad_norm": 0.49471186723664107, "learning_rate": 1.3061514441251446e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508906424045563, "step": 2710, "valid_targets_mean": 5700.0, "valid_targets_min": 3778 }, { "epoch": 4.570707070707071, "grad_norm": 0.48226739181141126, "learning_rate": 1.2982835071831565e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.2557341456413269, "step": 2715, "valid_targets_mean": 6064.6, "valid_targets_min": 3898 }, { "epoch": 4.57912457912458, "grad_norm": 0.5920571149767186, "learning_rate": 1.2904279352159264e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.23203839361667633, "step": 2720, "valid_targets_mean": 5828.5, "valid_targets_min": 3282 }, { "epoch": 4.587542087542087, "grad_norm": 0.5112076721317061, "learning_rate": 1.2825848666468052e-05, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.26419830322265625, "step": 2725, "valid_targets_mean": 6003.7, "valid_targets_min": 4170 }, { "epoch": 4.595959595959596, "grad_norm": 0.5154589913874446, "learning_rate": 1.274754439678823e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.2602817416191101, "step": 2730, "valid_targets_mean": 5174.1, "valid_targets_min": 1954 }, { "epoch": 4.604377104377105, "grad_norm": 0.4792667230253282, "learning_rate": 1.2669367922922504e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.24768483638763428, "step": 2735, "valid_targets_mean": 6099.4, "valid_targets_min": 4942 }, { "epoch": 4.6127946127946124, "grad_norm": 0.48102648961761757, "learning_rate": 1.2591320622421686e-05, "loss": 0.2411, "loss_nan_ranks": 0, "loss_rank_avg": 0.23812749981880188, "step": 2740, "valid_targets_mean": 5808.0, "valid_targets_min": 2587 }, { "epoch": 4.621212121212121, "grad_norm": 0.48280565166454636, "learning_rate": 1.2513403870560429e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.2352055013179779, "step": 2745, "valid_targets_mean": 5633.4, "valid_targets_min": 3291 }, { "epoch": 4.62962962962963, "grad_norm": 0.5394317361742055, "learning_rate": 1.2435619040312963e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.2418336272239685, "step": 2750, "valid_targets_mean": 6345.4, "valid_targets_min": 4447 }, { "epoch": 4.638047138047138, "grad_norm": 0.5264541632883329, "learning_rate": 1.2357967502328943e-05, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.2687990367412567, "step": 2755, "valid_targets_mean": 6275.9, "valid_targets_min": 4262 }, { "epoch": 4.646464646464646, "grad_norm": 0.49314757440762375, "learning_rate": 1.2280450624909257e-05, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.2628011107444763, "step": 2760, "valid_targets_mean": 5708.2, "valid_targets_min": 806 }, { "epoch": 4.654882154882155, "grad_norm": 0.4595389422928486, "learning_rate": 1.2203069773981953e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.2331043779850006, "step": 2765, "valid_targets_mean": 6120.2, "valid_targets_min": 2674 }, { "epoch": 4.6632996632996635, "grad_norm": 0.5303579086202546, "learning_rate": 1.2125826313078144e-05, "loss": 0.2473, "loss_nan_ranks": 0, "loss_rank_avg": 0.24351969361305237, "step": 2770, "valid_targets_mean": 4967.9, "valid_targets_min": 789 }, { "epoch": 4.671717171717171, "grad_norm": 0.4757122640440963, "learning_rate": 1.2048721603307971e-05, "loss": 0.2283, "loss_nan_ranks": 0, "loss_rank_avg": 0.21351343393325806, "step": 2775, "valid_targets_mean": 5402.2, "valid_targets_min": 2497 }, { "epoch": 4.68013468013468, "grad_norm": 0.49558312945900046, "learning_rate": 1.1971757003336661e-05, "loss": 0.244, "loss_nan_ranks": 0, "loss_rank_avg": 0.23598149418830872, "step": 2780, "valid_targets_mean": 5560.8, "valid_targets_min": 3411 }, { "epoch": 4.688552188552189, "grad_norm": 0.5070715903913475, "learning_rate": 1.1894933869360555e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.2461165487766266, "step": 2785, "valid_targets_mean": 5727.7, "valid_targets_min": 4203 }, { "epoch": 4.696969696969697, "grad_norm": 0.5205203781186487, "learning_rate": 1.1818253555083192e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.27181577682495117, "step": 2790, "valid_targets_mean": 5783.8, "valid_targets_min": 1486 }, { "epoch": 4.705387205387205, "grad_norm": 0.4816612147414662, "learning_rate": 1.1741717411691509e-05, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.2371402531862259, "step": 2795, "valid_targets_mean": 5769.2, "valid_targets_min": 1968 }, { "epoch": 4.713804713804714, "grad_norm": 0.47718296915439024, "learning_rate": 1.1665326787831983e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.22365979850292206, "step": 2800, "valid_targets_mean": 6007.6, "valid_targets_min": 3942 }, { "epoch": 4.722222222222222, "grad_norm": 0.4796220783634332, "learning_rate": 1.1589083029586906e-05, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.23196230828762054, "step": 2805, "valid_targets_mean": 5937.4, "valid_targets_min": 2363 }, { "epoch": 4.730639730639731, "grad_norm": 0.47684003132237357, "learning_rate": 1.1512987480450612e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.2604638934135437, "step": 2810, "valid_targets_mean": 5854.0, "valid_targets_min": 2407 }, { "epoch": 4.739057239057239, "grad_norm": 0.4874748967420592, "learning_rate": 1.1437041481305877e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.24680189788341522, "step": 2815, "valid_targets_mean": 5404.6, "valid_targets_min": 688 }, { "epoch": 4.747474747474747, "grad_norm": 0.48612021159408475, "learning_rate": 1.1361246370400221e-05, "loss": 0.2453, "loss_nan_ranks": 0, "loss_rank_avg": 0.24513094127178192, "step": 2820, "valid_targets_mean": 5797.8, "valid_targets_min": 2659 }, { "epoch": 4.755892255892256, "grad_norm": 0.48208763672646515, "learning_rate": 1.1285603483322362e-05, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.26105183362960815, "step": 2825, "valid_targets_mean": 5589.4, "valid_targets_min": 572 }, { "epoch": 4.764309764309765, "grad_norm": 0.5015272529735295, "learning_rate": 1.1210114152978683e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.23148992657661438, "step": 2830, "valid_targets_mean": 5191.4, "valid_targets_min": 1249 }, { "epoch": 4.7727272727272725, "grad_norm": 0.47511244937891034, "learning_rate": 1.1134779709569732e-05, "loss": 0.2331, "loss_nan_ranks": 0, "loss_rank_avg": 0.22913163900375366, "step": 2835, "valid_targets_mean": 6066.2, "valid_targets_min": 963 }, { "epoch": 4.781144781144781, "grad_norm": 0.47372641919213665, "learning_rate": 1.1059601480566781e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.24431616067886353, "step": 2840, "valid_targets_mean": 6332.1, "valid_targets_min": 4314 }, { "epoch": 4.78956228956229, "grad_norm": 0.49151338626590396, "learning_rate": 1.0984580790688463e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.257941335439682, "step": 2845, "valid_targets_mean": 5998.0, "valid_targets_min": 4609 }, { "epoch": 4.797979797979798, "grad_norm": 0.4624557972804474, "learning_rate": 1.0909718961877385e-05, "loss": 0.235, "loss_nan_ranks": 0, "loss_rank_avg": 0.21516473591327667, "step": 2850, "valid_targets_mean": 6487.0, "valid_targets_min": 4000 }, { "epoch": 4.806397306397306, "grad_norm": 0.48375209307777617, "learning_rate": 1.0835017313276874e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.22575807571411133, "step": 2855, "valid_targets_mean": 5556.9, "valid_targets_min": 807 }, { "epoch": 4.814814814814815, "grad_norm": 0.47388280379263475, "learning_rate": 1.0760477161207707e-05, "loss": 0.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.21567316353321075, "step": 2860, "valid_targets_mean": 5498.6, "valid_targets_min": 737 }, { "epoch": 4.8232323232323235, "grad_norm": 0.45953983274977706, "learning_rate": 1.068609981914492e-05, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.24462053179740906, "step": 2865, "valid_targets_mean": 5789.3, "valid_targets_min": 1753 }, { "epoch": 4.831649831649831, "grad_norm": 0.6013089443836538, "learning_rate": 1.0611886597694672e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.22891020774841309, "step": 2870, "valid_targets_mean": 6236.3, "valid_targets_min": 2824 }, { "epoch": 4.84006734006734, "grad_norm": 0.4765798783055637, "learning_rate": 1.0537838804571145e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.2332342267036438, "step": 2875, "valid_targets_mean": 5363.1, "valid_targets_min": 1997 }, { "epoch": 4.848484848484849, "grad_norm": 0.4850073815980291, "learning_rate": 1.0463957744573502e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.23898157477378845, "step": 2880, "valid_targets_mean": 5507.9, "valid_targets_min": 1004 }, { "epoch": 4.856902356902357, "grad_norm": 0.4732284576996267, "learning_rate": 1.0390244719562901e-05, "loss": 0.2385, "loss_nan_ranks": 0, "loss_rank_avg": 0.2569975256919861, "step": 2885, "valid_targets_mean": 6173.3, "valid_targets_min": 2158 }, { "epoch": 4.865319865319865, "grad_norm": 0.5066251528378924, "learning_rate": 1.031670102843954e-05, "loss": 0.2455, "loss_nan_ranks": 0, "loss_rank_avg": 0.23153352737426758, "step": 2890, "valid_targets_mean": 5168.5, "valid_targets_min": 786 }, { "epoch": 4.873737373737374, "grad_norm": 0.4927142942425226, "learning_rate": 1.0243327967119772e-05, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.24447093904018402, "step": 2895, "valid_targets_mean": 5767.2, "valid_targets_min": 3057 }, { "epoch": 4.882154882154882, "grad_norm": 0.47799262367577505, "learning_rate": 1.0170126828513301e-05, "loss": 0.239, "loss_nan_ranks": 0, "loss_rank_avg": 0.23044052720069885, "step": 2900, "valid_targets_mean": 5838.8, "valid_targets_min": 2031 }, { "epoch": 4.890572390572391, "grad_norm": 0.47677839550243056, "learning_rate": 1.0097098902500346e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.23265433311462402, "step": 2905, "valid_targets_mean": 5649.4, "valid_targets_min": 713 }, { "epoch": 4.898989898989899, "grad_norm": 0.46809374636357964, "learning_rate": 1.0024245475908956e-05, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.2440536618232727, "step": 2910, "valid_targets_mean": 6046.9, "valid_targets_min": 4710 }, { "epoch": 4.907407407407407, "grad_norm": 0.5025997220995649, "learning_rate": 9.951567832492308e-06, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.2694641351699829, "step": 2915, "valid_targets_mean": 5369.6, "valid_targets_min": 1971 }, { "epoch": 4.915824915824916, "grad_norm": 0.5128476244209108, "learning_rate": 9.879067252906098e-06, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.2652130126953125, "step": 2920, "valid_targets_mean": 5546.7, "valid_targets_min": 628 }, { "epoch": 4.924242424242424, "grad_norm": 0.46637613972668973, "learning_rate": 9.80674501468599e-06, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2279430627822876, "step": 2925, "valid_targets_mean": 5847.3, "valid_targets_min": 2707 }, { "epoch": 4.9326599326599325, "grad_norm": 0.48287729943481417, "learning_rate": 9.734602392225068e-06, "loss": 0.2304, "loss_nan_ranks": 0, "loss_rank_avg": 0.22361034154891968, "step": 2930, "valid_targets_mean": 5502.1, "valid_targets_min": 3942 }, { "epoch": 4.941077441077441, "grad_norm": 0.46786670784817613, "learning_rate": 9.662640656751396e-06, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.2460593581199646, "step": 2935, "valid_targets_mean": 6188.2, "valid_targets_min": 3514 }, { "epoch": 4.94949494949495, "grad_norm": 0.5252202199058081, "learning_rate": 9.59086107630565e-06, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.2338843047618866, "step": 2940, "valid_targets_mean": 4835.6, "valid_targets_min": 923 }, { "epoch": 4.957912457912458, "grad_norm": 0.4519621375125666, "learning_rate": 9.519264915718717e-06, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.22045472264289856, "step": 2945, "valid_targets_mean": 6158.5, "valid_targets_min": 2283 }, { "epoch": 4.966329966329966, "grad_norm": 0.4651056142527175, "learning_rate": 9.447853436589444e-06, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.23641371726989746, "step": 2950, "valid_targets_mean": 5869.6, "valid_targets_min": 2270 }, { "epoch": 4.974747474747475, "grad_norm": 0.48650730476506754, "learning_rate": 9.3766278972624e-06, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.2378322184085846, "step": 2955, "valid_targets_mean": 5616.4, "valid_targets_min": 627 }, { "epoch": 4.983164983164983, "grad_norm": 0.48351848812987125, "learning_rate": 9.305589552805691e-06, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.21766245365142822, "step": 2960, "valid_targets_mean": 5461.8, "valid_targets_min": 524 }, { "epoch": 4.991582491582491, "grad_norm": 0.4855323304121959, "learning_rate": 9.234739654988879e-06, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.22696718573570251, "step": 2965, "valid_targets_mean": 6261.7, "valid_targets_min": 1713 }, { "epoch": 5.0, "grad_norm": 0.4832993346496243, "learning_rate": 9.164079452260874e-06, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.23409955203533173, "step": 2970, "valid_targets_mean": 5369.6, "valid_targets_min": 976 }, { "epoch": 5.008417508417509, "grad_norm": 0.485975550813503, "learning_rate": 9.09361018972797e-06, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.2630172371864319, "step": 2975, "valid_targets_mean": 6245.8, "valid_targets_min": 875 }, { "epoch": 5.016835016835016, "grad_norm": 0.5183945191375198, "learning_rate": 9.02333310913191e-06, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.22702479362487793, "step": 2980, "valid_targets_mean": 6026.0, "valid_targets_min": 2934 }, { "epoch": 5.025252525252525, "grad_norm": 0.5186739982406766, "learning_rate": 8.953249448827971e-06, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.22462819516658783, "step": 2985, "valid_targets_mean": 5457.3, "valid_targets_min": 2304 }, { "epoch": 5.033670033670034, "grad_norm": 0.47871125321551317, "learning_rate": 8.883360443763174e-06, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.22352522611618042, "step": 2990, "valid_targets_mean": 5989.8, "valid_targets_min": 3942 }, { "epoch": 5.042087542087542, "grad_norm": 0.47853857657725507, "learning_rate": 8.813667325454507e-06, "loss": 0.2269, "loss_nan_ranks": 0, "loss_rank_avg": 0.21468524634838104, "step": 2995, "valid_targets_mean": 5990.2, "valid_targets_min": 4922 }, { "epoch": 5.05050505050505, "grad_norm": 0.5165248585624271, "learning_rate": 8.744171321967233e-06, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.2386196106672287, "step": 3000, "valid_targets_mean": 5385.9, "valid_targets_min": 642 }, { "epoch": 5.058922558922559, "grad_norm": 0.46595854294199934, "learning_rate": 8.674873657893236e-06, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.23446813225746155, "step": 3005, "valid_targets_mean": 6161.8, "valid_targets_min": 3469 }, { "epoch": 5.0673400673400675, "grad_norm": 0.5168319359581155, "learning_rate": 8.605775554329486e-06, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.23876196146011353, "step": 3010, "valid_targets_mean": 5390.1, "valid_targets_min": 577 }, { "epoch": 5.075757575757576, "grad_norm": 0.46775467689427314, "learning_rate": 8.536878228856447e-06, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.2268284261226654, "step": 3015, "valid_targets_mean": 6205.7, "valid_targets_min": 2397 }, { "epoch": 5.084175084175084, "grad_norm": 0.5205111573678236, "learning_rate": 8.468182895516685e-06, "loss": 0.2473, "loss_nan_ranks": 0, "loss_rank_avg": 0.2528153657913208, "step": 3020, "valid_targets_mean": 6040.9, "valid_targets_min": 1732 }, { "epoch": 5.092592592592593, "grad_norm": 0.5195827014329844, "learning_rate": 8.399690764793464e-06, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.22744807600975037, "step": 3025, "valid_targets_mean": 5111.1, "valid_targets_min": 882 }, { "epoch": 5.101010101010101, "grad_norm": 0.49170918864423774, "learning_rate": 8.331403043589387e-06, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.2277529537677765, "step": 3030, "valid_targets_mean": 5587.4, "valid_targets_min": 3947 }, { "epoch": 5.109427609427609, "grad_norm": 0.47195012869371583, "learning_rate": 8.26332093520516e-06, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.2412089854478836, "step": 3035, "valid_targets_mean": 6275.1, "valid_targets_min": 3853 }, { "epoch": 5.117845117845118, "grad_norm": 0.5116529738273514, "learning_rate": 8.195445639318369e-06, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.22236831486225128, "step": 3040, "valid_targets_mean": 5911.4, "valid_targets_min": 963 }, { "epoch": 5.126262626262626, "grad_norm": 0.5188254282626279, "learning_rate": 8.127778351962349e-06, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.2555454969406128, "step": 3045, "valid_targets_mean": 5581.8, "valid_targets_min": 834 }, { "epoch": 5.134680134680135, "grad_norm": 0.47352791612280154, "learning_rate": 8.06032026550513e-06, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.22536420822143555, "step": 3050, "valid_targets_mean": 6212.1, "valid_targets_min": 3591 }, { "epoch": 5.143097643097643, "grad_norm": 0.5161817528182612, "learning_rate": 7.993072568628378e-06, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.21615377068519592, "step": 3055, "valid_targets_mean": 5326.1, "valid_targets_min": 1984 }, { "epoch": 5.151515151515151, "grad_norm": 0.4674652659739291, "learning_rate": 7.926036446306473e-06, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.23871754109859467, "step": 3060, "valid_targets_mean": 6839.7, "valid_targets_min": 4102 }, { "epoch": 5.15993265993266, "grad_norm": 0.5193304210527502, "learning_rate": 7.859213079785665e-06, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.21915632486343384, "step": 3065, "valid_targets_mean": 5766.3, "valid_targets_min": 3637 }, { "epoch": 5.168350168350169, "grad_norm": 0.52661788686289, "learning_rate": 7.79260364656319e-06, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.24809540808200836, "step": 3070, "valid_targets_mean": 5621.6, "valid_targets_min": 744 }, { "epoch": 5.1767676767676765, "grad_norm": 0.5034046143594989, "learning_rate": 7.726209320366575e-06, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.22819620370864868, "step": 3075, "valid_targets_mean": 6095.1, "valid_targets_min": 3789 }, { "epoch": 5.185185185185185, "grad_norm": 0.5157047863687968, "learning_rate": 7.660031271132933e-06, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.2319592982530594, "step": 3080, "valid_targets_mean": 5742.2, "valid_targets_min": 2157 }, { "epoch": 5.193602693602694, "grad_norm": 0.5392072929319364, "learning_rate": 7.594070664988338e-06, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.2188304364681244, "step": 3085, "valid_targets_mean": 5194.3, "valid_targets_min": 828 }, { "epoch": 5.202020202020202, "grad_norm": 0.529921176347278, "learning_rate": 7.528328664227324e-06, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.244046151638031, "step": 3090, "valid_targets_mean": 5709.8, "valid_targets_min": 628 }, { "epoch": 5.21043771043771, "grad_norm": 0.5240479163794681, "learning_rate": 7.462806427292342e-06, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.22765925526618958, "step": 3095, "valid_targets_mean": 5149.2, "valid_targets_min": 753 }, { "epoch": 5.218855218855219, "grad_norm": 0.5136782077308949, "learning_rate": 7.397505108753378e-06, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.2189491093158722, "step": 3100, "valid_targets_mean": 5187.2, "valid_targets_min": 1968 }, { "epoch": 5.2272727272727275, "grad_norm": 0.5058540114550893, "learning_rate": 7.332425859287624e-06, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.262953519821167, "step": 3105, "valid_targets_mean": 6108.0, "valid_targets_min": 2633 }, { "epoch": 5.235690235690235, "grad_norm": 0.5158981797860003, "learning_rate": 7.2675698256591735e-06, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.22714978456497192, "step": 3110, "valid_targets_mean": 5883.8, "valid_targets_min": 2261 }, { "epoch": 5.244107744107744, "grad_norm": 0.5372180066384188, "learning_rate": 7.202938150698804e-06, "loss": 0.2331, "loss_nan_ranks": 0, "loss_rank_avg": 0.22206753492355347, "step": 3115, "valid_targets_mean": 4753.1, "valid_targets_min": 769 }, { "epoch": 5.252525252525253, "grad_norm": 0.46082204133963633, "learning_rate": 7.138531973283898e-06, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.2284386157989502, "step": 3120, "valid_targets_mean": 6732.4, "valid_targets_min": 4606 }, { "epoch": 5.260942760942761, "grad_norm": 0.5258612308182962, "learning_rate": 7.074352428318312e-06, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.23692598938941956, "step": 3125, "valid_targets_mean": 5280.9, "valid_targets_min": 927 }, { "epoch": 5.269360269360269, "grad_norm": 0.47852423674654065, "learning_rate": 7.010400646712401e-06, "loss": 0.2232, "loss_nan_ranks": 0, "loss_rank_avg": 0.20909680426120758, "step": 3130, "valid_targets_mean": 5772.5, "valid_targets_min": 2157 }, { "epoch": 5.277777777777778, "grad_norm": 0.4670349699487819, "learning_rate": 6.946677755363116e-06, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.21536147594451904, "step": 3135, "valid_targets_mean": 6276.1, "valid_targets_min": 3836 }, { "epoch": 5.286195286195286, "grad_norm": 0.47317451479187395, "learning_rate": 6.883184877134099e-06, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.2287386655807495, "step": 3140, "valid_targets_mean": 6471.6, "valid_targets_min": 2095 }, { "epoch": 5.294612794612795, "grad_norm": 0.4992948685768268, "learning_rate": 6.819923130835926e-06, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.22403103113174438, "step": 3145, "valid_targets_mean": 5905.2, "valid_targets_min": 2270 }, { "epoch": 5.303030303030303, "grad_norm": 0.49261776085093156, "learning_rate": 6.756893631206409e-06, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.24229532480239868, "step": 3150, "valid_targets_mean": 6232.4, "valid_targets_min": 2027 }, { "epoch": 5.311447811447811, "grad_norm": 0.5028192511116332, "learning_rate": 6.694097488890889e-06, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.260204553604126, "step": 3155, "valid_targets_mean": 5657.8, "valid_targets_min": 1273 }, { "epoch": 5.31986531986532, "grad_norm": 0.48478369016215206, "learning_rate": 6.63153581042276e-06, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.23380783200263977, "step": 3160, "valid_targets_mean": 6147.7, "valid_targets_min": 2819 }, { "epoch": 5.328282828282829, "grad_norm": 0.5458848519398222, "learning_rate": 6.56920969820388e-06, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.24366281926631927, "step": 3165, "valid_targets_mean": 5250.1, "valid_targets_min": 693 }, { "epoch": 5.3367003367003365, "grad_norm": 0.534336924740091, "learning_rate": 6.507120250485195e-06, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.225617915391922, "step": 3170, "valid_targets_mean": 5071.1, "valid_targets_min": 743 }, { "epoch": 5.345117845117845, "grad_norm": 0.5311919196381524, "learning_rate": 6.445268561347393e-06, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.23042187094688416, "step": 3175, "valid_targets_mean": 5667.2, "valid_targets_min": 1807 }, { "epoch": 5.353535353535354, "grad_norm": 0.6646559705802462, "learning_rate": 6.383655720681588e-06, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.22798696160316467, "step": 3180, "valid_targets_mean": 5714.7, "valid_targets_min": 2030 }, { "epoch": 5.361952861952862, "grad_norm": 0.48527450594210503, "learning_rate": 6.3222828141701335e-06, "loss": 0.2304, "loss_nan_ranks": 0, "loss_rank_avg": 0.22262442111968994, "step": 3185, "valid_targets_mean": 5532.1, "valid_targets_min": 849 }, { "epoch": 5.37037037037037, "grad_norm": 0.5089773350495819, "learning_rate": 6.261150923267525e-06, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.22977544367313385, "step": 3190, "valid_targets_mean": 5720.7, "valid_targets_min": 2546 }, { "epoch": 5.378787878787879, "grad_norm": 0.48608571702885467, "learning_rate": 6.200261125181262e-06, "loss": 0.2349, "loss_nan_ranks": 0, "loss_rank_avg": 0.258963018655777, "step": 3195, "valid_targets_mean": 6741.2, "valid_targets_min": 5102 }, { "epoch": 5.3872053872053876, "grad_norm": 0.5024329241116928, "learning_rate": 6.1396144928529614e-06, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.2263956516981125, "step": 3200, "valid_targets_mean": 5581.6, "valid_targets_min": 529 }, { "epoch": 5.395622895622895, "grad_norm": 0.49165929762887833, "learning_rate": 6.0792120949393885e-06, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.21596331894397736, "step": 3205, "valid_targets_mean": 5900.8, "valid_targets_min": 4528 }, { "epoch": 5.404040404040404, "grad_norm": 0.4624623310895367, "learning_rate": 6.019054995793634e-06, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.24683353304862976, "step": 3210, "valid_targets_mean": 6548.0, "valid_targets_min": 4096 }, { "epoch": 5.412457912457913, "grad_norm": 0.4918872774950123, "learning_rate": 5.959144255446392e-06, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.22914943099021912, "step": 3215, "valid_targets_mean": 5636.7, "valid_targets_min": 2221 }, { "epoch": 5.420875420875421, "grad_norm": 0.5236989395915803, "learning_rate": 5.899480929587243e-06, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.23069006204605103, "step": 3220, "valid_targets_mean": 5107.2, "valid_targets_min": 2261 }, { "epoch": 5.429292929292929, "grad_norm": 0.49362777785329914, "learning_rate": 5.840066069546062e-06, "loss": 0.2258, "loss_nan_ranks": 0, "loss_rank_avg": 0.23647350072860718, "step": 3225, "valid_targets_mean": 6049.1, "valid_targets_min": 2780 }, { "epoch": 5.437710437710438, "grad_norm": 0.5387261419400055, "learning_rate": 5.780900722274522e-06, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.25978630781173706, "step": 3230, "valid_targets_mean": 5692.9, "valid_targets_min": 2371 }, { "epoch": 5.446127946127946, "grad_norm": 0.5097787365388916, "learning_rate": 5.721985930327585e-06, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.22551800310611725, "step": 3235, "valid_targets_mean": 5662.1, "valid_targets_min": 1900 }, { "epoch": 5.454545454545454, "grad_norm": 0.4732570960654139, "learning_rate": 5.663322731845204e-06, "loss": 0.2252, "loss_nan_ranks": 0, "loss_rank_avg": 0.21448811888694763, "step": 3240, "valid_targets_mean": 6084.2, "valid_targets_min": 5120 }, { "epoch": 5.462962962962963, "grad_norm": 0.504245619409664, "learning_rate": 5.604912160533968e-06, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.23949390649795532, "step": 3245, "valid_targets_mean": 6064.9, "valid_targets_min": 4162 }, { "epoch": 5.4713804713804715, "grad_norm": 0.4844841529391725, "learning_rate": 5.546755245648918e-06, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.214034304022789, "step": 3250, "valid_targets_mean": 5519.1, "valid_targets_min": 1900 }, { "epoch": 5.47979797979798, "grad_norm": 0.5148425473218765, "learning_rate": 5.488853011975421e-06, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.2293565422296524, "step": 3255, "valid_targets_mean": 5810.1, "valid_targets_min": 3554 }, { "epoch": 5.488215488215488, "grad_norm": 0.5043263239532035, "learning_rate": 5.431206479811076e-06, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.23567970097064972, "step": 3260, "valid_targets_mean": 5856.5, "valid_targets_min": 3514 }, { "epoch": 5.4966329966329965, "grad_norm": 0.5234246855324006, "learning_rate": 5.373816664947753e-06, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.2325543314218521, "step": 3265, "valid_targets_mean": 5819.9, "valid_targets_min": 2170 }, { "epoch": 5.505050505050505, "grad_norm": 0.48084978877344153, "learning_rate": 5.316684578653728e-06, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.23692665994167328, "step": 3270, "valid_targets_mean": 6192.4, "valid_targets_min": 4568 }, { "epoch": 5.513468013468014, "grad_norm": 0.46469157525134236, "learning_rate": 5.259811227655789e-06, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.23742267489433289, "step": 3275, "valid_targets_mean": 6736.9, "valid_targets_min": 4696 }, { "epoch": 5.521885521885522, "grad_norm": 0.5248519679171413, "learning_rate": 5.203197614121558e-06, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.25347089767456055, "step": 3280, "valid_targets_mean": 5189.9, "valid_targets_min": 962 }, { "epoch": 5.53030303030303, "grad_norm": 0.5158347840082577, "learning_rate": 5.146844735641827e-06, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.2295902818441391, "step": 3285, "valid_targets_mean": 5830.0, "valid_targets_min": 1486 }, { "epoch": 5.538720538720539, "grad_norm": 0.5028953980064815, "learning_rate": 5.090753585212947e-06, "loss": 0.2402, "loss_nan_ranks": 0, "loss_rank_avg": 0.24436822533607483, "step": 3290, "valid_targets_mean": 5826.0, "valid_targets_min": 851 }, { "epoch": 5.547138047138047, "grad_norm": 0.4936768840129265, "learning_rate": 5.034925151219343e-06, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.23498250544071198, "step": 3295, "valid_targets_mean": 5751.9, "valid_targets_min": 2591 }, { "epoch": 5.555555555555555, "grad_norm": 0.5050995601396032, "learning_rate": 4.979360417416126e-06, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.24720489978790283, "step": 3300, "valid_targets_mean": 5693.1, "valid_targets_min": 4156 }, { "epoch": 5.563973063973064, "grad_norm": 0.4969926232957146, "learning_rate": 4.9240603629117175e-06, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.20771655440330505, "step": 3305, "valid_targets_mean": 5534.0, "valid_targets_min": 3133 }, { "epoch": 5.572390572390573, "grad_norm": 0.5530553002623905, "learning_rate": 4.869025962150617e-06, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.2520415186882019, "step": 3310, "valid_targets_mean": 5264.3, "valid_targets_min": 1400 }, { "epoch": 5.58080808080808, "grad_norm": 0.47824826642439083, "learning_rate": 4.814258184896234e-06, "loss": 0.2309, "loss_nan_ranks": 0, "loss_rank_avg": 0.23448395729064941, "step": 3315, "valid_targets_mean": 5964.6, "valid_targets_min": 3968 }, { "epoch": 5.589225589225589, "grad_norm": 0.5333562093887002, "learning_rate": 4.759757996213783e-06, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.21456602215766907, "step": 3320, "valid_targets_mean": 5262.3, "valid_targets_min": 1919 }, { "epoch": 5.597643097643098, "grad_norm": 0.5291019973267682, "learning_rate": 4.7055263564533096e-06, "loss": 0.2234, "loss_nan_ranks": 0, "loss_rank_avg": 0.22403772175312042, "step": 3325, "valid_targets_mean": 4866.6, "valid_targets_min": 740 }, { "epoch": 5.606060606060606, "grad_norm": 0.5520805495799307, "learning_rate": 4.651564221232728e-06, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.23195771872997284, "step": 3330, "valid_targets_mean": 4537.1, "valid_targets_min": 775 }, { "epoch": 5.614478114478114, "grad_norm": 0.5108188611657087, "learning_rate": 4.597872541421007e-06, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.23533491790294647, "step": 3335, "valid_targets_mean": 5605.8, "valid_targets_min": 706 }, { "epoch": 5.622895622895623, "grad_norm": 0.5157543076277402, "learning_rate": 4.544452263121422e-06, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.2332892119884491, "step": 3340, "valid_targets_mean": 5331.5, "valid_targets_min": 577 }, { "epoch": 5.6313131313131315, "grad_norm": 0.49379242379442295, "learning_rate": 4.491304327654855e-06, "loss": 0.2115, "loss_nan_ranks": 0, "loss_rank_avg": 0.21516942977905273, "step": 3345, "valid_targets_mean": 5680.6, "valid_targets_min": 1033 }, { "epoch": 5.63973063973064, "grad_norm": 0.46555609809855103, "learning_rate": 4.438429671543234e-06, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.2280246913433075, "step": 3350, "valid_targets_mean": 6279.8, "valid_targets_min": 4022 }, { "epoch": 5.648148148148148, "grad_norm": 0.4853473764029863, "learning_rate": 4.385829226493015e-06, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.231397345662117, "step": 3355, "valid_targets_mean": 5583.8, "valid_targets_min": 2088 }, { "epoch": 5.656565656565657, "grad_norm": 0.4657647618680769, "learning_rate": 4.333503919378767e-06, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.24527719616889954, "step": 3360, "valid_targets_mean": 6640.7, "valid_targets_min": 4507 }, { "epoch": 5.664983164983165, "grad_norm": 0.5317871094974028, "learning_rate": 4.2814546722268595e-06, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.23336941003799438, "step": 3365, "valid_targets_mean": 5179.6, "valid_targets_min": 753 }, { "epoch": 5.673400673400673, "grad_norm": 0.532977311370893, "learning_rate": 4.229682402199175e-06, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.23605574667453766, "step": 3370, "valid_targets_mean": 5920.1, "valid_targets_min": 2042 }, { "epoch": 5.681818181818182, "grad_norm": 0.5750924142313466, "learning_rate": 4.178188021576983e-06, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.23879092931747437, "step": 3375, "valid_targets_mean": 5165.8, "valid_targets_min": 529 }, { "epoch": 5.69023569023569, "grad_norm": 0.48765554257352756, "learning_rate": 4.126972437744861e-06, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.23397740721702576, "step": 3380, "valid_targets_mean": 5988.1, "valid_targets_min": 4242 }, { "epoch": 5.698653198653199, "grad_norm": 0.5294602681979758, "learning_rate": 4.076036553174678e-06, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.23284104466438293, "step": 3385, "valid_targets_mean": 5681.9, "valid_targets_min": 2217 }, { "epoch": 5.707070707070707, "grad_norm": 0.49114433501009724, "learning_rate": 4.025381265409722e-06, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.22848021984100342, "step": 3390, "valid_targets_mean": 6036.4, "valid_targets_min": 4350 }, { "epoch": 5.715488215488215, "grad_norm": 0.5110269277385011, "learning_rate": 3.975007467048875e-06, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.22457490861415863, "step": 3395, "valid_targets_mean": 5598.8, "valid_targets_min": 495 }, { "epoch": 5.723905723905724, "grad_norm": 0.5155941569501963, "learning_rate": 3.924916045730873e-06, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.20673015713691711, "step": 3400, "valid_targets_mean": 4903.1, "valid_targets_min": 1735 }, { "epoch": 5.732323232323233, "grad_norm": 0.5433799296336833, "learning_rate": 3.875107884118681e-06, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.26549580693244934, "step": 3405, "valid_targets_mean": 5974.6, "valid_targets_min": 648 }, { "epoch": 5.7407407407407405, "grad_norm": 0.5256583886737612, "learning_rate": 3.825583859883941e-06, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.23430989682674408, "step": 3410, "valid_targets_mean": 5242.2, "valid_targets_min": 836 }, { "epoch": 5.749158249158249, "grad_norm": 0.4716795001316659, "learning_rate": 3.7763448456914886e-06, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.23861783742904663, "step": 3415, "valid_targets_mean": 6166.8, "valid_targets_min": 2042 }, { "epoch": 5.757575757575758, "grad_norm": 0.5261853664922447, "learning_rate": 3.7273917091839806e-06, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.25470608472824097, "step": 3420, "valid_targets_mean": 5424.5, "valid_targets_min": 634 }, { "epoch": 5.7659932659932664, "grad_norm": 0.4962287138405268, "learning_rate": 3.678725312966629e-06, "loss": 0.2377, "loss_nan_ranks": 0, "loss_rank_avg": 0.23568958044052124, "step": 3425, "valid_targets_mean": 5845.6, "valid_targets_min": 2110 }, { "epoch": 5.774410774410774, "grad_norm": 0.45971665253736965, "learning_rate": 3.6303465145919716e-06, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.18748649954795837, "step": 3430, "valid_targets_mean": 6514.1, "valid_targets_min": 4917 }, { "epoch": 5.782828282828283, "grad_norm": 0.5045763625955956, "learning_rate": 3.582256166544773e-06, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.23577597737312317, "step": 3435, "valid_targets_mean": 5670.4, "valid_targets_min": 2205 }, { "epoch": 5.7912457912457915, "grad_norm": 0.5026506603551945, "learning_rate": 3.534455116227005e-06, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.24811536073684692, "step": 3440, "valid_targets_mean": 6188.9, "valid_targets_min": 3727 }, { "epoch": 5.799663299663299, "grad_norm": 0.5013307207280829, "learning_rate": 3.4869442059429084e-06, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.24296782910823822, "step": 3445, "valid_targets_mean": 5887.4, "valid_targets_min": 2936 }, { "epoch": 5.808080808080808, "grad_norm": 0.4857730396730159, "learning_rate": 3.4397242728841663e-06, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.2121039479970932, "step": 3450, "valid_targets_mean": 5653.2, "valid_targets_min": 677 }, { "epoch": 5.816498316498317, "grad_norm": 0.5330733750805351, "learning_rate": 3.392796149115132e-06, "loss": 0.2316, "loss_nan_ranks": 0, "loss_rank_avg": 0.2211214303970337, "step": 3455, "valid_targets_mean": 5979.4, "valid_targets_min": 3875 }, { "epoch": 5.824915824915825, "grad_norm": 0.5031682106996872, "learning_rate": 3.3461606615581686e-06, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.22831107676029205, "step": 3460, "valid_targets_mean": 5962.1, "valid_targets_min": 1753 }, { "epoch": 5.833333333333333, "grad_norm": 0.5018170197197533, "learning_rate": 3.2998186319791037e-06, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.22891631722450256, "step": 3465, "valid_targets_mean": 5357.0, "valid_targets_min": 710 }, { "epoch": 5.841750841750842, "grad_norm": 0.5144545245009204, "learning_rate": 3.2537708769727105e-06, "loss": 0.242, "loss_nan_ranks": 0, "loss_rank_avg": 0.23250479996204376, "step": 3470, "valid_targets_mean": 5865.8, "valid_targets_min": 976 }, { "epoch": 5.85016835016835, "grad_norm": 0.5293606642107064, "learning_rate": 3.2080182079483492e-06, "loss": 0.2283, "loss_nan_ranks": 0, "loss_rank_avg": 0.23509103059768677, "step": 3475, "valid_targets_mean": 4859.6, "valid_targets_min": 642 }, { "epoch": 5.858585858585858, "grad_norm": 0.5144848394075487, "learning_rate": 3.162561431115654e-06, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.23617658019065857, "step": 3480, "valid_targets_mean": 5443.1, "valid_targets_min": 1760 }, { "epoch": 5.867003367003367, "grad_norm": 0.5254868769972713, "learning_rate": 3.1174013474703255e-06, "loss": 0.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.2453891634941101, "step": 3485, "valid_targets_mean": 5495.3, "valid_targets_min": 786 }, { "epoch": 5.875420875420875, "grad_norm": 0.4776346524861737, "learning_rate": 3.0725387527800388e-06, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.2222374677658081, "step": 3490, "valid_targets_mean": 6261.4, "valid_targets_min": 3908 }, { "epoch": 5.883838383838384, "grad_norm": 0.5207427790341015, "learning_rate": 3.027974437570389e-06, "loss": 0.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.24584221839904785, "step": 3495, "valid_targets_mean": 5397.8, "valid_targets_min": 1098 }, { "epoch": 5.892255892255893, "grad_norm": 0.5309523002539125, "learning_rate": 2.9837091871109748e-06, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.2331022322177887, "step": 3500, "valid_targets_mean": 5541.5, "valid_targets_min": 805 }, { "epoch": 5.9006734006734005, "grad_norm": 0.5265535546852831, "learning_rate": 2.939743781401576e-06, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.24659153819084167, "step": 3505, "valid_targets_mean": 5344.6, "valid_targets_min": 1761 }, { "epoch": 5.909090909090909, "grad_norm": 0.5269585514846513, "learning_rate": 2.896078995158391e-06, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.2496645152568817, "step": 3510, "valid_targets_mean": 5882.9, "valid_targets_min": 823 }, { "epoch": 5.917508417508418, "grad_norm": 0.5318764988027825, "learning_rate": 2.852715597800373e-06, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2297423630952835, "step": 3515, "valid_targets_mean": 5516.7, "valid_targets_min": 599 }, { "epoch": 5.925925925925926, "grad_norm": 0.4895912672050829, "learning_rate": 2.8096543534357157e-06, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.22827956080436707, "step": 3520, "valid_targets_mean": 6107.5, "valid_targets_min": 4393 }, { "epoch": 5.934343434343434, "grad_norm": 0.5091664341563568, "learning_rate": 2.766896020848351e-06, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.24848194420337677, "step": 3525, "valid_targets_mean": 6239.6, "valid_targets_min": 4263 }, { "epoch": 5.942760942760943, "grad_norm": 0.4896189673623001, "learning_rate": 2.7244413534845813e-06, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.2458949238061905, "step": 3530, "valid_targets_mean": 5956.6, "valid_targets_min": 2262 }, { "epoch": 5.951178451178452, "grad_norm": 0.4985274922172781, "learning_rate": 2.6822910994398334e-06, "loss": 0.2407, "loss_nan_ranks": 0, "loss_rank_avg": 0.2408095747232437, "step": 3535, "valid_targets_mean": 5447.9, "valid_targets_min": 737 }, { "epoch": 5.959595959595959, "grad_norm": 0.5025455962690482, "learning_rate": 2.6404460014454356e-06, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.22609840333461761, "step": 3540, "valid_targets_mean": 5844.9, "valid_targets_min": 833 }, { "epoch": 5.968013468013468, "grad_norm": 0.5777884151750781, "learning_rate": 2.5989067968555514e-06, "loss": 0.2236, "loss_nan_ranks": 0, "loss_rank_avg": 0.2250966876745224, "step": 3545, "valid_targets_mean": 5791.6, "valid_targets_min": 1732 }, { "epoch": 5.976430976430977, "grad_norm": 0.47037374955087863, "learning_rate": 2.557674217634196e-06, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.2266923189163208, "step": 3550, "valid_targets_mean": 6096.9, "valid_targets_min": 3177 }, { "epoch": 5.984848484848484, "grad_norm": 0.4729716390407066, "learning_rate": 2.516748990342317e-06, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.2235698103904724, "step": 3555, "valid_targets_mean": 5944.9, "valid_targets_min": 2345 }, { "epoch": 5.993265993265993, "grad_norm": 0.5070240661629777, "learning_rate": 2.476131836125e-06, "loss": 0.2192, "loss_nan_ranks": 0, "loss_rank_avg": 0.21875323355197906, "step": 3560, "valid_targets_mean": 5720.9, "valid_targets_min": 3382 }, { "epoch": 6.001683501683502, "grad_norm": 0.5114000681337469, "learning_rate": 2.435823470698768e-06, "loss": 0.2307, "loss_nan_ranks": 0, "loss_rank_avg": 0.23242336511611938, "step": 3565, "valid_targets_mean": 5812.8, "valid_targets_min": 2026 }, { "epoch": 6.01010101010101, "grad_norm": 0.4877299717933894, "learning_rate": 2.3958246043389566e-06, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.22799277305603027, "step": 3570, "valid_targets_mean": 6143.9, "valid_targets_min": 3948 }, { "epoch": 6.018518518518518, "grad_norm": 0.5104477619265424, "learning_rate": 2.356135941867217e-06, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.2472635954618454, "step": 3575, "valid_targets_mean": 6150.5, "valid_targets_min": 5193 }, { "epoch": 6.026936026936027, "grad_norm": 0.5257410926565665, "learning_rate": 2.3167581826390806e-06, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.22177693247795105, "step": 3580, "valid_targets_mean": 6363.8, "valid_targets_min": 1273 }, { "epoch": 6.0353535353535355, "grad_norm": 0.5340948925922618, "learning_rate": 2.2776920205316276e-06, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.21528631448745728, "step": 3585, "valid_targets_mean": 5297.4, "valid_targets_min": 740 }, { "epoch": 6.043771043771044, "grad_norm": 0.49589683213064645, "learning_rate": 2.2389381439312973e-06, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2327052652835846, "step": 3590, "valid_targets_mean": 6229.2, "valid_targets_min": 4307 }, { "epoch": 6.052188552188552, "grad_norm": 0.5405859979341503, "learning_rate": 2.2004972357217146e-06, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.2503454089164734, "step": 3595, "valid_targets_mean": 5809.4, "valid_targets_min": 2837 }, { "epoch": 6.0606060606060606, "grad_norm": 0.5362685969042656, "learning_rate": 2.1623699732716787e-06, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.210447758436203, "step": 3600, "valid_targets_mean": 5844.3, "valid_targets_min": 2311 }, { "epoch": 6.069023569023569, "grad_norm": 0.4857377618243944, "learning_rate": 2.1245570284232263e-06, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.2283036708831787, "step": 3605, "valid_targets_mean": 5930.3, "valid_targets_min": 3133 }, { "epoch": 6.077441077441078, "grad_norm": 0.5069274043988372, "learning_rate": 2.0870590674797884e-06, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.24341779947280884, "step": 3610, "valid_targets_mean": 6278.7, "valid_targets_min": 809 }, { "epoch": 6.085858585858586, "grad_norm": 0.5185395351533187, "learning_rate": 2.049876751194464e-06, "loss": 0.2275, "loss_nan_ranks": 0, "loss_rank_avg": 0.2473084181547165, "step": 3615, "valid_targets_mean": 6127.9, "valid_targets_min": 4402 }, { "epoch": 6.094276094276094, "grad_norm": 0.5140171375506261, "learning_rate": 2.0130107347583492e-06, "loss": 0.2246, "loss_nan_ranks": 0, "loss_rank_avg": 0.22461938858032227, "step": 3620, "valid_targets_mean": 5651.7, "valid_targets_min": 3026 }, { "epoch": 6.102693602693603, "grad_norm": 0.5106698343028654, "learning_rate": 1.976461667789009e-06, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.2493961602449417, "step": 3625, "valid_targets_mean": 6109.2, "valid_targets_min": 775 }, { "epoch": 6.111111111111111, "grad_norm": 0.5052132229100402, "learning_rate": 1.940230194319044e-06, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.22754473984241486, "step": 3630, "valid_targets_mean": 5725.6, "valid_targets_min": 1919 }, { "epoch": 6.119528619528619, "grad_norm": 0.5159221563265757, "learning_rate": 1.9043169527847106e-06, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.24825209379196167, "step": 3635, "valid_targets_mean": 5646.5, "valid_targets_min": 2609 }, { "epoch": 6.127946127946128, "grad_norm": 0.5586060335280434, "learning_rate": 1.8687225760146922e-06, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.22073093056678772, "step": 3640, "valid_targets_mean": 5455.7, "valid_targets_min": 2205 }, { "epoch": 6.136363636363637, "grad_norm": 0.5243551621539269, "learning_rate": 1.833447691218948e-06, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.22795337438583374, "step": 3645, "valid_targets_mean": 5602.2, "valid_targets_min": 2095 }, { "epoch": 6.1447811447811445, "grad_norm": 0.4906849438414537, "learning_rate": 1.7984929199776457e-06, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.19058871269226074, "step": 3650, "valid_targets_mean": 5773.0, "valid_targets_min": 2224 }, { "epoch": 6.153198653198653, "grad_norm": 0.5073904766406345, "learning_rate": 1.7638588782302336e-06, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.22966495156288147, "step": 3655, "valid_targets_mean": 5965.8, "valid_targets_min": 2918 }, { "epoch": 6.161616161616162, "grad_norm": 0.5236586043176525, "learning_rate": 1.7295461762645626e-06, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.207240492105484, "step": 3660, "valid_targets_mean": 5210.7, "valid_targets_min": 607 }, { "epoch": 6.17003367003367, "grad_norm": 0.49544814137145954, "learning_rate": 1.6955554187061406e-06, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.22393043339252472, "step": 3665, "valid_targets_mean": 6129.8, "valid_targets_min": 2636 }, { "epoch": 6.178451178451178, "grad_norm": 0.5200333003420963, "learning_rate": 1.6618872045074929e-06, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.2077876478433609, "step": 3670, "valid_targets_mean": 6336.3, "valid_targets_min": 2918 }, { "epoch": 6.186868686868687, "grad_norm": 0.5493760889830712, "learning_rate": 1.6285421269375823e-06, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.23120251297950745, "step": 3675, "valid_targets_mean": 5103.4, "valid_targets_min": 886 }, { "epoch": 6.1952861952861955, "grad_norm": 0.4952648358724955, "learning_rate": 1.595520773571364e-06, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.2233111560344696, "step": 3680, "valid_targets_mean": 6430.8, "valid_targets_min": 4065 }, { "epoch": 6.203703703703703, "grad_norm": 0.5308289686736317, "learning_rate": 1.5628237262794544e-06, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.23317524790763855, "step": 3685, "valid_targets_mean": 5724.6, "valid_targets_min": 3592 }, { "epoch": 6.212121212121212, "grad_norm": 0.5204100323050561, "learning_rate": 1.5304515612178428e-06, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.21899659931659698, "step": 3690, "valid_targets_mean": 5272.9, "valid_targets_min": 795 }, { "epoch": 6.220538720538721, "grad_norm": 0.5395423268893877, "learning_rate": 1.4984048488177628e-06, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.23501020669937134, "step": 3695, "valid_targets_mean": 5511.4, "valid_targets_min": 524 }, { "epoch": 6.228956228956229, "grad_norm": 0.5078500154199302, "learning_rate": 1.466684153775635e-06, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.21515780687332153, "step": 3700, "valid_targets_mean": 5566.1, "valid_targets_min": 3132 }, { "epoch": 6.237373737373737, "grad_norm": 0.49003697819144293, "learning_rate": 1.435290035043111e-06, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.2258685827255249, "step": 3705, "valid_targets_mean": 6305.3, "valid_targets_min": 4132 }, { "epoch": 6.245791245791246, "grad_norm": 0.5234990052252189, "learning_rate": 1.4042230458172257e-06, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.23973727226257324, "step": 3710, "valid_targets_mean": 5435.1, "valid_targets_min": 2469 }, { "epoch": 6.254208754208754, "grad_norm": 0.5091769248174087, "learning_rate": 1.373483733530665e-06, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.24551436305046082, "step": 3715, "valid_targets_mean": 6078.8, "valid_targets_min": 4434 }, { "epoch": 6.262626262626263, "grad_norm": 0.5297523589562412, "learning_rate": 1.3430726398420846e-06, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.23026011884212494, "step": 3720, "valid_targets_mean": 5890.8, "valid_targets_min": 2292 }, { "epoch": 6.271043771043771, "grad_norm": 0.5205027082734003, "learning_rate": 1.3129903006266065e-06, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.212215855717659, "step": 3725, "valid_targets_mean": 5467.5, "valid_targets_min": 2309 }, { "epoch": 6.279461279461279, "grad_norm": 0.5248938296372679, "learning_rate": 1.2832372459663445e-06, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.22421753406524658, "step": 3730, "valid_targets_mean": 5535.9, "valid_targets_min": 875 }, { "epoch": 6.287878787878788, "grad_norm": 0.5597486286171638, "learning_rate": 1.2538140001410826e-06, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.22579503059387207, "step": 3735, "valid_targets_mean": 5427.9, "valid_targets_min": 702 }, { "epoch": 6.296296296296296, "grad_norm": 0.5237046035694222, "learning_rate": 1.224721081619029e-06, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.24596376717090607, "step": 3740, "valid_targets_mean": 5579.4, "valid_targets_min": 923 }, { "epoch": 6.3047138047138045, "grad_norm": 0.5378460293231798, "learning_rate": 1.1959590030476798e-06, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.223431795835495, "step": 3745, "valid_targets_mean": 5233.2, "valid_targets_min": 529 }, { "epoch": 6.313131313131313, "grad_norm": 0.4948826998786642, "learning_rate": 1.1675282712447821e-06, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.2282189428806305, "step": 3750, "valid_targets_mean": 6037.9, "valid_targets_min": 4773 }, { "epoch": 6.321548821548822, "grad_norm": 0.5783981006909941, "learning_rate": 1.1394293871894258e-06, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.23504894971847534, "step": 3755, "valid_targets_mean": 4965.1, "valid_targets_min": 828 }, { "epoch": 6.32996632996633, "grad_norm": 0.5040102749412789, "learning_rate": 1.1116628460131684e-06, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.21298432350158691, "step": 3760, "valid_targets_mean": 5762.1, "valid_targets_min": 2447 }, { "epoch": 6.338383838383838, "grad_norm": 0.4952294476096354, "learning_rate": 1.0842291369913705e-06, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.22944945096969604, "step": 3765, "valid_targets_mean": 6218.2, "valid_targets_min": 2281 }, { "epoch": 6.346801346801347, "grad_norm": 0.5230154051584566, "learning_rate": 1.0571287435345256e-06, "loss": 0.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.23738403618335724, "step": 3770, "valid_targets_mean": 5475.8, "valid_targets_min": 2815 }, { "epoch": 6.3552188552188555, "grad_norm": 0.5584119544200802, "learning_rate": 1.0303621431797638e-06, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.21592649817466736, "step": 3775, "valid_targets_mean": 5428.8, "valid_targets_min": 805 }, { "epoch": 6.363636363636363, "grad_norm": 0.5252472014851841, "learning_rate": 1.0039298075824377e-06, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.21030861139297485, "step": 3780, "valid_targets_mean": 6101.9, "valid_targets_min": 4283 }, { "epoch": 6.372053872053872, "grad_norm": 0.510018527842041, "learning_rate": 9.778322025078025e-07, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.22540400922298431, "step": 3785, "valid_targets_mean": 6047.4, "valid_targets_min": 3342 }, { "epoch": 6.380471380471381, "grad_norm": 0.4966811461897099, "learning_rate": 9.520697878228136e-07, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.2320118099451065, "step": 3790, "valid_targets_mean": 5937.1, "valid_targets_min": 2198 }, { "epoch": 6.388888888888889, "grad_norm": 0.5169653382390963, "learning_rate": 9.266430174880314e-07, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.24477005004882812, "step": 3795, "valid_targets_mean": 5758.1, "valid_targets_min": 895 }, { "epoch": 6.397306397306397, "grad_norm": 0.4975857094960845, "learning_rate": 9.015523395495963e-07, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.22504638135433197, "step": 3800, "valid_targets_mean": 5927.6, "valid_targets_min": 524 }, { "epoch": 6.405723905723906, "grad_norm": 0.5210723802099997, "learning_rate": 8.767981961313632e-07, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.23169521987438202, "step": 3805, "valid_targets_mean": 6047.5, "valid_targets_min": 2719 }, { "epoch": 6.414141414141414, "grad_norm": 0.507675266076043, "learning_rate": 8.523810234271024e-07, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.21925891935825348, "step": 3810, "valid_targets_mean": 6002.9, "valid_targets_min": 3674 }, { "epoch": 6.422558922558922, "grad_norm": 0.5044432912409538, "learning_rate": 8.283012516927979e-07, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.2430918663740158, "step": 3815, "valid_targets_mean": 6220.0, "valid_targets_min": 3282 }, { "epoch": 6.430976430976431, "grad_norm": 0.5539200125899316, "learning_rate": 8.045593052390832e-07, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.22239992022514343, "step": 3820, "valid_targets_mean": 5531.8, "valid_targets_min": 3670 }, { "epoch": 6.4393939393939394, "grad_norm": 0.5212600886414331, "learning_rate": 7.811556024237644e-07, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.23301962018013, "step": 3825, "valid_targets_mean": 6046.6, "valid_targets_min": 2085 }, { "epoch": 6.447811447811448, "grad_norm": 0.543517601490649, "learning_rate": 7.580905556444351e-07, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.2337494194507599, "step": 3830, "valid_targets_mean": 5565.8, "valid_targets_min": 3133 }, { "epoch": 6.456228956228956, "grad_norm": 0.5789718366274003, "learning_rate": 7.353645713312164e-07, "loss": 0.2225, "loss_nan_ranks": 0, "loss_rank_avg": 0.22291827201843262, "step": 3835, "valid_targets_mean": 5005.3, "valid_targets_min": 548 }, { "epoch": 6.4646464646464645, "grad_norm": 0.5259856372538945, "learning_rate": 7.12978049939601e-07, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.21570321917533875, "step": 3840, "valid_targets_mean": 5165.9, "valid_targets_min": 2304 }, { "epoch": 6.473063973063973, "grad_norm": 0.5136883078710031, "learning_rate": 6.909313859433874e-07, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.2724156975746155, "step": 3845, "valid_targets_mean": 6629.4, "valid_targets_min": 823 }, { "epoch": 6.481481481481482, "grad_norm": 0.4915282768697449, "learning_rate": 6.692249678277373e-07, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.21886561810970306, "step": 3850, "valid_targets_mean": 5787.4, "valid_targets_min": 3854 }, { "epoch": 6.48989898989899, "grad_norm": 0.5101943668044208, "learning_rate": 6.478591780823262e-07, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.21968825161457062, "step": 3855, "valid_targets_mean": 6163.6, "valid_targets_min": 3495 }, { "epoch": 6.498316498316498, "grad_norm": 0.5021067934809788, "learning_rate": 6.268343931945952e-07, "loss": 0.218, "loss_nan_ranks": 0, "loss_rank_avg": 0.22854362428188324, "step": 3860, "valid_targets_mean": 5995.1, "valid_targets_min": 3142 }, { "epoch": 6.506734006734007, "grad_norm": 0.557332449113888, "learning_rate": 6.061509836431367e-07, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.21220096945762634, "step": 3865, "valid_targets_mean": 5461.5, "valid_targets_min": 3963 }, { "epoch": 6.515151515151516, "grad_norm": 0.5186256456829461, "learning_rate": 5.85809313891148e-07, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.20755138993263245, "step": 3870, "valid_targets_mean": 5407.1, "valid_targets_min": 1868 }, { "epoch": 6.523569023569023, "grad_norm": 0.49245121143841225, "learning_rate": 5.658097423800124e-07, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.24901744723320007, "step": 3875, "valid_targets_mean": 6360.4, "valid_targets_min": 4581 }, { "epoch": 6.531986531986532, "grad_norm": 0.5838948599522868, "learning_rate": 5.461526215229929e-07, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.2362005114555359, "step": 3880, "valid_targets_mean": 5119.0, "valid_targets_min": 628 }, { "epoch": 6.540404040404041, "grad_norm": 0.4873484403671387, "learning_rate": 5.268382976990083e-07, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.24804040789604187, "step": 3885, "valid_targets_mean": 6448.1, "valid_targets_min": 3836 }, { "epoch": 6.548821548821548, "grad_norm": 0.47878246569387206, "learning_rate": 5.078671112465472e-07, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.2332177460193634, "step": 3890, "valid_targets_mean": 6442.3, "valid_targets_min": 4637 }, { "epoch": 6.557239057239057, "grad_norm": 0.5247985422667938, "learning_rate": 4.892393964576547e-07, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.22282634675502777, "step": 3895, "valid_targets_mean": 5424.9, "valid_targets_min": 669 }, { "epoch": 6.565656565656566, "grad_norm": 0.5485608251182884, "learning_rate": 4.7095548157204184e-07, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.22252830862998962, "step": 3900, "valid_targets_mean": 5017.9, "valid_targets_min": 771 }, { "epoch": 6.574074074074074, "grad_norm": 0.5514701095369009, "learning_rate": 4.5301568877132106e-07, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.1949262022972107, "step": 3905, "valid_targets_mean": 6186.4, "valid_targets_min": 2158 }, { "epoch": 6.582491582491582, "grad_norm": 0.49508090440885005, "learning_rate": 4.3542033417330433e-07, "loss": 0.2189, "loss_nan_ranks": 0, "loss_rank_avg": 0.22400163114070892, "step": 3910, "valid_targets_mean": 5883.4, "valid_targets_min": 3182 }, { "epoch": 6.590909090909091, "grad_norm": 0.5226134266773029, "learning_rate": 4.181697278264496e-07, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.22463016211986542, "step": 3915, "valid_targets_mean": 5738.9, "valid_targets_min": 4297 }, { "epoch": 6.5993265993265995, "grad_norm": 0.46667116305509626, "learning_rate": 4.012641737043899e-07, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.22830307483673096, "step": 3920, "valid_targets_mean": 6400.0, "valid_targets_min": 2262 }, { "epoch": 6.607744107744107, "grad_norm": 0.5006237626497043, "learning_rate": 3.8470396970057946e-07, "loss": 0.2275, "loss_nan_ranks": 0, "loss_rank_avg": 0.2222435474395752, "step": 3925, "valid_targets_mean": 5903.4, "valid_targets_min": 4945 }, { "epoch": 6.616161616161616, "grad_norm": 0.5174878932627028, "learning_rate": 3.6848940762304277e-07, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.23240050673484802, "step": 3930, "valid_targets_mean": 5703.8, "valid_targets_min": 1984 }, { "epoch": 6.624579124579125, "grad_norm": 0.5198759175442372, "learning_rate": 3.5262077318923615e-07, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.2365482747554779, "step": 3935, "valid_targets_mean": 6016.2, "valid_targets_min": 4563 }, { "epoch": 6.632996632996633, "grad_norm": 0.5115968930294122, "learning_rate": 3.37098346021012e-07, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.22688379883766174, "step": 3940, "valid_targets_mean": 5793.9, "valid_targets_min": 4283 }, { "epoch": 6.641414141414142, "grad_norm": 0.5152584191758609, "learning_rate": 3.2192239963968477e-07, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.22982186079025269, "step": 3945, "valid_targets_mean": 5751.3, "valid_targets_min": 1486 }, { "epoch": 6.64983164983165, "grad_norm": 0.4903080196046145, "learning_rate": 3.07093201461226e-07, "loss": 0.2293, "loss_nan_ranks": 0, "loss_rank_avg": 0.2335420846939087, "step": 3950, "valid_targets_mean": 6418.2, "valid_targets_min": 3667 }, { "epoch": 6.658249158249158, "grad_norm": 0.5411356489778124, "learning_rate": 2.926110127915327e-07, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.22956421971321106, "step": 3955, "valid_targets_mean": 5280.3, "valid_targets_min": 580 }, { "epoch": 6.666666666666667, "grad_norm": 0.48921399133046517, "learning_rate": 2.7847608882184186e-07, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.21850576996803284, "step": 3960, "valid_targets_mean": 6326.2, "valid_targets_min": 4168 }, { "epoch": 6.675084175084175, "grad_norm": 0.5082833393301474, "learning_rate": 2.6468867862421865e-07, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.228357195854187, "step": 3965, "valid_targets_mean": 5868.0, "valid_targets_min": 1900 }, { "epoch": 6.683501683501683, "grad_norm": 0.48858787085087396, "learning_rate": 2.5124902514717773e-07, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.22642362117767334, "step": 3970, "valid_targets_mean": 6190.9, "valid_targets_min": 4478 }, { "epoch": 6.691919191919192, "grad_norm": 0.48981711224027497, "learning_rate": 2.3815736521139775e-07, "loss": 0.2237, "loss_nan_ranks": 0, "loss_rank_avg": 0.22989197075366974, "step": 3975, "valid_targets_mean": 6458.6, "valid_targets_min": 3865 }, { "epoch": 6.700336700336701, "grad_norm": 0.5396742819020192, "learning_rate": 2.254139295055513e-07, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.21652349829673767, "step": 3980, "valid_targets_mean": 5217.4, "valid_targets_min": 1809 }, { "epoch": 6.7087542087542085, "grad_norm": 0.538771879253705, "learning_rate": 2.1301894258223045e-07, "loss": 0.2444, "loss_nan_ranks": 0, "loss_rank_avg": 0.2519531846046448, "step": 3985, "valid_targets_mean": 5681.4, "valid_targets_min": 2085 }, { "epoch": 6.717171717171717, "grad_norm": 0.5053903866002492, "learning_rate": 2.0097262285400764e-07, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.21983280777931213, "step": 3990, "valid_targets_mean": 5716.7, "valid_targets_min": 2388 }, { "epoch": 6.725589225589226, "grad_norm": 0.5128327242924421, "learning_rate": 1.8927518258957e-07, "loss": 0.2269, "loss_nan_ranks": 0, "loss_rank_avg": 0.20815545320510864, "step": 3995, "valid_targets_mean": 5685.9, "valid_targets_min": 882 }, { "epoch": 6.7340067340067336, "grad_norm": 0.5155864351532222, "learning_rate": 1.7792682790998217e-07, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.25162017345428467, "step": 4000, "valid_targets_mean": 6619.4, "valid_targets_min": 2331 }, { "epoch": 6.742424242424242, "grad_norm": 0.5572123489167949, "learning_rate": 1.6692775878506705e-07, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.23857121169567108, "step": 4005, "valid_targets_mean": 5601.3, "valid_targets_min": 2042 }, { "epoch": 6.750841750841751, "grad_norm": 0.5386724169939262, "learning_rate": 1.5627816902986204e-07, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.2514593005180359, "step": 4010, "valid_targets_mean": 5908.2, "valid_targets_min": 3662 }, { "epoch": 6.7592592592592595, "grad_norm": 0.5142136892512724, "learning_rate": 1.4597824630122604e-07, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.22154447436332703, "step": 4015, "valid_targets_mean": 5728.4, "valid_targets_min": 3307 }, { "epoch": 6.767676767676767, "grad_norm": 0.505999257157595, "learning_rate": 1.360281720945089e-07, "loss": 0.2331, "loss_nan_ranks": 0, "loss_rank_avg": 0.22565945982933044, "step": 4020, "valid_targets_mean": 6077.9, "valid_targets_min": 3131 }, { "epoch": 6.776094276094276, "grad_norm": 0.5091773084597425, "learning_rate": 1.2642812174037621e-07, "loss": 0.2252, "loss_nan_ranks": 0, "loss_rank_avg": 0.24219831824302673, "step": 4025, "valid_targets_mean": 5903.4, "valid_targets_min": 713 }, { "epoch": 6.784511784511785, "grad_norm": 0.469852641795815, "learning_rate": 1.1717826440170054e-07, "loss": 0.2231, "loss_nan_ranks": 0, "loss_rank_avg": 0.21723823249340057, "step": 4030, "valid_targets_mean": 6776.9, "valid_targets_min": 5320 }, { "epoch": 6.792929292929293, "grad_norm": 0.4814380129058402, "learning_rate": 1.0827876307059503e-07, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.22944395244121552, "step": 4035, "valid_targets_mean": 6529.6, "valid_targets_min": 4226 }, { "epoch": 6.801346801346801, "grad_norm": 0.5218042402047304, "learning_rate": 9.972977456553345e-08, "loss": 0.2304, "loss_nan_ranks": 0, "loss_rank_avg": 0.2270907461643219, "step": 4040, "valid_targets_mean": 5496.2, "valid_targets_min": 2157 }, { "epoch": 6.80976430976431, "grad_norm": 0.5691017326768867, "learning_rate": 9.153144952859017e-08, "loss": 0.2246, "loss_nan_ranks": 0, "loss_rank_avg": 0.22278842329978943, "step": 4045, "valid_targets_mean": 5140.4, "valid_targets_min": 767 }, { "epoch": 6.818181818181818, "grad_norm": 0.5499421984771002, "learning_rate": 8.368393242277784e-08, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.2250651717185974, "step": 4050, "valid_targets_mean": 5465.9, "valid_targets_min": 791 }, { "epoch": 6.826599326599327, "grad_norm": 0.5378879282700434, "learning_rate": 7.618736152951611e-08, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.253796249628067, "step": 4055, "valid_targets_mean": 5403.1, "valid_targets_min": 1986 }, { "epoch": 6.835016835016835, "grad_norm": 0.5589319216560491, "learning_rate": 6.904186894618692e-08, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.2060225009918213, "step": 4060, "valid_targets_mean": 6291.4, "valid_targets_min": 3416 }, { "epoch": 6.843434343434343, "grad_norm": 0.5563582211872528, "learning_rate": 6.224758058380298e-08, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.23780454695224762, "step": 4065, "valid_targets_mean": 5445.9, "valid_targets_min": 1482 }, { "epoch": 6.851851851851852, "grad_norm": 0.49591666289659025, "learning_rate": 5.580461616479183e-08, "loss": 0.2183, "loss_nan_ranks": 0, "loss_rank_avg": 0.2293078452348709, "step": 4070, "valid_targets_mean": 5957.1, "valid_targets_min": 4006 }, { "epoch": 6.86026936026936, "grad_norm": 0.5195416954225124, "learning_rate": 4.971308922089746e-08, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.21978473663330078, "step": 4075, "valid_targets_mean": 5605.7, "valid_targets_min": 2270 }, { "epoch": 6.8686868686868685, "grad_norm": 0.6230757006742872, "learning_rate": 4.397310709115532e-08, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.21849480271339417, "step": 4080, "valid_targets_mean": 4612.2, "valid_targets_min": 804 }, { "epoch": 6.877104377104377, "grad_norm": 0.5136176458728036, "learning_rate": 3.85847709200271e-08, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.23595461249351501, "step": 4085, "valid_targets_mean": 5972.6, "valid_targets_min": 5081 }, { "epoch": 6.885521885521886, "grad_norm": 0.48471813785882656, "learning_rate": 3.35481756556022e-08, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.23174874484539032, "step": 4090, "valid_targets_mean": 5933.6, "valid_targets_min": 1004 }, { "epoch": 6.893939393939394, "grad_norm": 0.5181480546027055, "learning_rate": 2.886341004793014e-08, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.22367450594902039, "step": 4095, "valid_targets_mean": 5459.8, "valid_targets_min": 3090 }, { "epoch": 6.902356902356902, "grad_norm": 0.5259358606796519, "learning_rate": 2.4530556647457404e-08, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.2420312762260437, "step": 4100, "valid_targets_mean": 5836.4, "valid_targets_min": 2388 }, { "epoch": 6.910774410774411, "grad_norm": 0.5216774951720721, "learning_rate": 2.0549691803566362e-08, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.24406731128692627, "step": 4105, "valid_targets_mean": 5652.4, "valid_targets_min": 963 }, { "epoch": 6.91919191919192, "grad_norm": 0.5064354053022379, "learning_rate": 1.6920885663238573e-08, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2080550193786621, "step": 4110, "valid_targets_mean": 5772.5, "valid_targets_min": 3893 }, { "epoch": 6.927609427609427, "grad_norm": 0.48979470818174814, "learning_rate": 1.3644202169813547e-08, "loss": 0.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.2382018268108368, "step": 4115, "valid_targets_mean": 6401.1, "valid_targets_min": 2133 }, { "epoch": 6.936026936026936, "grad_norm": 0.5657014297746613, "learning_rate": 1.0719699061865208e-08, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.2425881028175354, "step": 4120, "valid_targets_mean": 5984.1, "valid_targets_min": 4215 }, { "epoch": 6.944444444444445, "grad_norm": 0.49423121741118176, "learning_rate": 8.147427872180481e-09, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.20437312126159668, "step": 4125, "valid_targets_mean": 5447.6, "valid_targets_min": 728 }, { "epoch": 6.952861952861953, "grad_norm": 0.5045817158250394, "learning_rate": 5.927433926855575e-09, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.24840131402015686, "step": 4130, "valid_targets_mean": 6229.9, "valid_targets_min": 5249 }, { "epoch": 6.961279461279461, "grad_norm": 0.5657405963065263, "learning_rate": 4.059756344492183e-09, "loss": 0.2236, "loss_nan_ranks": 0, "loss_rank_avg": 0.222096785902977, "step": 4135, "valid_targets_mean": 5216.6, "valid_targets_min": 1782 }, { "epoch": 6.96969696969697, "grad_norm": 0.5185358892889281, "learning_rate": 2.5444280355135796e-09, "loss": 0.2234, "loss_nan_ranks": 0, "loss_rank_avg": 0.22283129394054413, "step": 4140, "valid_targets_mean": 6054.6, "valid_targets_min": 2148 }, { "epoch": 6.978114478114478, "grad_norm": 0.6277226876991597, "learning_rate": 1.381475701580648e-09, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.2108631134033203, "step": 4145, "valid_targets_mean": 5032.8, "valid_targets_min": 896 }, { "epoch": 6.986531986531986, "grad_norm": 0.5184384890847686, "learning_rate": 5.709198351233624e-10, "loss": 0.2301, "loss_nan_ranks": 0, "loss_rank_avg": 0.2267255336046219, "step": 4150, "valid_targets_mean": 5675.1, "valid_targets_min": 570 }, { "epoch": 6.994949494949495, "grad_norm": 0.5444858373108672, "learning_rate": 1.1277471898107905e-10, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.21790213882923126, "step": 4155, "valid_targets_mean": 5063.0, "valid_targets_min": 650 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.23528757691383362, "step": 4158, "total_flos": 2225784336678912.0, "train_loss": 0.1554051661732221, "train_runtime": 19007.0278, "train_samples_per_second": 3.495, "train_steps_per_second": 0.219, "valid_targets_mean": 5790.4, "valid_targets_min": 2026 } ], "logging_steps": 5, "max_steps": 4158, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2225784336678912.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }