{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4389, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.007974481658692184, "grad_norm": 18.18803099603151, "learning_rate": 3.644646924829157e-07, "loss": 0.7198, "loss_nan_ranks": 0, "loss_rank_avg": 0.7252004146575928, "step": 5, "valid_targets_mean": 3434.4, "valid_targets_min": 864 }, { "epoch": 0.01594896331738437, "grad_norm": 14.307158106996866, "learning_rate": 8.200455580865605e-07, "loss": 0.67, "loss_nan_ranks": 0, "loss_rank_avg": 0.6224847435951233, "step": 10, "valid_targets_mean": 4096.6, "valid_targets_min": 510 }, { "epoch": 0.023923444976076555, "grad_norm": 14.459528130720114, "learning_rate": 1.2756264236902052e-06, "loss": 0.6655, "loss_nan_ranks": 0, "loss_rank_avg": 0.6342157125473022, "step": 15, "valid_targets_mean": 5213.8, "valid_targets_min": 1714 }, { "epoch": 0.03189792663476874, "grad_norm": 13.998960975547485, "learning_rate": 1.7312072892938498e-06, "loss": 0.6358, "loss_nan_ranks": 0, "loss_rank_avg": 0.6497429013252258, "step": 20, "valid_targets_mean": 3823.2, "valid_targets_min": 1156 }, { "epoch": 0.03987240829346093, "grad_norm": 7.703819741872236, "learning_rate": 2.1867881548974945e-06, "loss": 0.5962, "loss_nan_ranks": 0, "loss_rank_avg": 0.5347366333007812, "step": 25, "valid_targets_mean": 4505.9, "valid_targets_min": 1707 }, { "epoch": 0.04784688995215311, "grad_norm": 4.528783755997337, "learning_rate": 2.642369020501139e-06, "loss": 0.5417, "loss_nan_ranks": 0, "loss_rank_avg": 0.48101523518562317, "step": 30, "valid_targets_mean": 4406.1, "valid_targets_min": 1431 }, { "epoch": 0.05582137161084529, "grad_norm": 2.971933510909393, "learning_rate": 3.0979498861047843e-06, "loss": 0.4918, "loss_nan_ranks": 0, "loss_rank_avg": 0.4876139760017395, "step": 35, "valid_targets_mean": 3874.3, "valid_targets_min": 1363 }, { "epoch": 0.06379585326953748, "grad_norm": 1.836628593469571, "learning_rate": 3.5535307517084285e-06, "loss": 0.4547, "loss_nan_ranks": 0, "loss_rank_avg": 0.47373178601264954, "step": 40, "valid_targets_mean": 3826.8, "valid_targets_min": 1465 }, { "epoch": 0.07177033492822966, "grad_norm": 1.2423251085316844, "learning_rate": 4.009111617312073e-06, "loss": 0.4167, "loss_nan_ranks": 0, "loss_rank_avg": 0.4141938090324402, "step": 45, "valid_targets_mean": 4673.0, "valid_targets_min": 1811 }, { "epoch": 0.07974481658692185, "grad_norm": 1.1976629955780103, "learning_rate": 4.464692482915718e-06, "loss": 0.4112, "loss_nan_ranks": 0, "loss_rank_avg": 0.4462246000766754, "step": 50, "valid_targets_mean": 3402.2, "valid_targets_min": 1417 }, { "epoch": 0.08771929824561403, "grad_norm": 0.9374607824761864, "learning_rate": 4.920273348519363e-06, "loss": 0.4168, "loss_nan_ranks": 0, "loss_rank_avg": 0.39574891328811646, "step": 55, "valid_targets_mean": 3730.4, "valid_targets_min": 1185 }, { "epoch": 0.09569377990430622, "grad_norm": 0.8345026125790815, "learning_rate": 5.375854214123008e-06, "loss": 0.4056, "loss_nan_ranks": 0, "loss_rank_avg": 0.3709059953689575, "step": 60, "valid_targets_mean": 4410.6, "valid_targets_min": 1877 }, { "epoch": 0.10366826156299841, "grad_norm": 0.7251088865875112, "learning_rate": 5.831435079726651e-06, "loss": 0.3957, "loss_nan_ranks": 0, "loss_rank_avg": 0.414184033870697, "step": 65, "valid_targets_mean": 4409.2, "valid_targets_min": 1579 }, { "epoch": 0.11164274322169059, "grad_norm": 0.6361706459112471, "learning_rate": 6.287015945330297e-06, "loss": 0.3825, "loss_nan_ranks": 0, "loss_rank_avg": 0.3978373408317566, "step": 70, "valid_targets_mean": 4352.1, "valid_targets_min": 629 }, { "epoch": 0.11961722488038277, "grad_norm": 0.8778851407966174, "learning_rate": 6.742596810933942e-06, "loss": 0.3551, "loss_nan_ranks": 0, "loss_rank_avg": 0.3310779929161072, "step": 75, "valid_targets_mean": 3677.3, "valid_targets_min": 1683 }, { "epoch": 0.12759170653907495, "grad_norm": 0.5499827496003175, "learning_rate": 7.1981776765375854e-06, "loss": 0.3597, "loss_nan_ranks": 0, "loss_rank_avg": 0.34589529037475586, "step": 80, "valid_targets_mean": 4806.0, "valid_targets_min": 1519 }, { "epoch": 0.13556618819776714, "grad_norm": 0.6376269307263297, "learning_rate": 7.65375854214123e-06, "loss": 0.3658, "loss_nan_ranks": 0, "loss_rank_avg": 0.3655011057853699, "step": 85, "valid_targets_mean": 3583.9, "valid_targets_min": 2175 }, { "epoch": 0.14354066985645933, "grad_norm": 0.5742252753369051, "learning_rate": 8.109339407744875e-06, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.385811448097229, "step": 90, "valid_targets_mean": 4250.4, "valid_targets_min": 1863 }, { "epoch": 0.15151515151515152, "grad_norm": 0.5753097344872611, "learning_rate": 8.564920273348521e-06, "loss": 0.3558, "loss_nan_ranks": 0, "loss_rank_avg": 0.3747674226760864, "step": 95, "valid_targets_mean": 4264.9, "valid_targets_min": 1876 }, { "epoch": 0.1594896331738437, "grad_norm": 0.5354986309600116, "learning_rate": 9.020501138952164e-06, "loss": 0.3392, "loss_nan_ranks": 0, "loss_rank_avg": 0.29349711537361145, "step": 100, "valid_targets_mean": 4301.4, "valid_targets_min": 1022 }, { "epoch": 0.1674641148325359, "grad_norm": 0.5042094725304733, "learning_rate": 9.47608200455581e-06, "loss": 0.3269, "loss_nan_ranks": 0, "loss_rank_avg": 0.3074486553668976, "step": 105, "valid_targets_mean": 4285.6, "valid_targets_min": 949 }, { "epoch": 0.17543859649122806, "grad_norm": 0.5342534363482105, "learning_rate": 9.931662870159453e-06, "loss": 0.3345, "loss_nan_ranks": 0, "loss_rank_avg": 0.33433669805526733, "step": 110, "valid_targets_mean": 4667.8, "valid_targets_min": 1007 }, { "epoch": 0.18341307814992025, "grad_norm": 0.5664117732647538, "learning_rate": 1.03872437357631e-05, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.3258150815963745, "step": 115, "valid_targets_mean": 4168.5, "valid_targets_min": 2399 }, { "epoch": 0.19138755980861244, "grad_norm": 0.6195050405082234, "learning_rate": 1.0842824601366744e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.317843496799469, "step": 120, "valid_targets_mean": 4331.0, "valid_targets_min": 311 }, { "epoch": 0.19936204146730463, "grad_norm": 0.7106286580810014, "learning_rate": 1.1298405466970387e-05, "loss": 0.3052, "loss_nan_ranks": 0, "loss_rank_avg": 0.345772385597229, "step": 125, "valid_targets_mean": 3779.2, "valid_targets_min": 1227 }, { "epoch": 0.20733652312599682, "grad_norm": 0.5142652660619057, "learning_rate": 1.1753986332574032e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.2607839107513428, "step": 130, "valid_targets_mean": 4497.3, "valid_targets_min": 809 }, { "epoch": 0.215311004784689, "grad_norm": 0.5952097660485908, "learning_rate": 1.2209567198177677e-05, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.31705808639526367, "step": 135, "valid_targets_mean": 4538.1, "valid_targets_min": 1387 }, { "epoch": 0.22328548644338117, "grad_norm": 0.5105105591440974, "learning_rate": 1.2665148063781323e-05, "loss": 0.2989, "loss_nan_ranks": 0, "loss_rank_avg": 0.2607859969139099, "step": 140, "valid_targets_mean": 4369.7, "valid_targets_min": 1806 }, { "epoch": 0.23125996810207336, "grad_norm": 0.503655334834791, "learning_rate": 1.3120728929384968e-05, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.26573601365089417, "step": 145, "valid_targets_mean": 4547.8, "valid_targets_min": 1503 }, { "epoch": 0.23923444976076555, "grad_norm": 0.5331226450754283, "learning_rate": 1.357630979498861e-05, "loss": 0.3136, "loss_nan_ranks": 0, "loss_rank_avg": 0.29404884576797485, "step": 150, "valid_targets_mean": 4822.4, "valid_targets_min": 465 }, { "epoch": 0.24720893141945774, "grad_norm": 0.5583950119493155, "learning_rate": 1.4031890660592255e-05, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.28105857968330383, "step": 155, "valid_targets_mean": 4380.1, "valid_targets_min": 1890 }, { "epoch": 0.2551834130781499, "grad_norm": 0.5248261173296397, "learning_rate": 1.4487471526195902e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.35021817684173584, "step": 160, "valid_targets_mean": 5202.3, "valid_targets_min": 1672 }, { "epoch": 0.2631578947368421, "grad_norm": 0.4720997343296031, "learning_rate": 1.4943052391799546e-05, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.3036966323852539, "step": 165, "valid_targets_mean": 5538.6, "valid_targets_min": 635 }, { "epoch": 0.2711323763955343, "grad_norm": 0.5595618392183499, "learning_rate": 1.539863325740319e-05, "loss": 0.2909, "loss_nan_ranks": 0, "loss_rank_avg": 0.30375349521636963, "step": 170, "valid_targets_mean": 4671.9, "valid_targets_min": 1260 }, { "epoch": 0.27910685805422647, "grad_norm": 0.5555511001381592, "learning_rate": 1.5854214123006836e-05, "loss": 0.2989, "loss_nan_ranks": 0, "loss_rank_avg": 0.31066784262657166, "step": 175, "valid_targets_mean": 3623.2, "valid_targets_min": 404 }, { "epoch": 0.28708133971291866, "grad_norm": 0.49946036712405906, "learning_rate": 1.630979498861048e-05, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.25820064544677734, "step": 180, "valid_targets_mean": 4328.4, "valid_targets_min": 2082 }, { "epoch": 0.29505582137161085, "grad_norm": 0.6264471320724355, "learning_rate": 1.6765375854214125e-05, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.28867748379707336, "step": 185, "valid_targets_mean": 4590.6, "valid_targets_min": 621 }, { "epoch": 0.30303030303030304, "grad_norm": 0.5759630894438817, "learning_rate": 1.722095671981777e-05, "loss": 0.3039, "loss_nan_ranks": 0, "loss_rank_avg": 0.315102219581604, "step": 190, "valid_targets_mean": 4509.0, "valid_targets_min": 1333 }, { "epoch": 0.31100478468899523, "grad_norm": 0.5294255834259166, "learning_rate": 1.7676537585421415e-05, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.27122050523757935, "step": 195, "valid_targets_mean": 4544.4, "valid_targets_min": 1545 }, { "epoch": 0.3189792663476874, "grad_norm": 0.6154065761188445, "learning_rate": 1.813211845102506e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.24356196820735931, "step": 200, "valid_targets_mean": 3598.1, "valid_targets_min": 1584 }, { "epoch": 0.3269537480063796, "grad_norm": 0.5224082452829883, "learning_rate": 1.8587699316628704e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.284517765045166, "step": 205, "valid_targets_mean": 5208.4, "valid_targets_min": 1290 }, { "epoch": 0.3349282296650718, "grad_norm": 0.5756342094108516, "learning_rate": 1.904328018223235e-05, "loss": 0.3041, "loss_nan_ranks": 0, "loss_rank_avg": 0.3382299542427063, "step": 210, "valid_targets_mean": 4352.9, "valid_targets_min": 1068 }, { "epoch": 0.34290271132376393, "grad_norm": 0.5209919174559063, "learning_rate": 1.9498861047835993e-05, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.3093770444393158, "step": 215, "valid_targets_mean": 4669.0, "valid_targets_min": 1859 }, { "epoch": 0.3508771929824561, "grad_norm": 0.5564760822604873, "learning_rate": 1.9954441913439638e-05, "loss": 0.3043, "loss_nan_ranks": 0, "loss_rank_avg": 0.41471871733665466, "step": 220, "valid_targets_mean": 5771.4, "valid_targets_min": 467 }, { "epoch": 0.3588516746411483, "grad_norm": 0.4401205513624318, "learning_rate": 2.0410022779043283e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.23879970610141754, "step": 225, "valid_targets_mean": 5340.2, "valid_targets_min": 1166 }, { "epoch": 0.3668261562998405, "grad_norm": 0.548529089679332, "learning_rate": 2.0865603644646927e-05, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.2805835008621216, "step": 230, "valid_targets_mean": 4598.0, "valid_targets_min": 1647 }, { "epoch": 0.3748006379585327, "grad_norm": 0.6106048799267036, "learning_rate": 2.1321184510250572e-05, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.260797917842865, "step": 235, "valid_targets_mean": 3621.2, "valid_targets_min": 1345 }, { "epoch": 0.3827751196172249, "grad_norm": 0.5381663991323422, "learning_rate": 2.1776765375854217e-05, "loss": 0.2794, "loss_nan_ranks": 0, "loss_rank_avg": 0.2917918562889099, "step": 240, "valid_targets_mean": 4667.2, "valid_targets_min": 2104 }, { "epoch": 0.39074960127591707, "grad_norm": 0.7581595258947841, "learning_rate": 2.223234624145786e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.28909996151924133, "step": 245, "valid_targets_mean": 4371.6, "valid_targets_min": 1739 }, { "epoch": 0.39872408293460926, "grad_norm": 0.5806802069339, "learning_rate": 2.2687927107061506e-05, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.2631956934928894, "step": 250, "valid_targets_mean": 4192.1, "valid_targets_min": 1587 }, { "epoch": 0.40669856459330145, "grad_norm": 0.6263257130474685, "learning_rate": 2.314350797266515e-05, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.25036656856536865, "step": 255, "valid_targets_mean": 4222.9, "valid_targets_min": 2196 }, { "epoch": 0.41467304625199364, "grad_norm": 0.5344890255498245, "learning_rate": 2.3599088838268792e-05, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.26563674211502075, "step": 260, "valid_targets_mean": 4978.1, "valid_targets_min": 1867 }, { "epoch": 0.4226475279106858, "grad_norm": 0.5058620232957759, "learning_rate": 2.4054669703872436e-05, "loss": 0.2592, "loss_nan_ranks": 0, "loss_rank_avg": 0.25486892461776733, "step": 265, "valid_targets_mean": 5157.2, "valid_targets_min": 1801 }, { "epoch": 0.430622009569378, "grad_norm": 0.6522226250750656, "learning_rate": 2.4510250569476085e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.27999359369277954, "step": 270, "valid_targets_mean": 4255.8, "valid_targets_min": 1735 }, { "epoch": 0.43859649122807015, "grad_norm": 0.5746725160756948, "learning_rate": 2.496583143507973e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.23281586170196533, "step": 275, "valid_targets_mean": 5547.3, "valid_targets_min": 1335 }, { "epoch": 0.44657097288676234, "grad_norm": 0.5241130870299622, "learning_rate": 2.5421412300683374e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.28230002522468567, "step": 280, "valid_targets_mean": 4519.5, "valid_targets_min": 1043 }, { "epoch": 0.45454545454545453, "grad_norm": 0.566135695536269, "learning_rate": 2.587699316628702e-05, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.25908809900283813, "step": 285, "valid_targets_mean": 3886.4, "valid_targets_min": 1509 }, { "epoch": 0.4625199362041467, "grad_norm": 0.5438761096776028, "learning_rate": 2.6332574031890663e-05, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.2712545394897461, "step": 290, "valid_targets_mean": 4487.6, "valid_targets_min": 736 }, { "epoch": 0.4704944178628389, "grad_norm": 0.559648132337892, "learning_rate": 2.6788154897494308e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.24313515424728394, "step": 295, "valid_targets_mean": 4423.8, "valid_targets_min": 686 }, { "epoch": 0.4784688995215311, "grad_norm": 0.5966418677079639, "learning_rate": 2.7243735763097953e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.23721837997436523, "step": 300, "valid_targets_mean": 3706.7, "valid_targets_min": 1173 }, { "epoch": 0.4864433811802233, "grad_norm": 0.5815566112988382, "learning_rate": 2.7699316628701597e-05, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.23788884282112122, "step": 305, "valid_targets_mean": 3594.3, "valid_targets_min": 1815 }, { "epoch": 0.4944178628389155, "grad_norm": 0.5045506008502036, "learning_rate": 2.815489749430524e-05, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.25513797998428345, "step": 310, "valid_targets_mean": 5347.7, "valid_targets_min": 1221 }, { "epoch": 0.5023923444976076, "grad_norm": 0.5701555342264036, "learning_rate": 2.8610478359908883e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.24246780574321747, "step": 315, "valid_targets_mean": 3548.3, "valid_targets_min": 1136 }, { "epoch": 0.5103668261562998, "grad_norm": 0.5182367732301608, "learning_rate": 2.906605922551253e-05, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.23432882130146027, "step": 320, "valid_targets_mean": 4655.8, "valid_targets_min": 1400 }, { "epoch": 0.518341307814992, "grad_norm": 0.581611039848372, "learning_rate": 2.9521640091116176e-05, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.24655424058437347, "step": 325, "valid_targets_mean": 4075.2, "valid_targets_min": 1087 }, { "epoch": 0.5263157894736842, "grad_norm": 0.5119496690813441, "learning_rate": 2.997722095671982e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.28360801935195923, "step": 330, "valid_targets_mean": 4828.7, "valid_targets_min": 2185 }, { "epoch": 0.5342902711323764, "grad_norm": 0.4842764810320044, "learning_rate": 3.0432801822323465e-05, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.3004698157310486, "step": 335, "valid_targets_mean": 5661.6, "valid_targets_min": 1938 }, { "epoch": 0.5422647527910686, "grad_norm": 0.5349587768564628, "learning_rate": 3.088838268792711e-05, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.2438666820526123, "step": 340, "valid_targets_mean": 4150.4, "valid_targets_min": 1564 }, { "epoch": 0.5502392344497608, "grad_norm": 0.5402803413388506, "learning_rate": 3.1343963553530755e-05, "loss": 0.2517, "loss_nan_ranks": 0, "loss_rank_avg": 0.25511205196380615, "step": 345, "valid_targets_mean": 4414.5, "valid_targets_min": 2053 }, { "epoch": 0.5582137161084529, "grad_norm": 0.7357121532770818, "learning_rate": 3.17995444191344e-05, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.30022668838500977, "step": 350, "valid_targets_mean": 3161.2, "valid_targets_min": 655 }, { "epoch": 0.5661881977671451, "grad_norm": 0.6635034938265247, "learning_rate": 3.2255125284738044e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.27807778120040894, "step": 355, "valid_targets_mean": 3865.3, "valid_targets_min": 2029 }, { "epoch": 0.5741626794258373, "grad_norm": 0.5759574185615652, "learning_rate": 3.271070615034169e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.2875663936138153, "step": 360, "valid_targets_mean": 4687.4, "valid_targets_min": 1812 }, { "epoch": 0.5821371610845295, "grad_norm": 0.5603633405311572, "learning_rate": 3.316628701594533e-05, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.25267183780670166, "step": 365, "valid_targets_mean": 4408.4, "valid_targets_min": 1131 }, { "epoch": 0.5901116427432217, "grad_norm": 0.6869663265290378, "learning_rate": 3.362186788154898e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.2470800280570984, "step": 370, "valid_targets_mean": 3387.9, "valid_targets_min": 1615 }, { "epoch": 0.5980861244019139, "grad_norm": 0.578708204023255, "learning_rate": 3.407744874715262e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.25405412912368774, "step": 375, "valid_targets_mean": 3955.7, "valid_targets_min": 1637 }, { "epoch": 0.6060606060606061, "grad_norm": 0.5959034995071885, "learning_rate": 3.453302961275627e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.2276259809732437, "step": 380, "valid_targets_mean": 3714.9, "valid_targets_min": 1249 }, { "epoch": 0.6140350877192983, "grad_norm": 0.7236145579514683, "learning_rate": 3.498861047835991e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.23672303557395935, "step": 385, "valid_targets_mean": 3127.5, "valid_targets_min": 440 }, { "epoch": 0.6220095693779905, "grad_norm": 0.4956883624100392, "learning_rate": 3.5444191343963557e-05, "loss": 0.2586, "loss_nan_ranks": 0, "loss_rank_avg": 0.2489890456199646, "step": 390, "valid_targets_mean": 4754.2, "valid_targets_min": 1637 }, { "epoch": 0.6299840510366826, "grad_norm": 0.8505599140008155, "learning_rate": 3.58997722095672e-05, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.2957842946052551, "step": 395, "valid_targets_mean": 4341.0, "valid_targets_min": 975 }, { "epoch": 0.6379585326953748, "grad_norm": 0.4755589673221355, "learning_rate": 3.6355353075170846e-05, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.2880033254623413, "step": 400, "valid_targets_mean": 5651.7, "valid_targets_min": 2397 }, { "epoch": 0.645933014354067, "grad_norm": 0.5917983081159787, "learning_rate": 3.681093394077449e-05, "loss": 0.2422, "loss_nan_ranks": 0, "loss_rank_avg": 0.2151985466480255, "step": 405, "valid_targets_mean": 3261.0, "valid_targets_min": 961 }, { "epoch": 0.6539074960127592, "grad_norm": 0.5368476047325583, "learning_rate": 3.7266514806378135e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.22232232987880707, "step": 410, "valid_targets_mean": 4013.4, "valid_targets_min": 1506 }, { "epoch": 0.6618819776714514, "grad_norm": 0.5211632420663286, "learning_rate": 3.772209567198178e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.23664991557598114, "step": 415, "valid_targets_mean": 4907.0, "valid_targets_min": 1902 }, { "epoch": 0.6698564593301436, "grad_norm": 0.4767758351048497, "learning_rate": 3.8177676537585425e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.23484618961811066, "step": 420, "valid_targets_mean": 4859.4, "valid_targets_min": 1921 }, { "epoch": 0.6778309409888357, "grad_norm": 1.2417309029902845, "learning_rate": 3.863325740318907e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.26523351669311523, "step": 425, "valid_targets_mean": 4098.0, "valid_targets_min": 1888 }, { "epoch": 0.6858054226475279, "grad_norm": 0.6004123621981486, "learning_rate": 3.9088838268792714e-05, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.2325078547000885, "step": 430, "valid_targets_mean": 3585.0, "valid_targets_min": 1821 }, { "epoch": 0.69377990430622, "grad_norm": 0.5537664296614766, "learning_rate": 3.954441913439636e-05, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.23680134117603302, "step": 435, "valid_targets_mean": 3540.8, "valid_targets_min": 416 }, { "epoch": 0.7017543859649122, "grad_norm": 0.5101795039873435, "learning_rate": 4e-05, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.21456380188465118, "step": 440, "valid_targets_mean": 3978.2, "valid_targets_min": 1659 }, { "epoch": 0.7097288676236044, "grad_norm": 0.5031434314037209, "learning_rate": 3.9999841858814384e-05, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.23804379999637604, "step": 445, "valid_targets_mean": 4688.0, "valid_targets_min": 2147 }, { "epoch": 0.7177033492822966, "grad_norm": 0.53053495346675, "learning_rate": 3.999936743775839e-05, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.32655003666877747, "step": 450, "valid_targets_mean": 5120.7, "valid_targets_min": 528 }, { "epoch": 0.7256778309409888, "grad_norm": 0.5915625545140855, "learning_rate": 3.9998576744334574e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.22716417908668518, "step": 455, "valid_targets_mean": 3332.4, "valid_targets_min": 377 }, { "epoch": 0.733652312599681, "grad_norm": 0.5945946110181048, "learning_rate": 3.999746979104705e-05, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.26090529561042786, "step": 460, "valid_targets_mean": 3924.7, "valid_targets_min": 1501 }, { "epoch": 0.7416267942583732, "grad_norm": 0.6362179372108026, "learning_rate": 3.999604659540131e-05, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.22476539015769958, "step": 465, "valid_targets_mean": 4122.6, "valid_targets_min": 2180 }, { "epoch": 0.7496012759170654, "grad_norm": 0.6471807631332203, "learning_rate": 3.999430717990395e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.23010434210300446, "step": 470, "valid_targets_mean": 3640.4, "valid_targets_min": 1361 }, { "epoch": 0.7575757575757576, "grad_norm": 0.5703865355046819, "learning_rate": 3.999225157206228e-05, "loss": 0.2282, "loss_nan_ranks": 0, "loss_rank_avg": 0.23672768473625183, "step": 475, "valid_targets_mean": 4066.2, "valid_targets_min": 1061 }, { "epoch": 0.7655502392344498, "grad_norm": 0.5858989027495684, "learning_rate": 3.998987980438393e-05, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.32610398530960083, "step": 480, "valid_targets_mean": 4883.6, "valid_targets_min": 1424 }, { "epoch": 0.773524720893142, "grad_norm": 0.5813017376748988, "learning_rate": 3.9987191914376306e-05, "loss": 0.2518, "loss_nan_ranks": 0, "loss_rank_avg": 0.2823824882507324, "step": 485, "valid_targets_mean": 4392.2, "valid_targets_min": 359 }, { "epoch": 0.7814992025518341, "grad_norm": 0.5636916408209902, "learning_rate": 3.998418794454604e-05, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.25734850764274597, "step": 490, "valid_targets_mean": 4360.2, "valid_targets_min": 1272 }, { "epoch": 0.7894736842105263, "grad_norm": 0.4972880813638341, "learning_rate": 3.998086794239825e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.22650626301765442, "step": 495, "valid_targets_mean": 5009.5, "valid_targets_min": 1342 }, { "epoch": 0.7974481658692185, "grad_norm": 0.6083655046569959, "learning_rate": 3.997723196043585e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.254880428314209, "step": 500, "valid_targets_mean": 3642.2, "valid_targets_min": 1547 }, { "epoch": 0.8054226475279107, "grad_norm": 0.4854760864042363, "learning_rate": 3.9973280056158695e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.2242877185344696, "step": 505, "valid_targets_mean": 4663.0, "valid_targets_min": 1162 }, { "epoch": 0.8133971291866029, "grad_norm": 0.4838878799701098, "learning_rate": 3.9969012292062655e-05, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.2093224823474884, "step": 510, "valid_targets_mean": 4763.6, "valid_targets_min": 1913 }, { "epoch": 0.8213716108452951, "grad_norm": 0.6268372836484649, "learning_rate": 3.996442873563866e-05, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.28269273042678833, "step": 515, "valid_targets_mean": 4417.9, "valid_targets_min": 445 }, { "epoch": 0.8293460925039873, "grad_norm": 0.5129765312718306, "learning_rate": 3.9959529459371624e-05, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.26153725385665894, "step": 520, "valid_targets_mean": 5101.4, "valid_targets_min": 1506 }, { "epoch": 0.8373205741626795, "grad_norm": 0.614028186365327, "learning_rate": 3.9954314540739284e-05, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.21306970715522766, "step": 525, "valid_targets_mean": 4610.0, "valid_targets_min": 1604 }, { "epoch": 0.8452950558213717, "grad_norm": 0.5183329707466268, "learning_rate": 3.994878406221097e-05, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.22915929555892944, "step": 530, "valid_targets_mean": 3992.6, "valid_targets_min": 1596 }, { "epoch": 0.8532695374800638, "grad_norm": 0.48748891646891646, "learning_rate": 3.994293811124632e-05, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.21784503757953644, "step": 535, "valid_targets_mean": 4734.7, "valid_targets_min": 2272 }, { "epoch": 0.861244019138756, "grad_norm": 0.5577470057219691, "learning_rate": 3.993677678029392e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.261586457490921, "step": 540, "valid_targets_mean": 4207.6, "valid_targets_min": 2094 }, { "epoch": 0.8692185007974481, "grad_norm": 0.5361831016352179, "learning_rate": 3.9930300166789765e-05, "loss": 0.2246, "loss_nan_ranks": 0, "loss_rank_avg": 0.24090802669525146, "step": 545, "valid_targets_mean": 4649.8, "valid_targets_min": 1477 }, { "epoch": 0.8771929824561403, "grad_norm": 0.5535412241281055, "learning_rate": 3.992350837315581e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.29971128702163696, "step": 550, "valid_targets_mean": 4245.1, "valid_targets_min": 489 }, { "epoch": 0.8851674641148325, "grad_norm": 0.5925574761855791, "learning_rate": 3.991640150679826e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.22118769586086273, "step": 555, "valid_targets_mean": 4004.8, "valid_targets_min": 447 }, { "epoch": 0.8931419457735247, "grad_norm": 0.5767617153732819, "learning_rate": 3.990897968010596e-05, "loss": 0.2275, "loss_nan_ranks": 0, "loss_rank_avg": 0.20498380064964294, "step": 560, "valid_targets_mean": 4139.0, "valid_targets_min": 838 }, { "epoch": 0.9011164274322169, "grad_norm": 0.4835231868725431, "learning_rate": 3.990124301044855e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.1946374922990799, "step": 565, "valid_targets_mean": 4275.1, "valid_targets_min": 2198 }, { "epoch": 0.9090909090909091, "grad_norm": 0.5296996222002296, "learning_rate": 3.989319162017465e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.2601141035556793, "step": 570, "valid_targets_mean": 3926.8, "valid_targets_min": 763 }, { "epoch": 0.9170653907496013, "grad_norm": 0.4471460846434403, "learning_rate": 3.988482563660989e-05, "loss": 0.2377, "loss_nan_ranks": 0, "loss_rank_avg": 0.24986547231674194, "step": 575, "valid_targets_mean": 5239.9, "valid_targets_min": 883 }, { "epoch": 0.9250398724082934, "grad_norm": 0.4777445171386324, "learning_rate": 3.987614519205493e-05, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.22537899017333984, "step": 580, "valid_targets_mean": 4626.4, "valid_targets_min": 632 }, { "epoch": 0.9330143540669856, "grad_norm": 0.49075192060803235, "learning_rate": 3.986715042378334e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.23568783700466156, "step": 585, "valid_targets_mean": 5212.7, "valid_targets_min": 1512 }, { "epoch": 0.9409888357256778, "grad_norm": 0.5462851495643627, "learning_rate": 3.985784147403947e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.23025473952293396, "step": 590, "valid_targets_mean": 3878.6, "valid_targets_min": 794 }, { "epoch": 0.94896331738437, "grad_norm": 0.5130018222856094, "learning_rate": 3.9848218490036144e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.21813419461250305, "step": 595, "valid_targets_mean": 4043.2, "valid_targets_min": 1178 }, { "epoch": 0.9569377990430622, "grad_norm": 0.4970815254000969, "learning_rate": 3.983828162395238e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.24089229106903076, "step": 600, "valid_targets_mean": 4810.4, "valid_targets_min": 985 }, { "epoch": 0.9649122807017544, "grad_norm": 0.5721802181838589, "learning_rate": 3.9828031032930944e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.2031339704990387, "step": 605, "valid_targets_mean": 3739.4, "valid_targets_min": 1367 }, { "epoch": 0.9728867623604466, "grad_norm": 0.5188176743792337, "learning_rate": 3.98174668790759e-05, "loss": 0.2304, "loss_nan_ranks": 0, "loss_rank_avg": 0.27065911889076233, "step": 610, "valid_targets_mean": 4289.9, "valid_targets_min": 644 }, { "epoch": 0.9808612440191388, "grad_norm": 0.5016486734647293, "learning_rate": 3.9806589329450045e-05, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.2198173850774765, "step": 615, "valid_targets_mean": 4156.7, "valid_targets_min": 861 }, { "epoch": 0.988835725677831, "grad_norm": 0.495182154320868, "learning_rate": 3.979539855607222e-05, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.22900980710983276, "step": 620, "valid_targets_mean": 4202.0, "valid_targets_min": 1404 }, { "epoch": 0.9968102073365231, "grad_norm": 0.4977265786366298, "learning_rate": 3.9783894735914646e-05, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.20909643173217773, "step": 625, "valid_targets_mean": 4351.4, "valid_targets_min": 1625 }, { "epoch": 1.0047846889952152, "grad_norm": 0.5032203543453754, "learning_rate": 3.9772078050900105e-05, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.22026538848876953, "step": 630, "valid_targets_mean": 3949.2, "valid_targets_min": 1519 }, { "epoch": 1.0127591706539074, "grad_norm": 0.5229641736587483, "learning_rate": 3.9759948687899055e-05, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.25218960642814636, "step": 635, "valid_targets_mean": 3920.1, "valid_targets_min": 667 }, { "epoch": 1.0207336523125996, "grad_norm": 0.5502168871278199, "learning_rate": 3.974750683872667e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.21615633368492126, "step": 640, "valid_targets_mean": 3966.8, "valid_targets_min": 1387 }, { "epoch": 1.0287081339712918, "grad_norm": 0.5482724060330286, "learning_rate": 3.973475270013984e-05, "loss": 0.2195, "loss_nan_ranks": 0, "loss_rank_avg": 0.22589367628097534, "step": 645, "valid_targets_mean": 4249.8, "valid_targets_min": 1645 }, { "epoch": 1.036682615629984, "grad_norm": 0.48681150157765296, "learning_rate": 3.972168647383402e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.18984422087669373, "step": 650, "valid_targets_mean": 4701.6, "valid_targets_min": 1897 }, { "epoch": 1.0446570972886762, "grad_norm": 0.5286726205605536, "learning_rate": 3.970830836644006e-05, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.2323208749294281, "step": 655, "valid_targets_mean": 3915.1, "valid_targets_min": 2094 }, { "epoch": 1.0526315789473684, "grad_norm": 0.5463582558960633, "learning_rate": 3.9694618589520945e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.24363505840301514, "step": 660, "valid_targets_mean": 3746.0, "valid_targets_min": 1271 }, { "epoch": 1.0606060606060606, "grad_norm": 0.4692304274685834, "learning_rate": 3.9680617359568414e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.22661146521568298, "step": 665, "valid_targets_mean": 4613.2, "valid_targets_min": 811 }, { "epoch": 1.0685805422647527, "grad_norm": 0.5076971387573798, "learning_rate": 3.966630489799959e-05, "loss": 0.2113, "loss_nan_ranks": 0, "loss_rank_avg": 0.2089880257844925, "step": 670, "valid_targets_mean": 3869.4, "valid_targets_min": 1038 }, { "epoch": 1.076555023923445, "grad_norm": 0.4498347073038136, "learning_rate": 3.9651681431153445e-05, "loss": 0.2237, "loss_nan_ranks": 0, "loss_rank_avg": 0.21558557450771332, "step": 675, "valid_targets_mean": 4482.1, "valid_targets_min": 1271 }, { "epoch": 1.0845295055821371, "grad_norm": 0.5064153829663555, "learning_rate": 3.96367471902872e-05, "loss": 0.2412, "loss_nan_ranks": 0, "loss_rank_avg": 0.2504901587963104, "step": 680, "valid_targets_mean": 5206.8, "valid_targets_min": 1827 }, { "epoch": 1.0925039872408293, "grad_norm": 0.5259888970380884, "learning_rate": 3.9621502411572705e-05, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.2569437623023987, "step": 685, "valid_targets_mean": 4280.9, "valid_targets_min": 655 }, { "epoch": 1.1004784688995215, "grad_norm": 0.6046706105924078, "learning_rate": 3.960594733609273e-05, "loss": 0.2104, "loss_nan_ranks": 0, "loss_rank_avg": 0.21926787495613098, "step": 690, "valid_targets_mean": 3736.1, "valid_targets_min": 1596 }, { "epoch": 1.1084529505582137, "grad_norm": 0.48006122244847677, "learning_rate": 3.9590082209837054e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.23299375176429749, "step": 695, "valid_targets_mean": 4608.6, "valid_targets_min": 1949 }, { "epoch": 1.1164274322169059, "grad_norm": 0.553902049161527, "learning_rate": 3.957390728369867e-05, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.2619227170944214, "step": 700, "valid_targets_mean": 3900.5, "valid_targets_min": 1523 }, { "epoch": 1.124401913875598, "grad_norm": 0.5567781830902339, "learning_rate": 3.955742281346979e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.22066161036491394, "step": 705, "valid_targets_mean": 3926.1, "valid_targets_min": 818 }, { "epoch": 1.1323763955342903, "grad_norm": 0.5030489445709994, "learning_rate": 3.9540629059837767e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.21337543427944183, "step": 710, "valid_targets_mean": 4503.9, "valid_targets_min": 1611 }, { "epoch": 1.1403508771929824, "grad_norm": 0.4521443857332383, "learning_rate": 3.952352628838102e-05, "loss": 0.2205, "loss_nan_ranks": 0, "loss_rank_avg": 0.2025744616985321, "step": 715, "valid_targets_mean": 4265.0, "valid_targets_min": 1616 }, { "epoch": 1.1483253588516746, "grad_norm": 0.5501529406774962, "learning_rate": 3.95061147695648e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.26300299167633057, "step": 720, "valid_targets_mean": 5110.0, "valid_targets_min": 1602 }, { "epoch": 1.1562998405103668, "grad_norm": 0.5721986878872145, "learning_rate": 3.9488394778736935e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.2308548390865326, "step": 725, "valid_targets_mean": 4003.0, "valid_targets_min": 1036 }, { "epoch": 1.164274322169059, "grad_norm": 0.4803368155501433, "learning_rate": 3.947036659612345e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.23096925020217896, "step": 730, "valid_targets_mean": 4496.0, "valid_targets_min": 1436 }, { "epoch": 1.1722488038277512, "grad_norm": 0.5066273119569031, "learning_rate": 3.945203050682418e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.23388348519802094, "step": 735, "valid_targets_mean": 3819.8, "valid_targets_min": 1237 }, { "epoch": 1.1802232854864434, "grad_norm": 0.4830554741716881, "learning_rate": 3.94333868008082e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.25258368253707886, "step": 740, "valid_targets_mean": 4634.4, "valid_targets_min": 916 }, { "epoch": 1.1881977671451356, "grad_norm": 0.4843244438344029, "learning_rate": 3.94144357729093e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.206687331199646, "step": 745, "valid_targets_mean": 4439.3, "valid_targets_min": 458 }, { "epoch": 1.1961722488038278, "grad_norm": 0.5243718793861886, "learning_rate": 3.939517772282127e-05, "loss": 0.2269, "loss_nan_ranks": 0, "loss_rank_avg": 0.2652336359024048, "step": 750, "valid_targets_mean": 4485.8, "valid_targets_min": 891 }, { "epoch": 1.20414673046252, "grad_norm": 0.5788052182039267, "learning_rate": 3.93756129550932e-05, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.20965895056724548, "step": 755, "valid_targets_mean": 3390.4, "valid_targets_min": 278 }, { "epoch": 1.2121212121212122, "grad_norm": 0.620883837268961, "learning_rate": 3.935574177912465e-05, "loss": 0.2143, "loss_nan_ranks": 0, "loss_rank_avg": 0.23990340530872345, "step": 760, "valid_targets_mean": 4009.7, "valid_targets_min": 2077 }, { "epoch": 1.2200956937799043, "grad_norm": 0.5871274762207975, "learning_rate": 3.9335564509160746e-05, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.22472716867923737, "step": 765, "valid_targets_mean": 4286.5, "valid_targets_min": 319 }, { "epoch": 1.2280701754385965, "grad_norm": 0.5010639217355422, "learning_rate": 3.931508146428724e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.21770870685577393, "step": 770, "valid_targets_mean": 4047.3, "valid_targets_min": 1735 }, { "epoch": 1.2360446570972887, "grad_norm": 0.5039635008586113, "learning_rate": 3.929429296842542e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.19232256710529327, "step": 775, "valid_targets_mean": 3779.6, "valid_targets_min": 1637 }, { "epoch": 1.244019138755981, "grad_norm": 0.5189905433600639, "learning_rate": 3.927319935032703e-05, "loss": 0.2304, "loss_nan_ranks": 0, "loss_rank_avg": 0.23623117804527283, "step": 780, "valid_targets_mean": 4330.4, "valid_targets_min": 342 }, { "epoch": 1.251993620414673, "grad_norm": 0.6627491973095729, "learning_rate": 3.925180094356905e-05, "loss": 0.2394, "loss_nan_ranks": 0, "loss_rank_avg": 0.24548950791358948, "step": 785, "valid_targets_mean": 4172.2, "valid_targets_min": 1251 }, { "epoch": 1.2599681020733653, "grad_norm": 0.5079001254806608, "learning_rate": 3.9230098086548414e-05, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.21201512217521667, "step": 790, "valid_targets_mean": 4065.2, "valid_targets_min": 585 }, { "epoch": 1.2679425837320575, "grad_norm": 0.47150540150141773, "learning_rate": 3.920809112247668e-05, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.20915411412715912, "step": 795, "valid_targets_mean": 4409.1, "valid_targets_min": 1091 }, { "epoch": 1.2759170653907497, "grad_norm": 0.5514140187109288, "learning_rate": 3.918578039937459e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.23035244643688202, "step": 800, "valid_targets_mean": 4182.2, "valid_targets_min": 2198 }, { "epoch": 1.2838915470494419, "grad_norm": 0.4500995102298934, "learning_rate": 3.916316627006656e-05, "loss": 0.2108, "loss_nan_ranks": 0, "loss_rank_avg": 0.2097713053226471, "step": 805, "valid_targets_mean": 4795.3, "valid_targets_min": 1902 }, { "epoch": 1.291866028708134, "grad_norm": 0.52633246142109, "learning_rate": 3.914024909217511e-05, "loss": 0.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.19991585612297058, "step": 810, "valid_targets_mean": 3731.4, "valid_targets_min": 1883 }, { "epoch": 1.2998405103668262, "grad_norm": 0.4467294156911823, "learning_rate": 3.911702922811522e-05, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.203420490026474, "step": 815, "valid_targets_mean": 4653.8, "valid_targets_min": 2174 }, { "epoch": 1.3078149920255182, "grad_norm": 0.5081778926888767, "learning_rate": 3.909350704508856e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.20174889266490936, "step": 820, "valid_targets_mean": 3439.1, "valid_targets_min": 1350 }, { "epoch": 1.3157894736842106, "grad_norm": 0.9310514979548232, "learning_rate": 3.906968291507773e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.2513682246208191, "step": 825, "valid_targets_mean": 4917.4, "valid_targets_min": 1283 }, { "epoch": 1.3237639553429026, "grad_norm": 0.5555892851581838, "learning_rate": 3.904555721484034e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.20496833324432373, "step": 830, "valid_targets_mean": 4021.7, "valid_targets_min": 248 }, { "epoch": 1.331738437001595, "grad_norm": 0.47232094168845945, "learning_rate": 3.9021130325903076e-05, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.19785736501216888, "step": 835, "valid_targets_mean": 5302.4, "valid_targets_min": 2353 }, { "epoch": 1.339712918660287, "grad_norm": 0.5812182577655588, "learning_rate": 3.899640263455566e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.18643829226493835, "step": 840, "valid_targets_mean": 3905.0, "valid_targets_min": 961 }, { "epoch": 1.3476874003189794, "grad_norm": 0.5500888468056214, "learning_rate": 3.897137453184472e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.18745486438274384, "step": 845, "valid_targets_mean": 3677.1, "valid_targets_min": 574 }, { "epoch": 1.3556618819776713, "grad_norm": 0.6847492160049518, "learning_rate": 3.894604641356767e-05, "loss": 0.216, "loss_nan_ranks": 0, "loss_rank_avg": 0.2598264813423157, "step": 850, "valid_targets_mean": 4733.8, "valid_targets_min": 1433 }, { "epoch": 1.3636363636363638, "grad_norm": 0.45372699194812466, "learning_rate": 3.8920418680266346e-05, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.19950619339942932, "step": 855, "valid_targets_mean": 4372.9, "valid_targets_min": 933 }, { "epoch": 1.3716108452950557, "grad_norm": 0.49007066533357946, "learning_rate": 3.889449173722077e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.20979920029640198, "step": 860, "valid_targets_mean": 3954.1, "valid_targets_min": 1402 }, { "epoch": 1.3795853269537481, "grad_norm": 0.5091212381448587, "learning_rate": 3.8868265994442694e-05, "loss": 0.2061, "loss_nan_ranks": 0, "loss_rank_avg": 0.22372718155384064, "step": 865, "valid_targets_mean": 4045.6, "valid_targets_min": 600 }, { "epoch": 1.38755980861244, "grad_norm": 0.49225432870048075, "learning_rate": 3.8841741866669126e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.1865185797214508, "step": 870, "valid_targets_mean": 3703.1, "valid_targets_min": 1619 }, { "epoch": 1.3955342902711323, "grad_norm": 0.47745581156193523, "learning_rate": 3.881491977335577e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.2252838909626007, "step": 875, "valid_targets_mean": 4296.0, "valid_targets_min": 1796 }, { "epoch": 1.4035087719298245, "grad_norm": 0.43928492337677577, "learning_rate": 3.878780013867038e-05, "loss": 0.2232, "loss_nan_ranks": 0, "loss_rank_avg": 0.20441752672195435, "step": 880, "valid_targets_mean": 4535.2, "valid_targets_min": 1824 }, { "epoch": 1.4114832535885167, "grad_norm": 0.5033914360127287, "learning_rate": 3.8760383391486074e-05, "loss": 0.2246, "loss_nan_ranks": 0, "loss_rank_avg": 0.30052030086517334, "step": 885, "valid_targets_mean": 4486.1, "valid_targets_min": 531 }, { "epoch": 1.4194577352472089, "grad_norm": 0.46617057902823866, "learning_rate": 3.873266996537456e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.19758670032024384, "step": 890, "valid_targets_mean": 4368.9, "valid_targets_min": 588 }, { "epoch": 1.427432216905901, "grad_norm": 0.43206619780636607, "learning_rate": 3.8704660298599225e-05, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.2040582001209259, "step": 895, "valid_targets_mean": 6326.5, "valid_targets_min": 1686 }, { "epoch": 1.4354066985645932, "grad_norm": 0.48207222426509794, "learning_rate": 3.867635483410827e-05, "loss": 0.2178, "loss_nan_ranks": 0, "loss_rank_avg": 0.2013099491596222, "step": 900, "valid_targets_mean": 4192.6, "valid_targets_min": 1486 }, { "epoch": 1.4433811802232854, "grad_norm": 0.4666337478470858, "learning_rate": 3.864775401952767e-05, "loss": 0.2141, "loss_nan_ranks": 0, "loss_rank_avg": 0.22802595794200897, "step": 905, "valid_targets_mean": 4553.6, "valid_targets_min": 376 }, { "epoch": 1.4513556618819776, "grad_norm": 0.44722531533793, "learning_rate": 3.8618858307154085e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.20279376208782196, "step": 910, "valid_targets_mean": 4846.8, "valid_targets_min": 1507 }, { "epoch": 1.4593301435406698, "grad_norm": 0.5371093701872409, "learning_rate": 3.8589668153947743e-05, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.23264798521995544, "step": 915, "valid_targets_mean": 4581.4, "valid_targets_min": 386 }, { "epoch": 1.467304625199362, "grad_norm": 0.5165471090234898, "learning_rate": 3.8560184021525194e-05, "loss": 0.2096, "loss_nan_ranks": 0, "loss_rank_avg": 0.2197292149066925, "step": 920, "valid_targets_mean": 4447.9, "valid_targets_min": 2488 }, { "epoch": 1.4752791068580542, "grad_norm": 0.4798137016348713, "learning_rate": 3.853040637615199e-05, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.22513622045516968, "step": 925, "valid_targets_mean": 4678.5, "valid_targets_min": 286 }, { "epoch": 1.4832535885167464, "grad_norm": 0.4979070884147898, "learning_rate": 3.850033568873536e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.23755387961864471, "step": 930, "valid_targets_mean": 4021.5, "valid_targets_min": 1577 }, { "epoch": 1.4912280701754386, "grad_norm": 0.4572253404809861, "learning_rate": 3.8469972434816706e-05, "loss": 0.2153, "loss_nan_ranks": 0, "loss_rank_avg": 0.23543182015419006, "step": 935, "valid_targets_mean": 5077.9, "valid_targets_min": 1116 }, { "epoch": 1.4992025518341308, "grad_norm": 0.47248195445727853, "learning_rate": 3.843931709456414e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.20499253273010254, "step": 940, "valid_targets_mean": 3970.7, "valid_targets_min": 1530 }, { "epoch": 1.507177033492823, "grad_norm": 0.42598999174275803, "learning_rate": 3.840837015276483e-05, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.2627623975276947, "step": 945, "valid_targets_mean": 5831.6, "valid_targets_min": 2288 }, { "epoch": 1.5151515151515151, "grad_norm": 0.6269538410575813, "learning_rate": 3.83771320988174e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.18554210662841797, "step": 950, "valid_targets_mean": 4548.8, "valid_targets_min": 1487 }, { "epoch": 1.5231259968102073, "grad_norm": 0.500690066016818, "learning_rate": 3.834560342672413e-05, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.22179262340068817, "step": 955, "valid_targets_mean": 3794.7, "valid_targets_min": 1451 }, { "epoch": 1.5311004784688995, "grad_norm": 0.4844197425861743, "learning_rate": 3.831378463508318e-05, "loss": 0.2044, "loss_nan_ranks": 0, "loss_rank_avg": 0.1850634515285492, "step": 960, "valid_targets_mean": 4430.5, "valid_targets_min": 1689 }, { "epoch": 1.5390749601275917, "grad_norm": 0.49254151371909743, "learning_rate": 3.8281676227080694e-05, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.2288564294576645, "step": 965, "valid_targets_mean": 3998.4, "valid_targets_min": 291 }, { "epoch": 1.547049441786284, "grad_norm": 0.5742983155284956, "learning_rate": 3.824927871048284e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.2189641147851944, "step": 970, "valid_targets_mean": 3550.6, "valid_targets_min": 1509 }, { "epoch": 1.555023923444976, "grad_norm": 0.5433468243901337, "learning_rate": 3.8216592597627797e-05, "loss": 0.2134, "loss_nan_ranks": 0, "loss_rank_avg": 0.223488450050354, "step": 975, "valid_targets_mean": 4082.4, "valid_targets_min": 1704 }, { "epoch": 1.5629984051036683, "grad_norm": 0.5196900072582149, "learning_rate": 3.818361840541761e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.20587456226348877, "step": 980, "valid_targets_mean": 4621.8, "valid_targets_min": 815 }, { "epoch": 1.5709728867623605, "grad_norm": 0.5135498979104908, "learning_rate": 3.815035665531008e-05, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.24312788248062134, "step": 985, "valid_targets_mean": 3476.9, "valid_targets_min": 462 }, { "epoch": 1.5789473684210527, "grad_norm": 0.7898137054288659, "learning_rate": 3.811680787331047e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.22189228236675262, "step": 990, "valid_targets_mean": 3913.2, "valid_targets_min": 1367 }, { "epoch": 1.5869218500797448, "grad_norm": 0.43969010537708586, "learning_rate": 3.8082972589963175e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.20273138582706451, "step": 995, "valid_targets_mean": 4583.5, "valid_targets_min": 1345 }, { "epoch": 1.594896331738437, "grad_norm": 0.5555222366008191, "learning_rate": 3.80488513403434e-05, "loss": 0.2225, "loss_nan_ranks": 0, "loss_rank_avg": 0.21825510263442993, "step": 1000, "valid_targets_mean": 3541.6, "valid_targets_min": 1470 }, { "epoch": 1.6028708133971292, "grad_norm": 0.4321959152756272, "learning_rate": 3.8014444664048616e-05, "loss": 0.2096, "loss_nan_ranks": 0, "loss_rank_avg": 0.1973963975906372, "step": 1005, "valid_targets_mean": 4639.2, "valid_targets_min": 1503 }, { "epoch": 1.6108452950558214, "grad_norm": 0.46446966286351066, "learning_rate": 3.797975310519009e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.2148362100124359, "step": 1010, "valid_targets_mean": 4174.1, "valid_targets_min": 1381 }, { "epoch": 1.6188197767145136, "grad_norm": 0.48913950514237353, "learning_rate": 3.794477721238425e-05, "loss": 0.2153, "loss_nan_ranks": 0, "loss_rank_avg": 0.2184276580810547, "step": 1015, "valid_targets_mean": 4014.8, "valid_targets_min": 1722 }, { "epoch": 1.6267942583732058, "grad_norm": 0.4303667207370021, "learning_rate": 3.7909517538744e-05, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.2015509009361267, "step": 1020, "valid_targets_mean": 4448.6, "valid_targets_min": 1590 }, { "epoch": 1.6347687400318978, "grad_norm": 0.5289047871909957, "learning_rate": 3.7873974641870006e-05, "loss": 0.2167, "loss_nan_ranks": 0, "loss_rank_avg": 0.21874231100082397, "step": 1025, "valid_targets_mean": 3820.2, "valid_targets_min": 1733 }, { "epoch": 1.6427432216905902, "grad_norm": 0.4762507453851103, "learning_rate": 3.7838149083841856e-05, "loss": 0.2232, "loss_nan_ranks": 0, "loss_rank_avg": 0.2580573558807373, "step": 1030, "valid_targets_mean": 5352.6, "valid_targets_min": 1846 }, { "epoch": 1.6507177033492821, "grad_norm": 0.47198599267721897, "learning_rate": 3.7802041431209166e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.205755352973938, "step": 1035, "valid_targets_mean": 4287.4, "valid_targets_min": 1811 }, { "epoch": 1.6586921850079746, "grad_norm": 0.5028769618064659, "learning_rate": 3.776565225498264e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.20170894265174866, "step": 1040, "valid_targets_mean": 3809.2, "valid_targets_min": 1688 }, { "epoch": 1.6666666666666665, "grad_norm": 0.504718091730453, "learning_rate": 3.7728982130625025e-05, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.2416345477104187, "step": 1045, "valid_targets_mean": 4589.6, "valid_targets_min": 1648 }, { "epoch": 1.674641148325359, "grad_norm": 0.554866907792144, "learning_rate": 3.769203163804202e-05, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.22144190967082977, "step": 1050, "valid_targets_mean": 4044.3, "valid_targets_min": 867 }, { "epoch": 1.682615629984051, "grad_norm": 0.4912047494949895, "learning_rate": 3.7654801361573076e-05, "loss": 0.1908, "loss_nan_ranks": 0, "loss_rank_avg": 0.19729235768318176, "step": 1055, "valid_targets_mean": 4379.2, "valid_targets_min": 1476 }, { "epoch": 1.6905901116427433, "grad_norm": 0.5033895385309353, "learning_rate": 3.761729188998222e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.19748783111572266, "step": 1060, "valid_targets_mean": 4624.8, "valid_targets_min": 2190 }, { "epoch": 1.6985645933014353, "grad_norm": 0.5473790729590564, "learning_rate": 3.757950381644868e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.25469958782196045, "step": 1065, "valid_targets_mean": 3925.2, "valid_targets_min": 599 }, { "epoch": 1.7065390749601277, "grad_norm": 0.5180414304101282, "learning_rate": 3.7541437738557524e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.19136464595794678, "step": 1070, "valid_targets_mean": 3960.3, "valid_targets_min": 1645 }, { "epoch": 1.7145135566188197, "grad_norm": 0.5003214798788846, "learning_rate": 3.750309425829022e-05, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.19182105362415314, "step": 1075, "valid_targets_mean": 3812.0, "valid_targets_min": 1303 }, { "epoch": 1.722488038277512, "grad_norm": 0.49690764989147096, "learning_rate": 3.746447398201512e-05, "loss": 0.2172, "loss_nan_ranks": 0, "loss_rank_avg": 0.19056028127670288, "step": 1080, "valid_targets_mean": 4023.6, "valid_targets_min": 1050 }, { "epoch": 1.730462519936204, "grad_norm": 0.5016898081489446, "learning_rate": 3.7425577520477846e-05, "loss": 0.2186, "loss_nan_ranks": 0, "loss_rank_avg": 0.21159327030181885, "step": 1085, "valid_targets_mean": 4200.7, "valid_targets_min": 1525 }, { "epoch": 1.7384370015948964, "grad_norm": 0.5659690695722234, "learning_rate": 3.738640548879166e-05, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.2166757434606552, "step": 1090, "valid_targets_mean": 4174.4, "valid_targets_min": 1178 }, { "epoch": 1.7464114832535884, "grad_norm": 0.4955709318314084, "learning_rate": 3.7346958506427696e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.26833972334861755, "step": 1095, "valid_targets_mean": 4771.3, "valid_targets_min": 338 }, { "epoch": 1.7543859649122808, "grad_norm": 0.38960186550719944, "learning_rate": 3.730723719720523e-05, "loss": 0.2002, "loss_nan_ranks": 0, "loss_rank_avg": 0.1986948400735855, "step": 1100, "valid_targets_mean": 5489.8, "valid_targets_min": 2149 }, { "epoch": 1.7623604465709728, "grad_norm": 0.4629656896157057, "learning_rate": 3.7267242189281746e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.21994957327842712, "step": 1105, "valid_targets_mean": 4140.4, "valid_targets_min": 1083 }, { "epoch": 1.7703349282296652, "grad_norm": 0.49029157020426084, "learning_rate": 3.722697411514305e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.22220617532730103, "step": 1110, "valid_targets_mean": 4312.5, "valid_targets_min": 1783 }, { "epoch": 1.7783094098883572, "grad_norm": 0.47257303125367206, "learning_rate": 3.7186433611593225e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.20860454440116882, "step": 1115, "valid_targets_mean": 4489.4, "valid_targets_min": 1180 }, { "epoch": 1.7862838915470496, "grad_norm": 0.4881940956993811, "learning_rate": 3.7145621319744614e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.22178339958190918, "step": 1120, "valid_targets_mean": 4007.1, "valid_targets_min": 1672 }, { "epoch": 1.7942583732057416, "grad_norm": 0.49017938696756835, "learning_rate": 3.7104537885007635e-05, "loss": 0.2365, "loss_nan_ranks": 0, "loss_rank_avg": 0.2537485361099243, "step": 1125, "valid_targets_mean": 4017.6, "valid_targets_min": 1443 }, { "epoch": 1.802232854864434, "grad_norm": 0.4709602958627766, "learning_rate": 3.7063183957080594e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.22469566762447357, "step": 1130, "valid_targets_mean": 4085.2, "valid_targets_min": 793 }, { "epoch": 1.810207336523126, "grad_norm": 0.4928808140478705, "learning_rate": 3.7021560189939416e-05, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.20846673846244812, "step": 1135, "valid_targets_mean": 3571.0, "valid_targets_min": 1270 }, { "epoch": 1.8181818181818183, "grad_norm": 0.4479091986972175, "learning_rate": 3.697966724182729e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.25488775968551636, "step": 1140, "valid_targets_mean": 5469.8, "valid_targets_min": 2538 }, { "epoch": 1.8261562998405103, "grad_norm": 0.5036402613565975, "learning_rate": 3.6937505775244246e-05, "loss": 0.2096, "loss_nan_ranks": 0, "loss_rank_avg": 0.22394904494285583, "step": 1145, "valid_targets_mean": 3642.4, "valid_targets_min": 1295 }, { "epoch": 1.8341307814992025, "grad_norm": 0.4780135062253511, "learning_rate": 3.689507645693674e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.2610904574394226, "step": 1150, "valid_targets_mean": 4336.4, "valid_targets_min": 1326 }, { "epoch": 1.8421052631578947, "grad_norm": 0.44381256880644715, "learning_rate": 3.6852379957887025e-05, "loss": 0.2159, "loss_nan_ranks": 0, "loss_rank_avg": 0.2414180189371109, "step": 1155, "valid_targets_mean": 4727.1, "valid_targets_min": 1465 }, { "epoch": 1.8500797448165869, "grad_norm": 0.5083384797022545, "learning_rate": 3.6809416953302606e-05, "loss": 0.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.19842639565467834, "step": 1160, "valid_targets_mean": 3549.2, "valid_targets_min": 331 }, { "epoch": 1.858054226475279, "grad_norm": 0.49199658884829844, "learning_rate": 3.676618812260553e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.2503410577774048, "step": 1165, "valid_targets_mean": 5109.9, "valid_targets_min": 2149 }, { "epoch": 1.8660287081339713, "grad_norm": 0.55008339033863, "learning_rate": 3.672269414942166e-05, "loss": 0.2141, "loss_nan_ranks": 0, "loss_rank_avg": 0.22753937542438507, "step": 1170, "valid_targets_mean": 4630.0, "valid_targets_min": 976 }, { "epoch": 1.8740031897926634, "grad_norm": 0.4586261326556948, "learning_rate": 3.6678935721569825e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.18508616089820862, "step": 1175, "valid_targets_mean": 4012.5, "valid_targets_min": 1306 }, { "epoch": 1.8819776714513556, "grad_norm": 0.5027511997863094, "learning_rate": 3.663491353105101e-05, "loss": 0.2077, "loss_nan_ranks": 0, "loss_rank_avg": 0.2094116061925888, "step": 1180, "valid_targets_mean": 4146.3, "valid_targets_min": 1831 }, { "epoch": 1.8899521531100478, "grad_norm": 0.44258348252135243, "learning_rate": 3.659062827403735e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.21222475171089172, "step": 1185, "valid_targets_mean": 4740.8, "valid_targets_min": 484 }, { "epoch": 1.89792663476874, "grad_norm": 0.4593536791251397, "learning_rate": 3.654608065086115e-05, "loss": 0.2114, "loss_nan_ranks": 0, "loss_rank_avg": 0.21094900369644165, "step": 1190, "valid_targets_mean": 4180.3, "valid_targets_min": 1467 }, { "epoch": 1.9059011164274322, "grad_norm": 0.3864590115928493, "learning_rate": 3.650127136600379e-05, "loss": 0.2242, "loss_nan_ranks": 0, "loss_rank_avg": 0.2283993363380432, "step": 1195, "valid_targets_mean": 6030.2, "valid_targets_min": 2216 }, { "epoch": 1.9138755980861244, "grad_norm": 0.4493029875433048, "learning_rate": 3.645620112808464e-05, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.20390526950359344, "step": 1200, "valid_targets_mean": 4438.4, "valid_targets_min": 1179 }, { "epoch": 1.9218500797448166, "grad_norm": 0.4717808228916783, "learning_rate": 3.641087064984977e-05, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.29960161447525024, "step": 1205, "valid_targets_mean": 5767.2, "valid_targets_min": 2064 }, { "epoch": 1.9298245614035088, "grad_norm": 0.4408153072153271, "learning_rate": 3.636528064816073e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.21097023785114288, "step": 1210, "valid_targets_mean": 4657.0, "valid_targets_min": 1295 }, { "epoch": 1.937799043062201, "grad_norm": 0.5308216721572256, "learning_rate": 3.6319431843983223e-05, "loss": 0.2116, "loss_nan_ranks": 0, "loss_rank_avg": 0.26519426703453064, "step": 1215, "valid_targets_mean": 4505.1, "valid_targets_min": 777 }, { "epoch": 1.9457735247208932, "grad_norm": 0.5036613470499272, "learning_rate": 3.6273324962375676e-05, "loss": 0.2173, "loss_nan_ranks": 0, "loss_rank_avg": 0.2110607922077179, "step": 1220, "valid_targets_mean": 3974.0, "valid_targets_min": 1086 }, { "epoch": 1.9537480063795853, "grad_norm": 0.47289512484636687, "learning_rate": 3.622696073247777e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.20814213156700134, "step": 1225, "valid_targets_mean": 4752.9, "valid_targets_min": 445 }, { "epoch": 1.9617224880382775, "grad_norm": 0.49652731607830747, "learning_rate": 3.6180339887498953e-05, "loss": 0.2177, "loss_nan_ranks": 0, "loss_rank_avg": 0.2197228968143463, "step": 1230, "valid_targets_mean": 4165.1, "valid_targets_min": 1840 }, { "epoch": 1.9696969696969697, "grad_norm": 0.4303512638873414, "learning_rate": 3.613346316470678e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.19560399651527405, "step": 1235, "valid_targets_mean": 4744.9, "valid_targets_min": 1290 }, { "epoch": 1.977671451355662, "grad_norm": 0.46027425838155206, "learning_rate": 3.60863313054153e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.20572498440742493, "step": 1240, "valid_targets_mean": 4645.9, "valid_targets_min": 1393 }, { "epoch": 1.985645933014354, "grad_norm": 0.4179304388168029, "learning_rate": 3.6038945054973334e-05, "loss": 0.2036, "loss_nan_ranks": 0, "loss_rank_avg": 0.18564409017562866, "step": 1245, "valid_targets_mean": 4841.8, "valid_targets_min": 2470 }, { "epoch": 1.9936204146730463, "grad_norm": 0.429983595414097, "learning_rate": 3.599130516275266e-05, "loss": 0.2109, "loss_nan_ranks": 0, "loss_rank_avg": 0.17854493856430054, "step": 1250, "valid_targets_mean": 4375.5, "valid_targets_min": 738 }, { "epoch": 2.0015948963317385, "grad_norm": 0.5835831287236563, "learning_rate": 3.594341238213618e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.2125822901725769, "step": 1255, "valid_targets_mean": 4207.8, "valid_targets_min": 1622 }, { "epoch": 2.0095693779904304, "grad_norm": 0.48535029081671693, "learning_rate": 3.589526747050601e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.18778109550476074, "step": 1260, "valid_targets_mean": 4847.1, "valid_targets_min": 1503 }, { "epoch": 2.017543859649123, "grad_norm": 0.4142330646373312, "learning_rate": 3.584687118923149e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.16331608593463898, "step": 1265, "valid_targets_mean": 5046.7, "valid_targets_min": 2438 }, { "epoch": 2.025518341307815, "grad_norm": 0.5387717755970093, "learning_rate": 3.579822430365714e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.19953720271587372, "step": 1270, "valid_targets_mean": 3987.6, "valid_targets_min": 1561 }, { "epoch": 2.0334928229665072, "grad_norm": 0.492124600517885, "learning_rate": 3.57493275830906e-05, "loss": 0.2113, "loss_nan_ranks": 0, "loss_rank_avg": 0.2031257301568985, "step": 1275, "valid_targets_mean": 4217.2, "valid_targets_min": 1199 }, { "epoch": 2.041467304625199, "grad_norm": 0.49992210755448996, "learning_rate": 3.570018180079037e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.1987209916114807, "step": 1280, "valid_targets_mean": 4681.9, "valid_targets_min": 1519 }, { "epoch": 2.0494417862838916, "grad_norm": 0.5505016254551602, "learning_rate": 3.5650787733953715e-05, "loss": 0.206, "loss_nan_ranks": 0, "loss_rank_avg": 0.19336707890033722, "step": 1285, "valid_targets_mean": 4355.0, "valid_targets_min": 1653 }, { "epoch": 2.0574162679425836, "grad_norm": 0.579774349638529, "learning_rate": 3.560114616370425e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.20641644299030304, "step": 1290, "valid_targets_mean": 4079.1, "valid_targets_min": 583 }, { "epoch": 2.065390749601276, "grad_norm": 0.4389607585870106, "learning_rate": 3.555125787507964e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.18444427847862244, "step": 1295, "valid_targets_mean": 5314.6, "valid_targets_min": 1254 }, { "epoch": 2.073365231259968, "grad_norm": 0.4893113319926811, "learning_rate": 3.550112365701921e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.22254320979118347, "step": 1300, "valid_targets_mean": 4483.9, "valid_targets_min": 1227 }, { "epoch": 2.0813397129186604, "grad_norm": 0.5537767932697284, "learning_rate": 3.545074430235142e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.18424861133098602, "step": 1305, "valid_targets_mean": 4432.2, "valid_targets_min": 1619 }, { "epoch": 2.0893141945773523, "grad_norm": 0.5182340294860415, "learning_rate": 3.540012060778137e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.17916396260261536, "step": 1310, "valid_targets_mean": 4455.2, "valid_targets_min": 1876 }, { "epoch": 2.0972886762360448, "grad_norm": 0.4906965964718632, "learning_rate": 3.534925337387816e-05, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.17498987913131714, "step": 1315, "valid_targets_mean": 4435.5, "valid_targets_min": 1179 }, { "epoch": 2.1052631578947367, "grad_norm": 0.5227104218173729, "learning_rate": 3.529814340506226e-05, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.19775143265724182, "step": 1320, "valid_targets_mean": 4533.5, "valid_targets_min": 1604 }, { "epoch": 2.113237639553429, "grad_norm": 0.6246358255489487, "learning_rate": 3.524679150959277e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.18220943212509155, "step": 1325, "valid_targets_mean": 4121.6, "valid_targets_min": 1517 }, { "epoch": 2.121212121212121, "grad_norm": 0.4427948849698209, "learning_rate": 3.519519849955466e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.17299795150756836, "step": 1330, "valid_targets_mean": 4151.1, "valid_targets_min": 1403 }, { "epoch": 2.1291866028708135, "grad_norm": 0.45665193547767974, "learning_rate": 3.514336519084591e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.17760662734508514, "step": 1335, "valid_targets_mean": 5019.9, "valid_targets_min": 1252 }, { "epoch": 2.1371610845295055, "grad_norm": 0.5111255448822826, "learning_rate": 3.509129240316461e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.18380534648895264, "step": 1340, "valid_targets_mean": 3753.7, "valid_targets_min": 1912 }, { "epoch": 2.145135566188198, "grad_norm": 0.4888821553823615, "learning_rate": 3.5038980959995985e-05, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.18884651362895966, "step": 1345, "valid_targets_mean": 4299.5, "valid_targets_min": 524 }, { "epoch": 2.15311004784689, "grad_norm": 0.5876826648011623, "learning_rate": 3.498643168859941e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.21021640300750732, "step": 1350, "valid_targets_mean": 4070.5, "valid_targets_min": 1091 }, { "epoch": 2.1610845295055823, "grad_norm": 0.4433617225762594, "learning_rate": 3.493364541999529e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.15240584313869476, "step": 1355, "valid_targets_mean": 3732.5, "valid_targets_min": 1223 }, { "epoch": 2.1690590111642742, "grad_norm": 0.4999003849230528, "learning_rate": 3.488062298895194e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.22450381517410278, "step": 1360, "valid_targets_mean": 5037.6, "valid_targets_min": 1831 }, { "epoch": 2.1770334928229667, "grad_norm": 0.5515763140814884, "learning_rate": 3.482736523397237e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.17379963397979736, "step": 1365, "valid_targets_mean": 4321.4, "valid_targets_min": 1374 }, { "epoch": 2.1850079744816586, "grad_norm": 0.5140961821958343, "learning_rate": 3.4773872997281026e-05, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.21524573862552643, "step": 1370, "valid_targets_mean": 4404.0, "valid_targets_min": 1576 }, { "epoch": 2.192982456140351, "grad_norm": 0.5277729139359486, "learning_rate": 3.472014712481048e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.22807437181472778, "step": 1375, "valid_targets_mean": 4321.2, "valid_targets_min": 1846 }, { "epoch": 2.200956937799043, "grad_norm": 0.5031333134053864, "learning_rate": 3.466618846618806e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.22107753157615662, "step": 1380, "valid_targets_mean": 4169.7, "valid_targets_min": 1166 }, { "epoch": 2.2089314194577354, "grad_norm": 0.483311395201815, "learning_rate": 3.461199787472238e-05, "loss": 0.2041, "loss_nan_ranks": 0, "loss_rank_avg": 0.19544145464897156, "step": 1385, "valid_targets_mean": 3844.2, "valid_targets_min": 744 }, { "epoch": 2.2169059011164274, "grad_norm": 0.4498139497860062, "learning_rate": 3.455757620738989e-05, "loss": 0.2111, "loss_nan_ranks": 0, "loss_rank_avg": 0.21751423180103302, "step": 1390, "valid_targets_mean": 4871.2, "valid_targets_min": 377 }, { "epoch": 2.22488038277512, "grad_norm": 0.46372087812522933, "learning_rate": 3.450292432482127e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.20186303555965424, "step": 1395, "valid_targets_mean": 4219.1, "valid_targets_min": 1451 }, { "epoch": 2.2328548644338118, "grad_norm": 0.4234330431162755, "learning_rate": 3.444804309128789e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.16204340755939484, "step": 1400, "valid_targets_mean": 5115.7, "valid_targets_min": 2142 }, { "epoch": 2.240829346092504, "grad_norm": 0.46729513282292884, "learning_rate": 3.439293337468808e-05, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.1783636510372162, "step": 1405, "valid_targets_mean": 4136.9, "valid_targets_min": 1653 }, { "epoch": 2.248803827751196, "grad_norm": 0.5256776358531895, "learning_rate": 3.4337596046533426e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.2295759618282318, "step": 1410, "valid_targets_mean": 4567.9, "valid_targets_min": 1222 }, { "epoch": 2.2567783094098885, "grad_norm": 0.4138467943971567, "learning_rate": 3.4282031981935e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.16236048936843872, "step": 1415, "valid_targets_mean": 4935.4, "valid_targets_min": 1512 }, { "epoch": 2.2647527910685805, "grad_norm": 0.5052303861398547, "learning_rate": 3.42262420595895e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.21595962345600128, "step": 1420, "valid_targets_mean": 4676.1, "valid_targets_min": 462 }, { "epoch": 2.2727272727272725, "grad_norm": 0.42027522309214377, "learning_rate": 3.417022716176539e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.21920445561408997, "step": 1425, "valid_targets_mean": 5443.5, "valid_targets_min": 818 }, { "epoch": 2.280701754385965, "grad_norm": 0.42271888607035824, "learning_rate": 3.411398817428889e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.21368569135665894, "step": 1430, "valid_targets_mean": 5346.8, "valid_targets_min": 2060 }, { "epoch": 2.2886762360446573, "grad_norm": 0.46762819973280395, "learning_rate": 3.4057525986530016e-05, "loss": 0.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.21968646347522736, "step": 1435, "valid_targets_mean": 4741.2, "valid_targets_min": 331 }, { "epoch": 2.2966507177033493, "grad_norm": 0.47510163265424776, "learning_rate": 3.400084149138851e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.19467958807945251, "step": 1440, "valid_targets_mean": 4569.6, "valid_targets_min": 1837 }, { "epoch": 2.3046251993620412, "grad_norm": 0.4906053699523343, "learning_rate": 3.394393558527969e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.21481776237487793, "step": 1445, "valid_targets_mean": 4330.7, "valid_targets_min": 1908 }, { "epoch": 2.3125996810207337, "grad_norm": 0.5017709902553857, "learning_rate": 3.388680916812031e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.20141157507896423, "step": 1450, "valid_targets_mean": 4137.5, "valid_targets_min": 1589 }, { "epoch": 2.320574162679426, "grad_norm": 0.45313626296858717, "learning_rate": 3.382946314331429e-05, "loss": 0.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.1925966739654541, "step": 1455, "valid_targets_mean": 4450.9, "valid_targets_min": 397 }, { "epoch": 2.328548644338118, "grad_norm": 0.6495234625151266, "learning_rate": 3.377189841773848e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.20314140617847443, "step": 1460, "valid_targets_mean": 4231.6, "valid_targets_min": 1037 }, { "epoch": 2.33652312599681, "grad_norm": 0.5436303133229426, "learning_rate": 3.371411590172827e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.20022675395011902, "step": 1465, "valid_targets_mean": 4746.3, "valid_targets_min": 1710 }, { "epoch": 2.3444976076555024, "grad_norm": 0.4712354546705832, "learning_rate": 3.365611650906321e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.15993911027908325, "step": 1470, "valid_targets_mean": 3833.4, "valid_targets_min": 1170 }, { "epoch": 2.352472089314195, "grad_norm": 0.4505288458448758, "learning_rate": 3.359790115695259e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.21294520795345306, "step": 1475, "valid_targets_mean": 5357.1, "valid_targets_min": 1479 }, { "epoch": 2.360446570972887, "grad_norm": 0.5025939693327697, "learning_rate": 3.353947076602088e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.21563753485679626, "step": 1480, "valid_targets_mean": 4241.7, "valid_targets_min": 858 }, { "epoch": 2.3684210526315788, "grad_norm": 0.4676350895459756, "learning_rate": 3.34808262602932e-05, "loss": 0.2007, "loss_nan_ranks": 0, "loss_rank_avg": 0.2031913697719574, "step": 1485, "valid_targets_mean": 4083.8, "valid_targets_min": 884 }, { "epoch": 2.376395534290271, "grad_norm": 0.4563739844772263, "learning_rate": 3.342196856718074e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.1997055560350418, "step": 1490, "valid_targets_mean": 4307.0, "valid_targets_min": 1402 }, { "epoch": 2.384370015948963, "grad_norm": 0.43749184940511027, "learning_rate": 3.336289861746602e-05, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.18445178866386414, "step": 1495, "valid_targets_mean": 4663.4, "valid_targets_min": 1569 }, { "epoch": 2.3923444976076556, "grad_norm": 0.45977508895019903, "learning_rate": 3.330361734528823e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.1979564130306244, "step": 1500, "valid_targets_mean": 4822.2, "valid_targets_min": 1832 }, { "epoch": 2.4003189792663475, "grad_norm": 0.5414838734249728, "learning_rate": 3.324412568812844e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.19212666153907776, "step": 1505, "valid_targets_mean": 3750.8, "valid_targets_min": 777 }, { "epoch": 2.40829346092504, "grad_norm": 0.4358025730158986, "learning_rate": 3.318442458679477e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.1796949803829193, "step": 1510, "valid_targets_mean": 4733.1, "valid_targets_min": 1462 }, { "epoch": 2.416267942583732, "grad_norm": 0.5789725852587035, "learning_rate": 3.312451498540751e-05, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.22660470008850098, "step": 1515, "valid_targets_mean": 3926.1, "valid_targets_min": 1148 }, { "epoch": 2.4242424242424243, "grad_norm": 0.4810092138228401, "learning_rate": 3.306439783138421e-05, "loss": 0.2056, "loss_nan_ranks": 0, "loss_rank_avg": 0.1583409607410431, "step": 1520, "valid_targets_mean": 3954.2, "valid_targets_min": 2144 }, { "epoch": 2.4322169059011163, "grad_norm": 0.480939376721317, "learning_rate": 3.3004074075424666e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.19095252454280853, "step": 1525, "valid_targets_mean": 4131.1, "valid_targets_min": 636 }, { "epoch": 2.4401913875598087, "grad_norm": 0.44164348513325546, "learning_rate": 3.29435446714959e-05, "loss": 0.2042, "loss_nan_ranks": 0, "loss_rank_avg": 0.18615323305130005, "step": 1530, "valid_targets_mean": 4125.1, "valid_targets_min": 909 }, { "epoch": 2.4481658692185007, "grad_norm": 0.49332778067002697, "learning_rate": 3.288281057681709e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.23022127151489258, "step": 1535, "valid_targets_mean": 4346.1, "valid_targets_min": 1011 }, { "epoch": 2.456140350877193, "grad_norm": 0.5217870366629661, "learning_rate": 3.28218727518444e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.19895359873771667, "step": 1540, "valid_targets_mean": 3616.3, "valid_targets_min": 1063 }, { "epoch": 2.464114832535885, "grad_norm": 0.44722789365078947, "learning_rate": 3.2760732160255835e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.16717740893363953, "step": 1545, "valid_targets_mean": 4226.1, "valid_targets_min": 951 }, { "epoch": 2.4720893141945774, "grad_norm": 0.41737884025495914, "learning_rate": 3.269938976893595e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.2132222056388855, "step": 1550, "valid_targets_mean": 5227.2, "valid_targets_min": 2208 }, { "epoch": 2.4800637958532694, "grad_norm": 0.4677786411136909, "learning_rate": 3.2637846547960596e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.19589948654174805, "step": 1555, "valid_targets_mean": 4841.1, "valid_targets_min": 1762 }, { "epoch": 2.488038277511962, "grad_norm": 0.4965944170108996, "learning_rate": 3.2576103470581564e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.17509344220161438, "step": 1560, "valid_targets_mean": 3434.1, "valid_targets_min": 629 }, { "epoch": 2.496012759170654, "grad_norm": 0.492974160023232, "learning_rate": 3.25141615132112e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.15599842369556427, "step": 1565, "valid_targets_mean": 4451.3, "valid_targets_min": 1194 }, { "epoch": 2.503987240829346, "grad_norm": 0.42642356808242493, "learning_rate": 3.245202165540697e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.16409683227539062, "step": 1570, "valid_targets_mean": 4488.6, "valid_targets_min": 1827 }, { "epoch": 2.511961722488038, "grad_norm": 0.4616220732618904, "learning_rate": 3.238968487985594e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.16624875366687775, "step": 1575, "valid_targets_mean": 3498.1, "valid_targets_min": 1233 }, { "epoch": 2.5199362041467306, "grad_norm": 0.45820206047868534, "learning_rate": 3.232715217235927e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.1971983015537262, "step": 1580, "valid_targets_mean": 4863.6, "valid_targets_min": 385 }, { "epoch": 2.5279106858054226, "grad_norm": 0.42279033871539334, "learning_rate": 3.226442452181662e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.19996625185012817, "step": 1585, "valid_targets_mean": 5554.1, "valid_targets_min": 2678 }, { "epoch": 2.535885167464115, "grad_norm": 0.46417011052422286, "learning_rate": 3.220150292021049e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.19248399138450623, "step": 1590, "valid_targets_mean": 4302.6, "valid_targets_min": 1647 }, { "epoch": 2.543859649122807, "grad_norm": 0.42195835961915845, "learning_rate": 3.213838836259055e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.1905175745487213, "step": 1595, "valid_targets_mean": 5845.2, "valid_targets_min": 2714 }, { "epoch": 2.5518341307814993, "grad_norm": 0.41169073814710955, "learning_rate": 3.2075081847057886e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.2413644641637802, "step": 1600, "valid_targets_mean": 6022.2, "valid_targets_min": 2591 }, { "epoch": 2.5598086124401913, "grad_norm": 0.42143967615716676, "learning_rate": 3.201158437474925e-05, "loss": 0.1943, "loss_nan_ranks": 0, "loss_rank_avg": 0.17829415202140808, "step": 1605, "valid_targets_mean": 4504.9, "valid_targets_min": 2008 }, { "epoch": 2.5677830940988837, "grad_norm": 0.4019639267134053, "learning_rate": 3.194789694982119e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.19469118118286133, "step": 1610, "valid_targets_mean": 4991.6, "valid_targets_min": 2037 }, { "epoch": 2.5757575757575757, "grad_norm": 0.4967706504496925, "learning_rate": 3.1884020579434216e-05, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.18184614181518555, "step": 1615, "valid_targets_mean": 3664.2, "valid_targets_min": 989 }, { "epoch": 2.583732057416268, "grad_norm": 0.40679294637064134, "learning_rate": 3.181995627373679e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.17015117406845093, "step": 1620, "valid_targets_mean": 4571.1, "valid_targets_min": 529 }, { "epoch": 2.59170653907496, "grad_norm": 0.4584533151540396, "learning_rate": 3.1755705045849465e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.17102062702178955, "step": 1625, "valid_targets_mean": 4546.4, "valid_targets_min": 1534 }, { "epoch": 2.5996810207336525, "grad_norm": 0.4353991390783487, "learning_rate": 3.1691267911848765e-05, "loss": 0.1938, "loss_nan_ranks": 0, "loss_rank_avg": 0.20528733730316162, "step": 1630, "valid_targets_mean": 4818.4, "valid_targets_min": 2380 }, { "epoch": 2.6076555023923444, "grad_norm": 0.4725264329143068, "learning_rate": 3.1626645890751167e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.23138327896595, "step": 1635, "valid_targets_mean": 4452.9, "valid_targets_min": 1687 }, { "epoch": 2.6156299840510364, "grad_norm": 0.7190616362034168, "learning_rate": 3.156184000449697e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.2099694162607193, "step": 1640, "valid_targets_mean": 4351.5, "valid_targets_min": 792 }, { "epoch": 2.623604465709729, "grad_norm": 0.4262432921313368, "learning_rate": 3.149685127793415e-05, "loss": 0.2084, "loss_nan_ranks": 0, "loss_rank_avg": 0.2072952389717102, "step": 1645, "valid_targets_mean": 5261.7, "valid_targets_min": 1564 }, { "epoch": 2.6315789473684212, "grad_norm": 0.44663659913615, "learning_rate": 3.143168073880214e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.20910018682479858, "step": 1650, "valid_targets_mean": 4689.8, "valid_targets_min": 1977 }, { "epoch": 2.639553429027113, "grad_norm": 0.47855265259414465, "learning_rate": 3.1366329417715556e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.17901211977005005, "step": 1655, "valid_targets_mean": 3450.9, "valid_targets_min": 764 }, { "epoch": 2.647527910685805, "grad_norm": 0.42030685495576364, "learning_rate": 3.1300798348147954e-05, "loss": 0.187, "loss_nan_ranks": 0, "loss_rank_avg": 0.17088496685028076, "step": 1660, "valid_targets_mean": 4424.1, "valid_targets_min": 685 }, { "epoch": 2.6555023923444976, "grad_norm": 0.424205274613458, "learning_rate": 3.123508856641542e-05, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.20387335121631622, "step": 1665, "valid_targets_mean": 4416.8, "valid_targets_min": 641 }, { "epoch": 2.66347687400319, "grad_norm": 0.6446111039179884, "learning_rate": 3.116920111166025e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.18233443796634674, "step": 1670, "valid_targets_mean": 3812.8, "valid_targets_min": 1710 }, { "epoch": 2.671451355661882, "grad_norm": 0.4016792889917327, "learning_rate": 3.1103137025834456e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.17425809800624847, "step": 1675, "valid_targets_mean": 5096.6, "valid_targets_min": 1249 }, { "epoch": 2.679425837320574, "grad_norm": 0.4651781503641287, "learning_rate": 3.103689735368333e-05, "loss": 0.2157, "loss_nan_ranks": 0, "loss_rank_avg": 0.1736563742160797, "step": 1680, "valid_targets_mean": 4534.1, "valid_targets_min": 1866 }, { "epoch": 2.6874003189792663, "grad_norm": 0.5822658951368973, "learning_rate": 3.097048314272889e-05, "loss": 0.2072, "loss_nan_ranks": 0, "loss_rank_avg": 0.25176823139190674, "step": 1685, "valid_targets_mean": 3692.4, "valid_targets_min": 904 }, { "epoch": 2.6953748006379588, "grad_norm": 0.49469625871209677, "learning_rate": 3.090389544325335e-05, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.20558789372444153, "step": 1690, "valid_targets_mean": 3640.8, "valid_targets_min": 683 }, { "epoch": 2.7033492822966507, "grad_norm": 0.6014487435674147, "learning_rate": 3.08371353082825e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.18729646503925323, "step": 1695, "valid_targets_mean": 3934.1, "valid_targets_min": 1318 }, { "epoch": 2.7113237639553427, "grad_norm": 0.4723809602275162, "learning_rate": 3.0770203793568994e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.1865779161453247, "step": 1700, "valid_targets_mean": 4184.6, "valid_targets_min": 1924 }, { "epoch": 2.719298245614035, "grad_norm": 0.4575136224294941, "learning_rate": 3.0703101957575765e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.18605884909629822, "step": 1705, "valid_targets_mean": 4517.9, "valid_targets_min": 1272 }, { "epoch": 2.7272727272727275, "grad_norm": 0.44365096011449917, "learning_rate": 3.0635830861459204e-05, "loss": 0.201, "loss_nan_ranks": 0, "loss_rank_avg": 0.211789071559906, "step": 1710, "valid_targets_mean": 5082.9, "valid_targets_min": 667 }, { "epoch": 2.7352472089314195, "grad_norm": 0.46945868579564015, "learning_rate": 3.056839156905239e-05, "loss": 0.194, "loss_nan_ranks": 0, "loss_rank_avg": 0.17882491648197174, "step": 1715, "valid_targets_mean": 4237.8, "valid_targets_min": 1611 }, { "epoch": 2.7432216905901115, "grad_norm": 0.44204098954171, "learning_rate": 3.0500785146848303e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.20405025780200958, "step": 1720, "valid_targets_mean": 5329.2, "valid_targets_min": 1796 }, { "epoch": 2.751196172248804, "grad_norm": 0.46803832657642275, "learning_rate": 3.04330126639829e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.188456192612648, "step": 1725, "valid_targets_mean": 3660.6, "valid_targets_min": 1421 }, { "epoch": 2.7591706539074963, "grad_norm": 0.46909903458430224, "learning_rate": 3.0365075192218278e-05, "loss": 0.1912, "loss_nan_ranks": 0, "loss_rank_avg": 0.20096969604492188, "step": 1730, "valid_targets_mean": 3955.4, "valid_targets_min": 1782 }, { "epoch": 2.7671451355661882, "grad_norm": 0.4540996711308176, "learning_rate": 3.0296973805925663e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.15702204406261444, "step": 1735, "valid_targets_mean": 3424.9, "valid_targets_min": 996 }, { "epoch": 2.77511961722488, "grad_norm": 0.43447333950282657, "learning_rate": 3.022870958206845e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.17967906594276428, "step": 1740, "valid_targets_mean": 4727.9, "valid_targets_min": 1797 }, { "epoch": 2.7830940988835726, "grad_norm": 0.534010470635787, "learning_rate": 3.0160283600185168e-05, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.16738936305046082, "step": 1745, "valid_targets_mean": 3008.1, "valid_targets_min": 1061 }, { "epoch": 2.7910685805422646, "grad_norm": 0.4657128578979155, "learning_rate": 3.0091696942372412e-05, "loss": 0.2044, "loss_nan_ranks": 0, "loss_rank_avg": 0.2012743055820465, "step": 1750, "valid_targets_mean": 4893.4, "valid_targets_min": 486 }, { "epoch": 2.799043062200957, "grad_norm": 0.4392915887871567, "learning_rate": 3.002295069326772e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.16907723248004913, "step": 1755, "valid_targets_mean": 4969.5, "valid_targets_min": 1327 }, { "epoch": 2.807017543859649, "grad_norm": 0.4982700232598375, "learning_rate": 2.9954045940032423e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.21579095721244812, "step": 1760, "valid_targets_mean": 3663.6, "valid_targets_min": 1646 }, { "epoch": 2.8149920255183414, "grad_norm": 0.4632009960069745, "learning_rate": 2.988498377233446e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.17049282789230347, "step": 1765, "valid_targets_mean": 4540.4, "valid_targets_min": 1038 }, { "epoch": 2.8229665071770333, "grad_norm": 0.42410704640339714, "learning_rate": 2.981576528233114e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.19153660535812378, "step": 1770, "valid_targets_mean": 4711.1, "valid_targets_min": 2124 }, { "epoch": 2.8309409888357258, "grad_norm": 0.45542782962545275, "learning_rate": 2.9746391564651867e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.16209903359413147, "step": 1775, "valid_targets_mean": 3815.8, "valid_targets_min": 1518 }, { "epoch": 2.8389154704944177, "grad_norm": 0.44181038225703473, "learning_rate": 2.9676863716380845e-05, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.1918773651123047, "step": 1780, "valid_targets_mean": 5145.6, "valid_targets_min": 2006 }, { "epoch": 2.84688995215311, "grad_norm": 0.4733731410179992, "learning_rate": 2.9607182837039697e-05, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.17720836400985718, "step": 1785, "valid_targets_mean": 3921.2, "valid_targets_min": 1306 }, { "epoch": 2.854864433811802, "grad_norm": 0.4759505220208452, "learning_rate": 2.9537350028570126e-05, "loss": 0.1993, "loss_nan_ranks": 0, "loss_rank_avg": 0.19989919662475586, "step": 1790, "valid_targets_mean": 4174.9, "valid_targets_min": 1135 }, { "epoch": 2.8628389154704945, "grad_norm": 0.42878416628933597, "learning_rate": 2.946736639531643e-05, "loss": 0.1896, "loss_nan_ranks": 0, "loss_rank_avg": 0.19443926215171814, "step": 1795, "valid_targets_mean": 4803.4, "valid_targets_min": 2250 }, { "epoch": 2.8708133971291865, "grad_norm": 0.4976297417784473, "learning_rate": 2.9397233044008092e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.19648616015911102, "step": 1800, "valid_targets_mean": 3719.8, "valid_targets_min": 1844 }, { "epoch": 2.878787878787879, "grad_norm": 0.431683591573211, "learning_rate": 2.9326951083742243e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.21068888902664185, "step": 1805, "valid_targets_mean": 5563.5, "valid_targets_min": 1363 }, { "epoch": 2.886762360446571, "grad_norm": 0.5121916169724076, "learning_rate": 2.925652162596613e-05, "loss": 0.1816, "loss_nan_ranks": 0, "loss_rank_avg": 0.2092716246843338, "step": 1810, "valid_targets_mean": 4329.8, "valid_targets_min": 1729 }, { "epoch": 2.8947368421052633, "grad_norm": 0.4272155165121044, "learning_rate": 2.9185945784459558e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.17961260676383972, "step": 1815, "valid_targets_mean": 4433.8, "valid_targets_min": 1092 }, { "epoch": 2.9027113237639552, "grad_norm": 0.4446934153344442, "learning_rate": 2.9115224675317252e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.189774751663208, "step": 1820, "valid_targets_mean": 4546.6, "valid_targets_min": 1965 }, { "epoch": 2.9106858054226477, "grad_norm": 0.4076827298604876, "learning_rate": 2.9044359416931206e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.1695403754711151, "step": 1825, "valid_targets_mean": 4729.8, "valid_targets_min": 2092 }, { "epoch": 2.9186602870813396, "grad_norm": 0.43032076390253393, "learning_rate": 2.897335112997302e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.15757311880588531, "step": 1830, "valid_targets_mean": 3931.1, "valid_targets_min": 1880 }, { "epoch": 2.926634768740032, "grad_norm": 0.7730974548275344, "learning_rate": 2.8902200937376173e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.18478021025657654, "step": 1835, "valid_targets_mean": 4594.4, "valid_targets_min": 880 }, { "epoch": 2.934609250398724, "grad_norm": 0.43970061090571333, "learning_rate": 2.8830909964318242e-05, "loss": 0.1954, "loss_nan_ranks": 0, "loss_rank_avg": 0.17417211830615997, "step": 1840, "valid_targets_mean": 4185.7, "valid_targets_min": 1643 }, { "epoch": 2.9425837320574164, "grad_norm": 0.46307277533553975, "learning_rate": 2.875947933820312e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.1813255250453949, "step": 1845, "valid_targets_mean": 4267.8, "valid_targets_min": 412 }, { "epoch": 2.9505582137161084, "grad_norm": 0.45885144568744957, "learning_rate": 2.868791018864321e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.17331145703792572, "step": 1850, "valid_targets_mean": 3941.5, "valid_targets_min": 1577 }, { "epoch": 2.958532695374801, "grad_norm": 0.4564977890190464, "learning_rate": 2.861620364744151e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.16592752933502197, "step": 1855, "valid_targets_mean": 3880.0, "valid_targets_min": 1417 }, { "epoch": 2.9665071770334928, "grad_norm": 0.4644093884900869, "learning_rate": 2.854436084857379e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.15251806378364563, "step": 1860, "valid_targets_mean": 3713.1, "valid_targets_min": 1441 }, { "epoch": 2.974481658692185, "grad_norm": 0.4959719091360015, "learning_rate": 2.847238292817057e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.19827379286289215, "step": 1865, "valid_targets_mean": 3770.2, "valid_targets_min": 600 }, { "epoch": 2.982456140350877, "grad_norm": 0.5612759105888359, "learning_rate": 2.8400271024499212e-05, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.1830437183380127, "step": 1870, "valid_targets_mean": 3588.1, "valid_targets_min": 510 }, { "epoch": 2.990430622009569, "grad_norm": 0.4841101151001515, "learning_rate": 2.832802627794593e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.17299309372901917, "step": 1875, "valid_targets_mean": 4010.5, "valid_targets_min": 1156 }, { "epoch": 2.9984051036682615, "grad_norm": 0.48228383639741784, "learning_rate": 2.8255649830997704e-05, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.170659139752388, "step": 1880, "valid_targets_mean": 3891.1, "valid_targets_min": 1303 }, { "epoch": 3.006379585326954, "grad_norm": 0.4187959247951961, "learning_rate": 2.8183142828224238e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.15005925297737122, "step": 1885, "valid_targets_mean": 4229.8, "valid_targets_min": 726 }, { "epoch": 3.014354066985646, "grad_norm": 0.5518696834811211, "learning_rate": 2.811050641625988e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.16052091121673584, "step": 1890, "valid_targets_mean": 3637.3, "valid_targets_min": 1523 }, { "epoch": 3.0223285486443383, "grad_norm": 0.5272361647263227, "learning_rate": 2.8037741743785458e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.17966750264167786, "step": 1895, "valid_targets_mean": 4879.4, "valid_targets_min": 1303 }, { "epoch": 3.0303030303030303, "grad_norm": 0.44821310582608315, "learning_rate": 2.796484996151013e-05, "loss": 0.1883, "loss_nan_ranks": 0, "loss_rank_avg": 0.21618738770484924, "step": 1900, "valid_targets_mean": 5611.4, "valid_targets_min": 1867 }, { "epoch": 3.0382775119617227, "grad_norm": 0.4784008624223626, "learning_rate": 2.7891832222153188e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.16092903912067413, "step": 1905, "valid_targets_mean": 4007.4, "valid_targets_min": 291 }, { "epoch": 3.0462519936204147, "grad_norm": 0.46337869290279277, "learning_rate": 2.7818689680425807e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.18314269185066223, "step": 1910, "valid_targets_mean": 4119.5, "valid_targets_min": 319 }, { "epoch": 3.054226475279107, "grad_norm": 0.45687713151005843, "learning_rate": 2.7745423493012827e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.2106841802597046, "step": 1915, "valid_targets_mean": 4950.8, "valid_targets_min": 1469 }, { "epoch": 3.062200956937799, "grad_norm": 0.4790710436995416, "learning_rate": 2.767203481855441e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.17638225853443146, "step": 1920, "valid_targets_mean": 4521.6, "valid_targets_min": 1922 }, { "epoch": 3.0701754385964914, "grad_norm": 0.46515663038891586, "learning_rate": 2.7598524817627764e-05, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.1621520221233368, "step": 1925, "valid_targets_mean": 5203.6, "valid_targets_min": 2173 }, { "epoch": 3.0781499202551834, "grad_norm": 0.6079774346243542, "learning_rate": 2.7524894652728754e-05, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.18975286185741425, "step": 1930, "valid_targets_mean": 3732.1, "valid_targets_min": 906 }, { "epoch": 3.0861244019138754, "grad_norm": 0.4548224335500046, "learning_rate": 2.7451145488253544e-05, "loss": 0.1816, "loss_nan_ranks": 0, "loss_rank_avg": 0.18545740842819214, "step": 1935, "valid_targets_mean": 4543.8, "valid_targets_min": 763 }, { "epoch": 3.094098883572568, "grad_norm": 0.43076682756967427, "learning_rate": 2.7377278490480157e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.18288424611091614, "step": 1940, "valid_targets_mean": 5278.6, "valid_targets_min": 2115 }, { "epoch": 3.1020733652312598, "grad_norm": 0.44219495400736336, "learning_rate": 2.730329482755006e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.17927348613739014, "step": 1945, "valid_targets_mean": 4926.1, "valid_targets_min": 1333 }, { "epoch": 3.110047846889952, "grad_norm": 0.4642793792070131, "learning_rate": 2.7229195669449667e-05, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.15698301792144775, "step": 1950, "valid_targets_mean": 5145.6, "valid_targets_min": 2758 }, { "epoch": 3.118022328548644, "grad_norm": 0.5081120712069186, "learning_rate": 2.7154982187991855e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.16398665308952332, "step": 1955, "valid_targets_mean": 3972.9, "valid_targets_min": 1024 }, { "epoch": 3.1259968102073366, "grad_norm": 0.39334994682912094, "learning_rate": 2.7080655556797406e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.1446482390165329, "step": 1960, "valid_targets_mean": 5047.1, "valid_targets_min": 1067 }, { "epoch": 3.1339712918660285, "grad_norm": 0.49370701263368166, "learning_rate": 2.700621695127649e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.1659671664237976, "step": 1965, "valid_targets_mean": 3601.8, "valid_targets_min": 809 }, { "epoch": 3.141945773524721, "grad_norm": 0.5236111485377425, "learning_rate": 2.693166754861003e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.15575477480888367, "step": 1970, "valid_targets_mean": 3251.2, "valid_targets_min": 1446 }, { "epoch": 3.149920255183413, "grad_norm": 0.5184956275914406, "learning_rate": 2.685700852773113e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.17251455783843994, "step": 1975, "valid_targets_mean": 5407.9, "valid_targets_min": 1637 }, { "epoch": 3.1578947368421053, "grad_norm": 0.567900202509518, "learning_rate": 2.6782241069306395e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.17170360684394836, "step": 1980, "valid_targets_mean": 3757.9, "valid_targets_min": 1669 }, { "epoch": 3.1658692185007973, "grad_norm": 0.5331605536049749, "learning_rate": 2.6707366355717268e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.183954119682312, "step": 1985, "valid_targets_mean": 3772.0, "valid_targets_min": 1645 }, { "epoch": 3.1738437001594897, "grad_norm": 0.5372666317594943, "learning_rate": 2.663238557104136e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.19271928071975708, "step": 1990, "valid_targets_mean": 4226.8, "valid_targets_min": 462 }, { "epoch": 3.1818181818181817, "grad_norm": 0.4511808563006348, "learning_rate": 2.655729990103368e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.18819640576839447, "step": 1995, "valid_targets_mean": 4724.9, "valid_targets_min": 1801 }, { "epoch": 3.189792663476874, "grad_norm": 0.515719063530578, "learning_rate": 2.648211053310792e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.17429378628730774, "step": 2000, "valid_targets_mean": 3824.9, "valid_targets_min": 1608 }, { "epoch": 3.197767145135566, "grad_norm": 0.49018438347190046, "learning_rate": 2.6406818656317654e-05, "loss": 0.1883, "loss_nan_ranks": 0, "loss_rank_avg": 0.23138472437858582, "step": 2005, "valid_targets_mean": 4367.4, "valid_targets_min": 1162 }, { "epoch": 3.2057416267942584, "grad_norm": 0.5140123035534574, "learning_rate": 2.6331425461337557e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.15981221199035645, "step": 2010, "valid_targets_mean": 3901.4, "valid_targets_min": 1592 }, { "epoch": 3.2137161084529504, "grad_norm": 0.5084601119365288, "learning_rate": 2.6255932140444546e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.16400453448295593, "step": 2015, "valid_targets_mean": 3658.4, "valid_targets_min": 418 }, { "epoch": 3.221690590111643, "grad_norm": 0.5222629370653686, "learning_rate": 2.618033988749895e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.18251457810401917, "step": 2020, "valid_targets_mean": 3590.5, "valid_targets_min": 404 }, { "epoch": 3.229665071770335, "grad_norm": 0.44929273918603535, "learning_rate": 2.6104649897925622e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.18098227679729462, "step": 2025, "valid_targets_mean": 4840.8, "valid_targets_min": 1725 }, { "epoch": 3.237639553429027, "grad_norm": 0.5128148092418456, "learning_rate": 2.602886336869503e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.18772810697555542, "step": 2030, "valid_targets_mean": 4087.9, "valid_targets_min": 278 }, { "epoch": 3.245614035087719, "grad_norm": 0.5085322011859369, "learning_rate": 2.595298149830433e-05, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.16362358629703522, "step": 2035, "valid_targets_mean": 3683.7, "valid_targets_min": 1530 }, { "epoch": 3.2535885167464116, "grad_norm": 0.44741903202469246, "learning_rate": 2.5877005486758424e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.1595516800880432, "step": 2040, "valid_targets_mean": 4753.9, "valid_targets_min": 2291 }, { "epoch": 3.2615629984051036, "grad_norm": 0.46510640494197375, "learning_rate": 2.5800936535550954e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.16583102941513062, "step": 2045, "valid_targets_mean": 4312.9, "valid_targets_min": 1997 }, { "epoch": 3.269537480063796, "grad_norm": 0.4531657121086904, "learning_rate": 2.5724775847645345e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.19412560760974884, "step": 2050, "valid_targets_mean": 5226.4, "valid_targets_min": 1255 }, { "epoch": 3.277511961722488, "grad_norm": 0.46205211802785623, "learning_rate": 2.5648524627455738e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.17929866909980774, "step": 2055, "valid_targets_mean": 4219.8, "valid_targets_min": 962 }, { "epoch": 3.2854864433811803, "grad_norm": 0.583980913889235, "learning_rate": 2.557218408082798e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.17891603708267212, "step": 2060, "valid_targets_mean": 5263.7, "valid_targets_min": 1495 }, { "epoch": 3.2934609250398723, "grad_norm": 0.528345239667559, "learning_rate": 2.5495755415020504e-05, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.16911692917346954, "step": 2065, "valid_targets_mean": 4109.6, "valid_targets_min": 710 }, { "epoch": 3.3014354066985647, "grad_norm": 0.5330821422864389, "learning_rate": 2.5419239838685325e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.19775941967964172, "step": 2070, "valid_targets_mean": 4235.2, "valid_targets_min": 989 }, { "epoch": 3.3094098883572567, "grad_norm": 0.5494101250916248, "learning_rate": 2.5342638561848817e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.20631219446659088, "step": 2075, "valid_targets_mean": 3423.0, "valid_targets_min": 1477 }, { "epoch": 3.317384370015949, "grad_norm": 0.45567413053215694, "learning_rate": 2.526595279589265e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.16964775323867798, "step": 2080, "valid_targets_mean": 4667.2, "valid_targets_min": 1610 }, { "epoch": 3.325358851674641, "grad_norm": 0.48291376026654725, "learning_rate": 2.5189183753534634e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.17720086872577667, "step": 2085, "valid_targets_mean": 4395.1, "valid_targets_min": 1859 }, { "epoch": 3.3333333333333335, "grad_norm": 0.5572381771566919, "learning_rate": 2.5112332648809495e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.16899794340133667, "step": 2090, "valid_targets_mean": 4103.3, "valid_targets_min": 655 }, { "epoch": 3.3413078149920254, "grad_norm": 0.5124868674052819, "learning_rate": 2.503540069704973e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.195106640458107, "step": 2095, "valid_targets_mean": 4012.4, "valid_targets_min": 1067 }, { "epoch": 3.349282296650718, "grad_norm": 0.5470151593968711, "learning_rate": 2.4958389114866326e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.21948151290416718, "step": 2100, "valid_targets_mean": 3900.2, "valid_targets_min": 515 }, { "epoch": 3.35725677830941, "grad_norm": 0.46712894349683487, "learning_rate": 2.488129912012958e-05, "loss": 0.1875, "loss_nan_ranks": 0, "loss_rank_avg": 0.1717987209558487, "step": 2105, "valid_targets_mean": 4451.4, "valid_targets_min": 1283 }, { "epoch": 3.3652312599681022, "grad_norm": 0.5296054451681127, "learning_rate": 2.4804131931949823e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.16957393288612366, "step": 2110, "valid_targets_mean": 4148.4, "valid_targets_min": 858 }, { "epoch": 3.373205741626794, "grad_norm": 0.44324708492039827, "learning_rate": 2.4726888770658103e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.19824856519699097, "step": 2115, "valid_targets_mean": 5021.0, "valid_targets_min": 1764 }, { "epoch": 3.3811802232854866, "grad_norm": 0.44782890540327536, "learning_rate": 2.4649570857786928e-05, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.19559164345264435, "step": 2120, "valid_targets_mean": 5260.7, "valid_targets_min": 1522 }, { "epoch": 3.3891547049441786, "grad_norm": 0.4415358571325815, "learning_rate": 2.4572179416050953e-05, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.16224873065948486, "step": 2125, "valid_targets_mean": 4277.9, "valid_targets_min": 1156 }, { "epoch": 3.397129186602871, "grad_norm": 0.5354109744414436, "learning_rate": 2.449471566932761e-05, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.15482710301876068, "step": 2130, "valid_targets_mean": 3514.0, "valid_targets_min": 791 }, { "epoch": 3.405103668261563, "grad_norm": 0.4598141951361569, "learning_rate": 2.4417180842637764e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.1662302166223526, "step": 2135, "valid_targets_mean": 5137.8, "valid_targets_min": 1509 }, { "epoch": 3.4130781499202554, "grad_norm": 0.5263732946909472, "learning_rate": 2.4339576162126362e-05, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.1471291333436966, "step": 2140, "valid_targets_mean": 3313.0, "valid_targets_min": 1479 }, { "epoch": 3.4210526315789473, "grad_norm": 0.5328365830297036, "learning_rate": 2.4261902855043027e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.16807958483695984, "step": 2145, "valid_targets_mean": 3053.6, "valid_targets_min": 1038 }, { "epoch": 3.4290271132376393, "grad_norm": 0.4973411156089335, "learning_rate": 2.418416214972265e-05, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.1936582326889038, "step": 2150, "valid_targets_mean": 3973.1, "valid_targets_min": 1500 }, { "epoch": 3.4370015948963317, "grad_norm": 0.48444835144260445, "learning_rate": 2.4106355275565937e-05, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.18759359419345856, "step": 2155, "valid_targets_mean": 4261.8, "valid_targets_min": 400 }, { "epoch": 3.444976076555024, "grad_norm": 0.43370463589864844, "learning_rate": 2.4028483463020053e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.14529302716255188, "step": 2160, "valid_targets_mean": 4517.1, "valid_targets_min": 961 }, { "epoch": 3.452950558213716, "grad_norm": 0.5083145951827011, "learning_rate": 2.3950547943559056e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.1669323891401291, "step": 2165, "valid_targets_mean": 3752.9, "valid_targets_min": 286 }, { "epoch": 3.460925039872408, "grad_norm": 0.44649606232597117, "learning_rate": 2.3872549949664493e-05, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.14849191904067993, "step": 2170, "valid_targets_mean": 4235.8, "valid_targets_min": 1152 }, { "epoch": 3.4688995215311005, "grad_norm": 0.39918099350110425, "learning_rate": 2.3794490714805897e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.1473017781972885, "step": 2175, "valid_targets_mean": 4902.6, "valid_targets_min": 1706 }, { "epoch": 3.476874003189793, "grad_norm": 0.4752038213110687, "learning_rate": 2.3716371473421242e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.1683822125196457, "step": 2180, "valid_targets_mean": 3975.9, "valid_targets_min": 819 }, { "epoch": 3.484848484848485, "grad_norm": 0.528684880085982, "learning_rate": 2.36381934608975e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.19594570994377136, "step": 2185, "valid_targets_mean": 3924.7, "valid_targets_min": 1300 }, { "epoch": 3.492822966507177, "grad_norm": 0.45930586621782155, "learning_rate": 2.3559957913551014e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.1664031445980072, "step": 2190, "valid_targets_mean": 4340.3, "valid_targets_min": 1633 }, { "epoch": 3.5007974481658692, "grad_norm": 0.5587103197549831, "learning_rate": 2.3481666068607994e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.16250400245189667, "step": 2195, "valid_targets_mean": 4534.1, "valid_targets_min": 1007 }, { "epoch": 3.5087719298245617, "grad_norm": 0.4849102461514037, "learning_rate": 2.3403319164184986e-05, "loss": 0.1821, "loss_nan_ranks": 0, "loss_rank_avg": 0.20459748804569244, "step": 2200, "valid_targets_mean": 4523.4, "valid_targets_min": 1154 }, { "epoch": 3.5167464114832536, "grad_norm": 0.5005441651860468, "learning_rate": 2.3324918439269206e-05, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.21811363101005554, "step": 2205, "valid_targets_mean": 4844.4, "valid_targets_min": 961 }, { "epoch": 3.5247208931419456, "grad_norm": 0.43346313086997673, "learning_rate": 2.3246465133699024e-05, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.15447084605693817, "step": 2210, "valid_targets_mean": 4603.5, "valid_targets_min": 1367 }, { "epoch": 3.532695374800638, "grad_norm": 0.47292276496360025, "learning_rate": 2.31679604881443e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.17732763290405273, "step": 2215, "valid_targets_mean": 3960.4, "valid_targets_min": 1642 }, { "epoch": 3.5406698564593304, "grad_norm": 0.495679757867468, "learning_rate": 2.3089405744086823e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.21921885013580322, "step": 2220, "valid_targets_mean": 4405.0, "valid_targets_min": 1545 }, { "epoch": 3.5486443381180224, "grad_norm": 0.4778196917275496, "learning_rate": 2.3010802143800626e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.17508621513843536, "step": 2225, "valid_targets_mean": 4082.6, "valid_targets_min": 733 }, { "epoch": 3.5566188197767143, "grad_norm": 0.4115894050467132, "learning_rate": 2.2932150930332363e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.18152204155921936, "step": 2230, "valid_targets_mean": 5820.9, "valid_targets_min": 1092 }, { "epoch": 3.5645933014354068, "grad_norm": 0.47451933923829037, "learning_rate": 2.2853453347481635e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.1449630856513977, "step": 2235, "valid_targets_mean": 3705.7, "valid_targets_min": 1707 }, { "epoch": 3.5725677830940987, "grad_norm": 0.4246625993601654, "learning_rate": 2.277471063978137e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.16793304681777954, "step": 2240, "valid_targets_mean": 5003.7, "valid_targets_min": 1953 }, { "epoch": 3.580542264752791, "grad_norm": 0.39671974046040576, "learning_rate": 2.2695924052478065e-05, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.15611745417118073, "step": 2245, "valid_targets_mean": 6036.0, "valid_targets_min": 876 }, { "epoch": 3.588516746411483, "grad_norm": 0.4870061065232744, "learning_rate": 2.2617094831512167e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.18916553258895874, "step": 2250, "valid_targets_mean": 4665.1, "valid_targets_min": 279 }, { "epoch": 3.5964912280701755, "grad_norm": 0.42205864082695105, "learning_rate": 2.253822422349831e-05, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.14394357800483704, "step": 2255, "valid_targets_mean": 4616.1, "valid_targets_min": 1506 }, { "epoch": 3.6044657097288675, "grad_norm": 0.5077629191461961, "learning_rate": 2.2459313475705645e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.186385378241539, "step": 2260, "valid_targets_mean": 4445.6, "valid_targets_min": 1350 }, { "epoch": 3.61244019138756, "grad_norm": 0.5109160496433331, "learning_rate": 2.23803638360381e-05, "loss": 0.1676, "loss_nan_ranks": 0, "loss_rank_avg": 0.1869809627532959, "step": 2265, "valid_targets_mean": 4321.5, "valid_targets_min": 1637 }, { "epoch": 3.620414673046252, "grad_norm": 0.47044498703469384, "learning_rate": 2.2301376553014625e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.17290177941322327, "step": 2270, "valid_targets_mean": 4751.1, "valid_targets_min": 1507 }, { "epoch": 3.6283891547049443, "grad_norm": 0.4729512095272896, "learning_rate": 2.2222352875749493e-05, "loss": 0.1816, "loss_nan_ranks": 0, "loss_rank_avg": 0.16890928149223328, "step": 2275, "valid_targets_mean": 4695.2, "valid_targets_min": 449 }, { "epoch": 3.6363636363636362, "grad_norm": 0.49129927177444355, "learning_rate": 2.214329405393249e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.22857588529586792, "step": 2280, "valid_targets_mean": 5797.1, "valid_targets_min": 1477 }, { "epoch": 3.6443381180223287, "grad_norm": 0.5144669886043687, "learning_rate": 2.2064201337809212e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.17676298320293427, "step": 2285, "valid_targets_mean": 4023.9, "valid_targets_min": 1965 }, { "epoch": 3.6523125996810206, "grad_norm": 0.5205684042429719, "learning_rate": 2.1985075978161236e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.18539035320281982, "step": 2290, "valid_targets_mean": 3931.9, "valid_targets_min": 1260 }, { "epoch": 3.660287081339713, "grad_norm": 0.45299343870889275, "learning_rate": 2.1905919226286385e-05, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.1681886911392212, "step": 2295, "valid_targets_mean": 4429.4, "valid_targets_min": 1525 }, { "epoch": 3.668261562998405, "grad_norm": 0.4506347012164917, "learning_rate": 2.1826732333978924e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.16298139095306396, "step": 2300, "valid_targets_mean": 5305.1, "valid_targets_min": 1115 }, { "epoch": 3.6762360446570974, "grad_norm": 0.49361016290996385, "learning_rate": 2.1747516553509755e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.15665629506111145, "step": 2305, "valid_targets_mean": 3544.4, "valid_targets_min": 1180 }, { "epoch": 3.6842105263157894, "grad_norm": 0.5778205395291415, "learning_rate": 2.166827313760662e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.2410949170589447, "step": 2310, "valid_targets_mean": 4867.1, "valid_targets_min": 949 }, { "epoch": 3.692185007974482, "grad_norm": 0.4707485849572123, "learning_rate": 2.1589003339434292e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.16910578310489655, "step": 2315, "valid_targets_mean": 4868.1, "valid_targets_min": 1811 }, { "epoch": 3.7001594896331738, "grad_norm": 0.5270779646775441, "learning_rate": 2.150970841257476e-05, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.17331373691558838, "step": 2320, "valid_targets_mean": 3425.9, "valid_targets_min": 691 }, { "epoch": 3.708133971291866, "grad_norm": 0.4559801428274919, "learning_rate": 2.1430389611007393e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.16542251408100128, "step": 2325, "valid_targets_mean": 4824.6, "valid_targets_min": 1039 }, { "epoch": 3.716108452950558, "grad_norm": 0.39739881900048674, "learning_rate": 2.135104818908913e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.14475056529045105, "step": 2330, "valid_targets_mean": 4815.1, "valid_targets_min": 1431 }, { "epoch": 3.7240829346092506, "grad_norm": 0.46555703219656114, "learning_rate": 2.1271685401534617e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.16371889412403107, "step": 2335, "valid_targets_mean": 3977.3, "valid_targets_min": 1661 }, { "epoch": 3.7320574162679425, "grad_norm": 0.538529815559161, "learning_rate": 2.11923025033964e-05, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.17419461905956268, "step": 2340, "valid_targets_mean": 4204.9, "valid_targets_min": 1325 }, { "epoch": 3.740031897926635, "grad_norm": 0.4835471565226542, "learning_rate": 2.111290075004503e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.16316327452659607, "step": 2345, "valid_targets_mean": 4010.9, "valid_targets_min": 621 }, { "epoch": 3.748006379585327, "grad_norm": 0.474398046842084, "learning_rate": 2.103348139714925e-05, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.15339785814285278, "step": 2350, "valid_targets_mean": 4455.0, "valid_targets_min": 1738 }, { "epoch": 3.7559808612440193, "grad_norm": 0.5090815418316118, "learning_rate": 2.0954045700656126e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.17221853137016296, "step": 2355, "valid_targets_mean": 3577.1, "valid_targets_min": 1003 }, { "epoch": 3.7639553429027113, "grad_norm": 0.43326727747863436, "learning_rate": 2.0874594916771174e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.14630118012428284, "step": 2360, "valid_targets_mean": 4644.5, "valid_targets_min": 1902 }, { "epoch": 3.7719298245614032, "grad_norm": 0.4759734629916401, "learning_rate": 2.079513030193852e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.17981478571891785, "step": 2365, "valid_targets_mean": 4401.8, "valid_targets_min": 636 }, { "epoch": 3.7799043062200957, "grad_norm": 0.47047851791101014, "learning_rate": 2.071565311282099e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.17851416766643524, "step": 2370, "valid_targets_mean": 4240.1, "valid_targets_min": 1589 }, { "epoch": 3.787878787878788, "grad_norm": 0.5464081586672188, "learning_rate": 2.063616460628029e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.18592001497745514, "step": 2375, "valid_targets_mean": 4041.9, "valid_targets_min": 1807 }, { "epoch": 3.79585326953748, "grad_norm": 0.4464818206087508, "learning_rate": 2.0556666039357084e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.18792858719825745, "step": 2380, "valid_targets_mean": 4739.8, "valid_targets_min": 1157 }, { "epoch": 3.803827751196172, "grad_norm": 0.5041109661524343, "learning_rate": 2.047715866925113e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.1874503344297409, "step": 2385, "valid_targets_mean": 4454.7, "valid_targets_min": 1432 }, { "epoch": 3.8118022328548644, "grad_norm": 0.45113237417450835, "learning_rate": 2.0397643753301403e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.1641354113817215, "step": 2390, "valid_targets_mean": 5005.2, "valid_targets_min": 1886 }, { "epoch": 3.819776714513557, "grad_norm": 0.49530584534417454, "learning_rate": 2.0318122548966225e-05, "loss": 0.1705, "loss_nan_ranks": 0, "loss_rank_avg": 0.1944631189107895, "step": 2395, "valid_targets_mean": 4375.2, "valid_targets_min": 1665 }, { "epoch": 3.827751196172249, "grad_norm": 0.49543993336649245, "learning_rate": 2.0238596313803337e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.1980539858341217, "step": 2400, "valid_targets_mean": 4541.7, "valid_targets_min": 627 }, { "epoch": 3.8357256778309408, "grad_norm": 0.4254188193829258, "learning_rate": 2.015906630545005e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.15166829526424408, "step": 2405, "valid_targets_mean": 4715.5, "valid_targets_min": 2173 }, { "epoch": 3.843700159489633, "grad_norm": 0.4882032464005021, "learning_rate": 2.0079533781603352e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.19435849785804749, "step": 2410, "valid_targets_mean": 4388.9, "valid_targets_min": 531 }, { "epoch": 3.8516746411483256, "grad_norm": 0.5265806814763052, "learning_rate": 2e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.18883755803108215, "step": 2415, "valid_targets_mean": 3900.7, "valid_targets_min": 1194 }, { "epoch": 3.8596491228070176, "grad_norm": 0.4970672078467313, "learning_rate": 1.9920466218396655e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.14973965287208557, "step": 2420, "valid_targets_mean": 3951.0, "valid_targets_min": 1906 }, { "epoch": 3.8676236044657095, "grad_norm": 0.4485320461327396, "learning_rate": 1.9840933694549956e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.1715766191482544, "step": 2425, "valid_targets_mean": 4628.1, "valid_targets_min": 2325 }, { "epoch": 3.875598086124402, "grad_norm": 0.46144828607434146, "learning_rate": 1.976140368619667e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.1804232895374298, "step": 2430, "valid_targets_mean": 4036.7, "valid_targets_min": 1579 }, { "epoch": 3.8835725677830943, "grad_norm": 0.40935989183035376, "learning_rate": 1.9681877451033778e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.13349954783916473, "step": 2435, "valid_targets_mean": 4621.5, "valid_targets_min": 2387 }, { "epoch": 3.8915470494417863, "grad_norm": 0.5822879432451648, "learning_rate": 1.9602356246698597e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.17016389966011047, "step": 2440, "valid_targets_mean": 4279.2, "valid_targets_min": 1442 }, { "epoch": 3.8995215311004783, "grad_norm": 0.45662436879070906, "learning_rate": 1.9522841330748877e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.16033823788166046, "step": 2445, "valid_targets_mean": 4220.1, "valid_targets_min": 1598 }, { "epoch": 3.9074960127591707, "grad_norm": 0.48077089254158484, "learning_rate": 1.944333396064292e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.14935660362243652, "step": 2450, "valid_targets_mean": 3772.9, "valid_targets_min": 1647 }, { "epoch": 3.915470494417863, "grad_norm": 0.4244926540119392, "learning_rate": 1.936383539371971e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.14506709575653076, "step": 2455, "valid_targets_mean": 4454.8, "valid_targets_min": 1710 }, { "epoch": 3.923444976076555, "grad_norm": 0.4427100557851415, "learning_rate": 1.9284346887179016e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.15511883795261383, "step": 2460, "valid_targets_mean": 4552.0, "valid_targets_min": 1761 }, { "epoch": 3.931419457735247, "grad_norm": 0.47909923376130753, "learning_rate": 1.9204869698061493e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.15708695352077484, "step": 2465, "valid_targets_mean": 3728.4, "valid_targets_min": 1978 }, { "epoch": 3.9393939393939394, "grad_norm": 0.595539634060728, "learning_rate": 1.9125405083228833e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.16844023764133453, "step": 2470, "valid_targets_mean": 3325.6, "valid_targets_min": 1501 }, { "epoch": 3.9473684210526314, "grad_norm": 0.4533444186226723, "learning_rate": 1.9045954299343884e-05, "loss": 0.1677, "loss_nan_ranks": 0, "loss_rank_avg": 0.17140570282936096, "step": 2475, "valid_targets_mean": 4405.3, "valid_targets_min": 2264 }, { "epoch": 3.955342902711324, "grad_norm": 0.4595885145274142, "learning_rate": 1.896651860285076e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.16533583402633667, "step": 2480, "valid_targets_mean": 4279.9, "valid_targets_min": 1464 }, { "epoch": 3.963317384370016, "grad_norm": 0.45222684065372687, "learning_rate": 1.8887099249954976e-05, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.1614869087934494, "step": 2485, "valid_targets_mean": 4647.2, "valid_targets_min": 1192 }, { "epoch": 3.971291866028708, "grad_norm": 0.4725644857876905, "learning_rate": 1.8807697496603604e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.17880479991436005, "step": 2490, "valid_targets_mean": 4414.1, "valid_targets_min": 2303 }, { "epoch": 3.9792663476874, "grad_norm": 0.45652270717722077, "learning_rate": 1.8728314598465386e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.1617339849472046, "step": 2495, "valid_targets_mean": 4411.3, "valid_targets_min": 1827 }, { "epoch": 3.9872408293460926, "grad_norm": 0.5151368519656011, "learning_rate": 1.8648951810910878e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.15443146228790283, "step": 2500, "valid_targets_mean": 3280.9, "valid_targets_min": 1115 }, { "epoch": 3.9952153110047846, "grad_norm": 0.47470285857166405, "learning_rate": 1.856961038899261e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.15671250224113464, "step": 2505, "valid_targets_mean": 4404.2, "valid_targets_min": 1362 }, { "epoch": 4.003189792663477, "grad_norm": 0.4899880225039297, "learning_rate": 1.849029158742525e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.15422114729881287, "step": 2510, "valid_targets_mean": 3694.6, "valid_targets_min": 1506 }, { "epoch": 4.011164274322169, "grad_norm": 0.4634790318267732, "learning_rate": 1.8410996660565714e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.1345663070678711, "step": 2515, "valid_targets_mean": 4565.0, "valid_targets_min": 2064 }, { "epoch": 4.019138755980861, "grad_norm": 0.5042108705454043, "learning_rate": 1.8331726862393385e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.16057871282100677, "step": 2520, "valid_targets_mean": 4519.1, "valid_targets_min": 1717 }, { "epoch": 4.027113237639553, "grad_norm": 0.4844796153115308, "learning_rate": 1.8252483446490245e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.17984318733215332, "step": 2525, "valid_targets_mean": 4351.6, "valid_targets_min": 1530 }, { "epoch": 4.035087719298246, "grad_norm": 0.45265367637894693, "learning_rate": 1.8173267666021075e-05, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.16487132012844086, "step": 2530, "valid_targets_mean": 5113.8, "valid_targets_min": 1797 }, { "epoch": 4.043062200956938, "grad_norm": 0.5341917502431222, "learning_rate": 1.8094080773713615e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1509234458208084, "step": 2535, "valid_targets_mean": 3534.0, "valid_targets_min": 1379 }, { "epoch": 4.05103668261563, "grad_norm": 0.5250909339903316, "learning_rate": 1.8014924021838774e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.1545257717370987, "step": 2540, "valid_targets_mean": 3596.7, "valid_targets_min": 524 }, { "epoch": 4.059011164274322, "grad_norm": 0.4771773683854749, "learning_rate": 1.7935798662190798e-05, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.14937272667884827, "step": 2545, "valid_targets_mean": 4365.2, "valid_targets_min": 1184 }, { "epoch": 4.0669856459330145, "grad_norm": 0.4378658709624504, "learning_rate": 1.785670594606752e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.16334344446659088, "step": 2550, "valid_targets_mean": 4933.5, "valid_targets_min": 1487 }, { "epoch": 4.074960127591707, "grad_norm": 0.5408025302725352, "learning_rate": 1.777764712425052e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.1732405722141266, "step": 2555, "valid_targets_mean": 3627.1, "valid_targets_min": 317 }, { "epoch": 4.082934609250398, "grad_norm": 0.507827216712315, "learning_rate": 1.7698623446985378e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.17435893416404724, "step": 2560, "valid_targets_mean": 4402.0, "valid_targets_min": 1466 }, { "epoch": 4.090909090909091, "grad_norm": 0.4951560011181849, "learning_rate": 1.7619636163961907e-05, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.14189505577087402, "step": 2565, "valid_targets_mean": 4492.1, "valid_targets_min": 1893 }, { "epoch": 4.098883572567783, "grad_norm": 0.48077419738077953, "learning_rate": 1.754068652429436e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.14747288823127747, "step": 2570, "valid_targets_mean": 4816.2, "valid_targets_min": 1338 }, { "epoch": 4.106858054226476, "grad_norm": 0.48118894084351693, "learning_rate": 1.74617757765017e-05, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.15636608004570007, "step": 2575, "valid_targets_mean": 3937.2, "valid_targets_min": 385 }, { "epoch": 4.114832535885167, "grad_norm": 0.46253282549841945, "learning_rate": 1.738290516848784e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.13956312835216522, "step": 2580, "valid_targets_mean": 5142.4, "valid_targets_min": 1541 }, { "epoch": 4.12280701754386, "grad_norm": 0.4840910750690081, "learning_rate": 1.730407594752194e-05, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.18448464572429657, "step": 2585, "valid_targets_mean": 4904.5, "valid_targets_min": 610 }, { "epoch": 4.130781499202552, "grad_norm": 0.46098830201420854, "learning_rate": 1.722528936021864e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.16083885729312897, "step": 2590, "valid_targets_mean": 4776.6, "valid_targets_min": 1693 }, { "epoch": 4.138755980861244, "grad_norm": 0.4509630939011778, "learning_rate": 1.714654665251837e-05, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.1386050283908844, "step": 2595, "valid_targets_mean": 4520.9, "valid_targets_min": 430 }, { "epoch": 4.146730462519936, "grad_norm": 0.5078283848796444, "learning_rate": 1.7067849069667644e-05, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.14574451744556427, "step": 2600, "valid_targets_mean": 3890.8, "valid_targets_min": 1673 }, { "epoch": 4.154704944178628, "grad_norm": 0.5425342658424712, "learning_rate": 1.6989197856199377e-05, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.14644119143486023, "step": 2605, "valid_targets_mean": 4598.1, "valid_targets_min": 599 }, { "epoch": 4.162679425837321, "grad_norm": 0.6814195331715653, "learning_rate": 1.6910594255913177e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.16274163126945496, "step": 2610, "valid_targets_mean": 3990.4, "valid_targets_min": 1780 }, { "epoch": 4.170653907496013, "grad_norm": 0.47901972456824515, "learning_rate": 1.6832039511855702e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.1412867307662964, "step": 2615, "valid_targets_mean": 4189.2, "valid_targets_min": 1917 }, { "epoch": 4.178628389154705, "grad_norm": 0.47380491777234185, "learning_rate": 1.6753534866300983e-05, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.16598361730575562, "step": 2620, "valid_targets_mean": 4522.2, "valid_targets_min": 2215 }, { "epoch": 4.186602870813397, "grad_norm": 0.4623200429689346, "learning_rate": 1.6675081560730804e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.1583814024925232, "step": 2625, "valid_targets_mean": 4811.9, "valid_targets_min": 484 }, { "epoch": 4.1945773524720895, "grad_norm": 0.4639372494986275, "learning_rate": 1.6596680835815024e-05, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.1427120864391327, "step": 2630, "valid_targets_mean": 4565.5, "valid_targets_min": 1893 }, { "epoch": 4.202551834130782, "grad_norm": 0.5202843864845481, "learning_rate": 1.651833393139201e-05, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.16338421404361725, "step": 2635, "valid_targets_mean": 4019.4, "valid_targets_min": 1725 }, { "epoch": 4.2105263157894735, "grad_norm": 0.5235868701035974, "learning_rate": 1.6440042086449e-05, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.15927179157733917, "step": 2640, "valid_targets_mean": 4495.2, "valid_targets_min": 951 }, { "epoch": 4.218500797448166, "grad_norm": 0.44531838825532105, "learning_rate": 1.6361806539102508e-05, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.1629904806613922, "step": 2645, "valid_targets_mean": 5343.2, "valid_targets_min": 867 }, { "epoch": 4.226475279106858, "grad_norm": 0.4251988292309876, "learning_rate": 1.628362852657876e-05, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.13012798130512238, "step": 2650, "valid_targets_mean": 5094.8, "valid_targets_min": 339 }, { "epoch": 4.23444976076555, "grad_norm": 0.46887168314695904, "learning_rate": 1.620550928519411e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.15908288955688477, "step": 2655, "valid_targets_mean": 4939.9, "valid_targets_min": 2028 }, { "epoch": 4.242424242424242, "grad_norm": 0.5098973831313105, "learning_rate": 1.612745005033551e-05, "loss": 0.1407, "loss_nan_ranks": 0, "loss_rank_avg": 0.1334664523601532, "step": 2660, "valid_targets_mean": 4081.6, "valid_targets_min": 1556 }, { "epoch": 4.250398724082935, "grad_norm": 0.46808481227323445, "learning_rate": 1.6049452056440948e-05, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.15534178912639618, "step": 2665, "valid_targets_mean": 4708.3, "valid_targets_min": 2017 }, { "epoch": 4.258373205741627, "grad_norm": 0.4875790771425733, "learning_rate": 1.597151653697995e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.12777553498744965, "step": 2670, "valid_targets_mean": 4391.9, "valid_targets_min": 278 }, { "epoch": 4.266347687400319, "grad_norm": 0.47842605994377785, "learning_rate": 1.5893644724434066e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.15351736545562744, "step": 2675, "valid_targets_mean": 4784.4, "valid_targets_min": 440 }, { "epoch": 4.274322169059011, "grad_norm": 0.4798020507410421, "learning_rate": 1.581583785027736e-05, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.12768876552581787, "step": 2680, "valid_targets_mean": 4058.9, "valid_targets_min": 1533 }, { "epoch": 4.282296650717703, "grad_norm": 0.4890971139697186, "learning_rate": 1.5738097144956976e-05, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.1449412852525711, "step": 2685, "valid_targets_mean": 4657.4, "valid_targets_min": 2325 }, { "epoch": 4.290271132376396, "grad_norm": 0.5461562109497161, "learning_rate": 1.566042383787364e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.1455443799495697, "step": 2690, "valid_targets_mean": 3337.1, "valid_targets_min": 1529 }, { "epoch": 4.298245614035087, "grad_norm": 0.46410280159872597, "learning_rate": 1.558281915736224e-05, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.17412641644477844, "step": 2695, "valid_targets_mean": 4995.4, "valid_targets_min": 2412 }, { "epoch": 4.30622009569378, "grad_norm": 0.5330477782573131, "learning_rate": 1.550528433067239e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.17384281754493713, "step": 2700, "valid_targets_mean": 4280.9, "valid_targets_min": 396 }, { "epoch": 4.314194577352472, "grad_norm": 0.4993801267582135, "learning_rate": 1.5427820583949054e-05, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.1459612250328064, "step": 2705, "valid_targets_mean": 3986.2, "valid_targets_min": 1182 }, { "epoch": 4.3221690590111645, "grad_norm": 0.5020099422312442, "learning_rate": 1.5350429142213075e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.24648582935333252, "step": 2710, "valid_targets_mean": 6519.9, "valid_targets_min": 2514 }, { "epoch": 4.330143540669856, "grad_norm": 0.544133437246787, "learning_rate": 1.5273111229341907e-05, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.13865166902542114, "step": 2715, "valid_targets_mean": 4138.2, "valid_targets_min": 1620 }, { "epoch": 4.3381180223285485, "grad_norm": 0.5733519120938113, "learning_rate": 1.5195868068050185e-05, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.16256359219551086, "step": 2720, "valid_targets_mean": 3474.5, "valid_targets_min": 1836 }, { "epoch": 4.346092503987241, "grad_norm": 0.4716089878439407, "learning_rate": 1.5118700879870426e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.17399930953979492, "step": 2725, "valid_targets_mean": 5075.4, "valid_targets_min": 1690 }, { "epoch": 4.354066985645933, "grad_norm": 0.4209893499367196, "learning_rate": 1.5041610885133681e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.12980689108371735, "step": 2730, "valid_targets_mean": 5178.8, "valid_targets_min": 1476 }, { "epoch": 4.362041467304625, "grad_norm": 0.5515449457928758, "learning_rate": 1.496459930295028e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.16415995359420776, "step": 2735, "valid_targets_mean": 3561.8, "valid_targets_min": 1387 }, { "epoch": 4.370015948963317, "grad_norm": 0.5109525433836578, "learning_rate": 1.4887667351190508e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.18121805787086487, "step": 2740, "valid_targets_mean": 4864.2, "valid_targets_min": 1895 }, { "epoch": 4.37799043062201, "grad_norm": 0.5037396991640567, "learning_rate": 1.4810816246465374e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1513875126838684, "step": 2745, "valid_targets_mean": 4453.0, "valid_targets_min": 907 }, { "epoch": 4.385964912280702, "grad_norm": 0.4934516813748904, "learning_rate": 1.4734047204107358e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.1657409369945526, "step": 2750, "valid_targets_mean": 4435.2, "valid_targets_min": 1760 }, { "epoch": 4.393939393939394, "grad_norm": 0.4417129235128675, "learning_rate": 1.4657361438151192e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.13217982649803162, "step": 2755, "valid_targets_mean": 4826.6, "valid_targets_min": 1233 }, { "epoch": 4.401913875598086, "grad_norm": 0.572380140644963, "learning_rate": 1.458076016131468e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.1532914787530899, "step": 2760, "valid_targets_mean": 3163.1, "valid_targets_min": 1432 }, { "epoch": 4.409888357256778, "grad_norm": 0.5850789870287324, "learning_rate": 1.4504244584979494e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.17484025657176971, "step": 2765, "valid_targets_mean": 3527.3, "valid_targets_min": 759 }, { "epoch": 4.417862838915471, "grad_norm": 0.5345615763784187, "learning_rate": 1.442781591917203e-05, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.17847514152526855, "step": 2770, "valid_targets_mean": 3803.9, "valid_targets_min": 288 }, { "epoch": 4.425837320574162, "grad_norm": 0.49877751842401186, "learning_rate": 1.4351475372544262e-05, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.14222899079322815, "step": 2775, "valid_targets_mean": 4224.1, "valid_targets_min": 2213 }, { "epoch": 4.433811802232855, "grad_norm": 0.5127528633812499, "learning_rate": 1.4275224152354658e-05, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.14961972832679749, "step": 2780, "valid_targets_mean": 3905.4, "valid_targets_min": 1318 }, { "epoch": 4.441786283891547, "grad_norm": 0.48555317932260317, "learning_rate": 1.4199063464449047e-05, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.17323818802833557, "step": 2785, "valid_targets_mean": 4936.8, "valid_targets_min": 1178 }, { "epoch": 4.44976076555024, "grad_norm": 0.46902570337103017, "learning_rate": 1.4122994513241587e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.14024415612220764, "step": 2790, "valid_targets_mean": 4709.8, "valid_targets_min": 1527 }, { "epoch": 4.457735247208931, "grad_norm": 0.5286358404792354, "learning_rate": 1.4047018501695677e-05, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.14404083788394928, "step": 2795, "valid_targets_mean": 4177.2, "valid_targets_min": 949 }, { "epoch": 4.4657097288676235, "grad_norm": 0.5835959583862976, "learning_rate": 1.3971136631304978e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.16053429245948792, "step": 2800, "valid_targets_mean": 4404.4, "valid_targets_min": 635 }, { "epoch": 4.473684210526316, "grad_norm": 0.5087390219672198, "learning_rate": 1.3895350102074386e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.154604971408844, "step": 2805, "valid_targets_mean": 4275.4, "valid_targets_min": 311 }, { "epoch": 4.481658692185008, "grad_norm": 0.4701979924293451, "learning_rate": 1.3819660112501054e-05, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.16549868881702423, "step": 2810, "valid_targets_mean": 4737.1, "valid_targets_min": 860 }, { "epoch": 4.4896331738437, "grad_norm": 0.4801457713814075, "learning_rate": 1.3744067859555461e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.14757005870342255, "step": 2815, "valid_targets_mean": 4083.9, "valid_targets_min": 1011 }, { "epoch": 4.497607655502392, "grad_norm": 0.4327428514767497, "learning_rate": 1.3668574538662451e-05, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.16689707338809967, "step": 2820, "valid_targets_mean": 5532.1, "valid_targets_min": 1640 }, { "epoch": 4.505582137161085, "grad_norm": 0.48232554647060877, "learning_rate": 1.3593181343682353e-05, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.1623343527317047, "step": 2825, "valid_targets_mean": 4389.2, "valid_targets_min": 815 }, { "epoch": 4.513556618819777, "grad_norm": 0.46842062004881196, "learning_rate": 1.3517889466892085e-05, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.16388767957687378, "step": 2830, "valid_targets_mean": 4568.9, "valid_targets_min": 1589 }, { "epoch": 4.521531100478469, "grad_norm": 0.5316043989251976, "learning_rate": 1.3442700098966326e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.13952653110027313, "step": 2835, "valid_targets_mean": 4084.7, "valid_targets_min": 1625 }, { "epoch": 4.529505582137161, "grad_norm": 0.6131005374748497, "learning_rate": 1.3367614428958646e-05, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.1712581217288971, "step": 2840, "valid_targets_mean": 4815.7, "valid_targets_min": 738 }, { "epoch": 4.5374800637958534, "grad_norm": 0.511066316660687, "learning_rate": 1.3292633644282735e-05, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.14669950306415558, "step": 2845, "valid_targets_mean": 3795.1, "valid_targets_min": 811 }, { "epoch": 4.545454545454545, "grad_norm": 0.44495333907690426, "learning_rate": 1.3217758930693608e-05, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.14287234842777252, "step": 2850, "valid_targets_mean": 4819.1, "valid_targets_min": 1363 }, { "epoch": 4.553429027113237, "grad_norm": 0.4803993591600635, "learning_rate": 1.314299147226887e-05, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.1529885232448578, "step": 2855, "valid_targets_mean": 4219.8, "valid_targets_min": 1637 }, { "epoch": 4.56140350877193, "grad_norm": 0.534456680714764, "learning_rate": 1.3068332451389969e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.18377503752708435, "step": 2860, "valid_targets_mean": 4056.7, "valid_targets_min": 1252 }, { "epoch": 4.569377990430622, "grad_norm": 0.5715320414560933, "learning_rate": 1.2993783048723515e-05, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.14145058393478394, "step": 2865, "valid_targets_mean": 2752.7, "valid_targets_min": 634 }, { "epoch": 4.577352472089315, "grad_norm": 0.490531412083574, "learning_rate": 1.2919344443202602e-05, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.13521042466163635, "step": 2870, "valid_targets_mean": 3873.3, "valid_targets_min": 1432 }, { "epoch": 4.585326953748006, "grad_norm": 0.4960382986414196, "learning_rate": 1.2845017812008158e-05, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.13930058479309082, "step": 2875, "valid_targets_mean": 4009.3, "valid_targets_min": 1653 }, { "epoch": 4.5933014354066986, "grad_norm": 0.45490882957573536, "learning_rate": 1.277080433055034e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.16347578167915344, "step": 2880, "valid_targets_mean": 4968.5, "valid_targets_min": 2414 }, { "epoch": 4.601275917065391, "grad_norm": 0.49053829703055934, "learning_rate": 1.2696705172449944e-05, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.17954492568969727, "step": 2885, "valid_targets_mean": 4561.9, "valid_targets_min": 937 }, { "epoch": 4.6092503987240825, "grad_norm": 0.49085289338663335, "learning_rate": 1.2622721509519846e-05, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.14600206911563873, "step": 2890, "valid_targets_mean": 4638.7, "valid_targets_min": 1362 }, { "epoch": 4.617224880382775, "grad_norm": 0.4440863342043673, "learning_rate": 1.2548854511746461e-05, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.1403721123933792, "step": 2895, "valid_targets_mean": 4791.0, "valid_targets_min": 1727 }, { "epoch": 4.625199362041467, "grad_norm": 0.4290742285274184, "learning_rate": 1.247510534727125e-05, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.14262665808200836, "step": 2900, "valid_targets_mean": 4883.1, "valid_targets_min": 1800 }, { "epoch": 4.63317384370016, "grad_norm": 0.48233893104018916, "learning_rate": 1.240147518237224e-05, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.1487930715084076, "step": 2905, "valid_targets_mean": 4299.9, "valid_targets_min": 720 }, { "epoch": 4.641148325358852, "grad_norm": 0.49119003845245157, "learning_rate": 1.2327965181445593e-05, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.15125395357608795, "step": 2910, "valid_targets_mean": 4226.4, "valid_targets_min": 412 }, { "epoch": 4.649122807017544, "grad_norm": 0.5514755092195026, "learning_rate": 1.2254576506987182e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.20615872740745544, "step": 2915, "valid_targets_mean": 3670.6, "valid_targets_min": 287 }, { "epoch": 4.657097288676236, "grad_norm": 0.4836449422046179, "learning_rate": 1.21813103195742e-05, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.1694192886352539, "step": 2920, "valid_targets_mean": 4252.4, "valid_targets_min": 1091 }, { "epoch": 4.6650717703349285, "grad_norm": 0.5227248323901297, "learning_rate": 1.2108167777846815e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.1699051558971405, "step": 2925, "valid_targets_mean": 4134.8, "valid_targets_min": 716 }, { "epoch": 4.67304625199362, "grad_norm": 0.4660658722544293, "learning_rate": 1.203515003848987e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.15797314047813416, "step": 2930, "valid_targets_mean": 4928.8, "valid_targets_min": 1582 }, { "epoch": 4.681020733652312, "grad_norm": 0.6376936646502744, "learning_rate": 1.1962258256214545e-05, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.14403367042541504, "step": 2935, "valid_targets_mean": 3905.9, "valid_targets_min": 766 }, { "epoch": 4.688995215311005, "grad_norm": 0.4353897798410051, "learning_rate": 1.1889493583740124e-05, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.17408692836761475, "step": 2940, "valid_targets_mean": 5558.9, "valid_targets_min": 1941 }, { "epoch": 4.696969696969697, "grad_norm": 0.5138974967310053, "learning_rate": 1.1816857171775767e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.18357430398464203, "step": 2945, "valid_targets_mean": 4750.4, "valid_targets_min": 2115 }, { "epoch": 4.70494417862839, "grad_norm": 0.5058909214087609, "learning_rate": 1.1744350169002308e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.1348288655281067, "step": 2950, "valid_targets_mean": 3484.4, "valid_targets_min": 1397 }, { "epoch": 4.712918660287081, "grad_norm": 0.49111490538221414, "learning_rate": 1.1671973722054077e-05, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.1464148610830307, "step": 2955, "valid_targets_mean": 4043.7, "valid_targets_min": 1224 }, { "epoch": 4.720893141945774, "grad_norm": 0.551693194914327, "learning_rate": 1.159972897550079e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.18348699808120728, "step": 2960, "valid_targets_mean": 3622.8, "valid_targets_min": 1035 }, { "epoch": 4.728867623604466, "grad_norm": 0.48537829529174753, "learning_rate": 1.1527617071829447e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.12741652131080627, "step": 2965, "valid_targets_mean": 4625.4, "valid_targets_min": 1135 }, { "epoch": 4.7368421052631575, "grad_norm": 0.5167280393109993, "learning_rate": 1.145563915142622e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.1738428771495819, "step": 2970, "valid_targets_mean": 4045.1, "valid_targets_min": 1934 }, { "epoch": 4.74481658692185, "grad_norm": 0.46590567459493326, "learning_rate": 1.1383796352558489e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.1390235275030136, "step": 2975, "valid_targets_mean": 4557.5, "valid_targets_min": 377 }, { "epoch": 4.752791068580542, "grad_norm": 0.45132284661428174, "learning_rate": 1.1312089811356803e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.14673513174057007, "step": 2980, "valid_targets_mean": 4593.8, "valid_targets_min": 1424 }, { "epoch": 4.760765550239235, "grad_norm": 0.5190466302755331, "learning_rate": 1.1240520661796882e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.15376582741737366, "step": 2985, "valid_targets_mean": 3806.1, "valid_targets_min": 858 }, { "epoch": 4.768740031897926, "grad_norm": 0.48812938806701267, "learning_rate": 1.1169090035681772e-05, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.14771802723407745, "step": 2990, "valid_targets_mean": 4181.2, "valid_targets_min": 1647 }, { "epoch": 4.776714513556619, "grad_norm": 0.5183768837688895, "learning_rate": 1.109779906262383e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.17195749282836914, "step": 2995, "valid_targets_mean": 4079.7, "valid_targets_min": 1639 }, { "epoch": 4.784688995215311, "grad_norm": 0.7151241582202109, "learning_rate": 1.102664887002698e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.1477375328540802, "step": 3000, "valid_targets_mean": 3195.2, "valid_targets_min": 1061 }, { "epoch": 4.7926634768740035, "grad_norm": 0.5340265757646905, "learning_rate": 1.0955640583068802e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.15154235064983368, "step": 3005, "valid_targets_mean": 3735.8, "valid_targets_min": 1180 }, { "epoch": 4.800637958532695, "grad_norm": 0.5191731924116039, "learning_rate": 1.0884775324682755e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.15678870677947998, "step": 3010, "valid_targets_mean": 4505.0, "valid_targets_min": 1436 }, { "epoch": 4.8086124401913874, "grad_norm": 0.577257395101735, "learning_rate": 1.081405421554044e-05, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.15045231580734253, "step": 3015, "valid_targets_mean": 3325.9, "valid_targets_min": 349 }, { "epoch": 4.81658692185008, "grad_norm": 0.47952301871619524, "learning_rate": 1.074347837403387e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.15675462782382965, "step": 3020, "valid_targets_mean": 4365.0, "valid_targets_min": 2000 }, { "epoch": 4.824561403508772, "grad_norm": 0.5171197959497484, "learning_rate": 1.067304891625776e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.21107935905456543, "step": 3025, "valid_targets_mean": 4033.0, "valid_targets_min": 1431 }, { "epoch": 4.832535885167464, "grad_norm": 0.457639324980029, "learning_rate": 1.0602766955991913e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.1720237135887146, "step": 3030, "valid_targets_mean": 4731.8, "valid_targets_min": 1708 }, { "epoch": 4.840510366826156, "grad_norm": 0.48700471070095636, "learning_rate": 1.053263360468358e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.14990770816802979, "step": 3035, "valid_targets_mean": 4321.4, "valid_targets_min": 271 }, { "epoch": 4.848484848484849, "grad_norm": 0.4333197612254627, "learning_rate": 1.0462649971429884e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.14838045835494995, "step": 3040, "valid_targets_mean": 5209.8, "valid_targets_min": 1739 }, { "epoch": 4.856459330143541, "grad_norm": 0.4874500871691921, "learning_rate": 1.0392817162960304e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.13294383883476257, "step": 3045, "valid_targets_mean": 4401.8, "valid_targets_min": 907 }, { "epoch": 4.8644338118022326, "grad_norm": 0.5503368290230514, "learning_rate": 1.0323136283619167e-05, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.18634894490242004, "step": 3050, "valid_targets_mean": 3853.9, "valid_targets_min": 2069 }, { "epoch": 4.872408293460925, "grad_norm": 0.5438858738387928, "learning_rate": 1.0253608435348136e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.17999961972236633, "step": 3055, "valid_targets_mean": 4998.1, "valid_targets_min": 1754 }, { "epoch": 4.880382775119617, "grad_norm": 0.484007746641252, "learning_rate": 1.0184234717668867e-05, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.14526879787445068, "step": 3060, "valid_targets_mean": 4370.1, "valid_targets_min": 2135 }, { "epoch": 4.88835725677831, "grad_norm": 0.4798298193869541, "learning_rate": 1.0115016227665544e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.17290471494197845, "step": 3065, "valid_targets_mean": 4554.9, "valid_targets_min": 690 }, { "epoch": 4.896331738437001, "grad_norm": 0.4847848102732291, "learning_rate": 1.0045954059967577e-05, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.1566402018070221, "step": 3070, "valid_targets_mean": 4250.6, "valid_targets_min": 1662 }, { "epoch": 4.904306220095694, "grad_norm": 0.5079181491087512, "learning_rate": 9.977049306732287e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.15510109066963196, "step": 3075, "valid_targets_mean": 4287.0, "valid_targets_min": 1349 }, { "epoch": 4.912280701754386, "grad_norm": 0.49369228412711796, "learning_rate": 9.908303057627591e-06, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.1516781747341156, "step": 3080, "valid_targets_mean": 4807.1, "valid_targets_min": 1399 }, { "epoch": 4.920255183413078, "grad_norm": 0.46206631563701656, "learning_rate": 9.83971639981484e-06, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.15620173513889313, "step": 3085, "valid_targets_mean": 4509.9, "valid_targets_min": 1755 }, { "epoch": 4.92822966507177, "grad_norm": 0.4764073964647667, "learning_rate": 9.771290417931559e-06, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.14277634024620056, "step": 3090, "valid_targets_mean": 4633.9, "valid_targets_min": 540 }, { "epoch": 4.9362041467304625, "grad_norm": 0.499728819601026, "learning_rate": 9.703026194074342e-06, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.14103826880455017, "step": 3095, "valid_targets_mean": 4783.8, "valid_targets_min": 1889 }, { "epoch": 4.944178628389155, "grad_norm": 0.5030379720704173, "learning_rate": 9.634924807781729e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.18518777191638947, "step": 3100, "valid_targets_mean": 4487.1, "valid_targets_min": 1345 }, { "epoch": 4.952153110047847, "grad_norm": 0.5312971046827829, "learning_rate": 9.566987336017102e-06, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.13996370136737823, "step": 3105, "valid_targets_mean": 3201.3, "valid_targets_min": 1367 }, { "epoch": 4.960127591706539, "grad_norm": 0.47987309157405533, "learning_rate": 9.499214853151699e-06, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.142959326505661, "step": 3110, "valid_targets_mean": 4422.2, "valid_targets_min": 1032 }, { "epoch": 4.968102073365231, "grad_norm": 0.5664816415312744, "learning_rate": 9.431608430947619e-06, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.176031231880188, "step": 3115, "valid_targets_mean": 4770.7, "valid_targets_min": 891 }, { "epoch": 4.976076555023924, "grad_norm": 0.5518137212422529, "learning_rate": 9.364169138540805e-06, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.15234243869781494, "step": 3120, "valid_targets_mean": 4083.6, "valid_targets_min": 1519 }, { "epoch": 4.984051036682615, "grad_norm": 0.4682479995624355, "learning_rate": 9.296898042424237e-06, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.16865205764770508, "step": 3125, "valid_targets_mean": 4818.3, "valid_targets_min": 1142 }, { "epoch": 4.992025518341308, "grad_norm": 0.5040455659035196, "learning_rate": 9.229796206431015e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.14097434282302856, "step": 3130, "valid_targets_mean": 4541.0, "valid_targets_min": 1290 }, { "epoch": 5.0, "grad_norm": 0.47913131975592566, "learning_rate": 9.162864691717513e-06, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.1694181263446808, "step": 3135, "valid_targets_mean": 4800.7, "valid_targets_min": 1983 }, { "epoch": 5.007974481658692, "grad_norm": 0.4631690140133372, "learning_rate": 9.096104556746654e-06, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.1334855705499649, "step": 3140, "valid_targets_mean": 4212.7, "valid_targets_min": 1470 }, { "epoch": 5.015948963317384, "grad_norm": 0.4738719091728486, "learning_rate": 9.029516857271115e-06, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.15238399803638458, "step": 3145, "valid_targets_mean": 4365.6, "valid_targets_min": 861 }, { "epoch": 5.023923444976076, "grad_norm": 0.5490118882632362, "learning_rate": 8.963102646316677e-06, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.1590614765882492, "step": 3150, "valid_targets_mean": 3971.9, "valid_targets_min": 1032 }, { "epoch": 5.031897926634769, "grad_norm": 0.5723827642772381, "learning_rate": 8.896862974165553e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.1540474146604538, "step": 3155, "valid_targets_mean": 3627.2, "valid_targets_min": 1479 }, { "epoch": 5.039872408293461, "grad_norm": 0.47302389032511105, "learning_rate": 8.830798888339756e-06, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.14463520050048828, "step": 3160, "valid_targets_mean": 4906.4, "valid_targets_min": 1707 }, { "epoch": 5.047846889952153, "grad_norm": 0.5469416912728198, "learning_rate": 8.764911433584581e-06, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.1377723217010498, "step": 3165, "valid_targets_mean": 3464.6, "valid_targets_min": 578 }, { "epoch": 5.055821371610845, "grad_norm": 0.5582713551464368, "learning_rate": 8.699201651852056e-06, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.14744654297828674, "step": 3170, "valid_targets_mean": 4384.8, "valid_targets_min": 455 }, { "epoch": 5.0637958532695375, "grad_norm": 0.4525826677728015, "learning_rate": 8.633670582284446e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.12246271222829819, "step": 3175, "valid_targets_mean": 5568.0, "valid_targets_min": 1686 }, { "epoch": 5.07177033492823, "grad_norm": 0.4802895756565889, "learning_rate": 8.56831926119787e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.13796019554138184, "step": 3180, "valid_targets_mean": 4717.9, "valid_targets_min": 883 }, { "epoch": 5.0797448165869215, "grad_norm": 0.47933543045230076, "learning_rate": 8.503148722065851e-06, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.1501651108264923, "step": 3185, "valid_targets_mean": 4850.2, "valid_targets_min": 792 }, { "epoch": 5.087719298245614, "grad_norm": 0.46167193488495856, "learning_rate": 8.43815999550303e-06, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.17034366726875305, "step": 3190, "valid_targets_mean": 5809.8, "valid_targets_min": 2272 }, { "epoch": 5.095693779904306, "grad_norm": 0.5147068478030644, "learning_rate": 8.373354109248842e-06, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.13025915622711182, "step": 3195, "valid_targets_mean": 3514.9, "valid_targets_min": 1532 }, { "epoch": 5.103668261562999, "grad_norm": 0.4918615867478781, "learning_rate": 8.308732088151245e-06, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.16296672821044922, "step": 3200, "valid_targets_mean": 5018.5, "valid_targets_min": 1439 }, { "epoch": 5.11164274322169, "grad_norm": 0.5788923126986796, "learning_rate": 8.24429495415054e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.1460484266281128, "step": 3205, "valid_targets_mean": 4154.6, "valid_targets_min": 670 }, { "epoch": 5.119617224880383, "grad_norm": 0.4553069456977529, "learning_rate": 8.180043726263216e-06, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.12702570855617523, "step": 3210, "valid_targets_mean": 4684.9, "valid_targets_min": 2310 }, { "epoch": 5.127591706539075, "grad_norm": 0.5218901188519967, "learning_rate": 8.115979420565794e-06, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.14124715328216553, "step": 3215, "valid_targets_mean": 3825.7, "valid_targets_min": 1939 }, { "epoch": 5.1355661881977674, "grad_norm": 0.455006451357129, "learning_rate": 8.052103050178806e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.13781721889972687, "step": 3220, "valid_targets_mean": 4437.4, "valid_targets_min": 1007 }, { "epoch": 5.143540669856459, "grad_norm": 0.5047251677784329, "learning_rate": 7.988415625250755e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.14169715344905853, "step": 3225, "valid_targets_mean": 3893.2, "valid_targets_min": 1632 }, { "epoch": 5.151515151515151, "grad_norm": 0.48563253677866414, "learning_rate": 7.924918152942117e-06, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.13769680261611938, "step": 3230, "valid_targets_mean": 4708.1, "valid_targets_min": 2084 }, { "epoch": 5.159489633173844, "grad_norm": 0.49252720325100796, "learning_rate": 7.861611637409462e-06, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.1714155673980713, "step": 3235, "valid_targets_mean": 4988.3, "valid_targets_min": 1499 }, { "epoch": 5.167464114832536, "grad_norm": 0.564418000148086, "learning_rate": 7.798497079789513e-06, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.14852869510650635, "step": 3240, "valid_targets_mean": 3508.2, "valid_targets_min": 1539 }, { "epoch": 5.175438596491228, "grad_norm": 0.5346686667466659, "learning_rate": 7.735575478183381e-06, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.15654098987579346, "step": 3245, "valid_targets_mean": 4420.9, "valid_targets_min": 1403 }, { "epoch": 5.18341307814992, "grad_norm": 0.5129242426435193, "learning_rate": 7.672847827640735e-06, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.1257268786430359, "step": 3250, "valid_targets_mean": 3798.2, "valid_targets_min": 632 }, { "epoch": 5.1913875598086126, "grad_norm": 0.5278462460463896, "learning_rate": 7.610315120144067e-06, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.1487414836883545, "step": 3255, "valid_targets_mean": 3692.8, "valid_targets_min": 1770 }, { "epoch": 5.199362041467305, "grad_norm": 0.5164937797343533, "learning_rate": 7.5479783445930414e-06, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.14907556772232056, "step": 3260, "valid_targets_mean": 4389.5, "valid_targets_min": 1326 }, { "epoch": 5.2073365231259965, "grad_norm": 0.5605235918702897, "learning_rate": 7.485838486788803e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.15365715324878693, "step": 3265, "valid_targets_mean": 3910.3, "valid_targets_min": 510 }, { "epoch": 5.215311004784689, "grad_norm": 0.4804446704770563, "learning_rate": 7.4238965294184374e-06, "loss": 0.1386, "loss_nan_ranks": 0, "loss_rank_avg": 0.11510901153087616, "step": 3270, "valid_targets_mean": 4616.4, "valid_targets_min": 2092 }, { "epoch": 5.223285486443381, "grad_norm": 0.48788340937166225, "learning_rate": 7.362153452039409e-06, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.12575878202915192, "step": 3275, "valid_targets_mean": 4244.5, "valid_targets_min": 2169 }, { "epoch": 5.231259968102074, "grad_norm": 0.4998963625738302, "learning_rate": 7.300610231064056e-06, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.1369197964668274, "step": 3280, "valid_targets_mean": 4486.5, "valid_targets_min": 1157 }, { "epoch": 5.239234449760765, "grad_norm": 0.5597438659865254, "learning_rate": 7.239267839744166e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.13235260546207428, "step": 3285, "valid_targets_mean": 3675.8, "valid_targets_min": 1767 }, { "epoch": 5.247208931419458, "grad_norm": 0.4637157957912727, "learning_rate": 7.178127248155604e-06, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.12913677096366882, "step": 3290, "valid_targets_mean": 5069.9, "valid_targets_min": 2045 }, { "epoch": 5.25518341307815, "grad_norm": 0.5234421904422631, "learning_rate": 7.117189423182917e-06, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.1609647274017334, "step": 3295, "valid_targets_mean": 4219.6, "valid_targets_min": 1568 }, { "epoch": 5.2631578947368425, "grad_norm": 0.8939060446670861, "learning_rate": 7.056455328504104e-06, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.17754587531089783, "step": 3300, "valid_targets_mean": 4179.9, "valid_targets_min": 1021 }, { "epoch": 5.271132376395534, "grad_norm": 0.5613035580302348, "learning_rate": 6.995925924575342e-06, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.14372298121452332, "step": 3305, "valid_targets_mean": 3731.8, "valid_targets_min": 1233 }, { "epoch": 5.279106858054226, "grad_norm": 0.4154591658982006, "learning_rate": 6.935602168615792e-06, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.12290593981742859, "step": 3310, "valid_targets_mean": 5637.1, "valid_targets_min": 1673 }, { "epoch": 5.287081339712919, "grad_norm": 0.6416800447593414, "learning_rate": 6.875485014592493e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.1722438931465149, "step": 3315, "valid_targets_mean": 4116.6, "valid_targets_min": 1508 }, { "epoch": 5.295055821371611, "grad_norm": 0.5871320560825972, "learning_rate": 6.815575413205235e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.13305939733982086, "step": 3320, "valid_targets_mean": 3895.7, "valid_targets_min": 416 }, { "epoch": 5.303030303030303, "grad_norm": 0.5007068898056246, "learning_rate": 6.755874311871562e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.12426762282848358, "step": 3325, "valid_targets_mean": 3973.1, "valid_targets_min": 1233 }, { "epoch": 5.311004784688995, "grad_norm": 0.5044473336922294, "learning_rate": 6.696382654711777e-06, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.13455146551132202, "step": 3330, "valid_targets_mean": 3863.1, "valid_targets_min": 1300 }, { "epoch": 5.318979266347688, "grad_norm": 0.4845451776935124, "learning_rate": 6.637101382533986e-06, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.15252287685871124, "step": 3335, "valid_targets_mean": 4714.7, "valid_targets_min": 1551 }, { "epoch": 5.32695374800638, "grad_norm": 0.49995222258967786, "learning_rate": 6.578031432819263e-06, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.13115063309669495, "step": 3340, "valid_targets_mean": 3895.4, "valid_targets_min": 342 }, { "epoch": 5.3349282296650715, "grad_norm": 0.5147718024489065, "learning_rate": 6.5191737397068015e-06, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.1277836561203003, "step": 3345, "valid_targets_mean": 4424.9, "valid_targets_min": 1402 }, { "epoch": 5.342902711323764, "grad_norm": 0.581498600134185, "learning_rate": 6.460529233979127e-06, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.13812121748924255, "step": 3350, "valid_targets_mean": 3206.0, "valid_targets_min": 1569 }, { "epoch": 5.350877192982456, "grad_norm": 0.44412427640952046, "learning_rate": 6.402098843047417e-06, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.14585547149181366, "step": 3355, "valid_targets_mean": 5636.0, "valid_targets_min": 2343 }, { "epoch": 5.358851674641148, "grad_norm": 0.46631543622836114, "learning_rate": 6.343883490936791e-06, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.1294684112071991, "step": 3360, "valid_targets_mean": 5182.2, "valid_targets_min": 1761 }, { "epoch": 5.36682615629984, "grad_norm": 0.7967138290866428, "learning_rate": 6.285884098271739e-06, "loss": 0.1386, "loss_nan_ranks": 0, "loss_rank_avg": 0.13547652959823608, "step": 3365, "valid_targets_mean": 4249.9, "valid_targets_min": 738 }, { "epoch": 5.374800637958533, "grad_norm": 0.5636272491598279, "learning_rate": 6.228101582261532e-06, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.13094601035118103, "step": 3370, "valid_targets_mean": 4631.6, "valid_targets_min": 692 }, { "epoch": 5.382775119617225, "grad_norm": 0.5018163908163288, "learning_rate": 6.170536856685716e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.17899195849895477, "step": 3375, "valid_targets_mean": 5286.1, "valid_targets_min": 2007 }, { "epoch": 5.3907496012759175, "grad_norm": 0.5181322415866998, "learning_rate": 6.113190831879698e-06, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.13492557406425476, "step": 3380, "valid_targets_mean": 4542.4, "valid_targets_min": 1544 }, { "epoch": 5.398724082934609, "grad_norm": 0.49897907969004646, "learning_rate": 6.056064414720317e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.1465134173631668, "step": 3385, "valid_targets_mean": 4784.2, "valid_targets_min": 1590 }, { "epoch": 5.4066985645933014, "grad_norm": 0.511553521072539, "learning_rate": 5.999158508611496e-06, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.133215069770813, "step": 3390, "valid_targets_mean": 3946.7, "valid_targets_min": 1646 }, { "epoch": 5.414673046251994, "grad_norm": 0.5330358447457354, "learning_rate": 5.942474013469983e-06, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.16982445120811462, "step": 3395, "valid_targets_mean": 4178.5, "valid_targets_min": 1664 }, { "epoch": 5.422647527910685, "grad_norm": 0.5597901604211492, "learning_rate": 5.886011825711117e-06, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.17069560289382935, "step": 3400, "valid_targets_mean": 4582.6, "valid_targets_min": 1345 }, { "epoch": 5.430622009569378, "grad_norm": 0.5472872828033137, "learning_rate": 5.829772838234615e-06, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.15048807859420776, "step": 3405, "valid_targets_mean": 4030.6, "valid_targets_min": 1675 }, { "epoch": 5.43859649122807, "grad_norm": 0.5792848668345226, "learning_rate": 5.773757940410503e-06, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.1506005823612213, "step": 3410, "valid_targets_mean": 4001.0, "valid_targets_min": 652 }, { "epoch": 5.446570972886763, "grad_norm": 0.5741421209243341, "learning_rate": 5.7179680180650055e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.1489039659500122, "step": 3415, "valid_targets_mean": 3604.6, "valid_targets_min": 1131 }, { "epoch": 5.454545454545454, "grad_norm": 0.4976492316442447, "learning_rate": 5.6624039534665775e-06, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.1596824824810028, "step": 3420, "valid_targets_mean": 5098.1, "valid_targets_min": 1663 }, { "epoch": 5.4625199362041466, "grad_norm": 0.5192694981391627, "learning_rate": 5.607066625311925e-06, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.18752288818359375, "step": 3425, "valid_targets_mean": 4772.7, "valid_targets_min": 1762 }, { "epoch": 5.470494417862839, "grad_norm": 0.4898189694458072, "learning_rate": 5.55195690871211e-06, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.136124387383461, "step": 3430, "valid_targets_mean": 4446.1, "valid_targets_min": 1368 }, { "epoch": 5.478468899521531, "grad_norm": 0.5134289481443551, "learning_rate": 5.497075675178727e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.12175813317298889, "step": 3435, "valid_targets_mean": 3663.2, "valid_targets_min": 1077 }, { "epoch": 5.486443381180223, "grad_norm": 0.4923964128209256, "learning_rate": 5.442423792610118e-06, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.158582404255867, "step": 3440, "valid_targets_mean": 4724.8, "valid_targets_min": 1120 }, { "epoch": 5.494417862838915, "grad_norm": 0.5728414484181402, "learning_rate": 5.388002125277627e-06, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.15127599239349365, "step": 3445, "valid_targets_mean": 3708.5, "valid_targets_min": 1555 }, { "epoch": 5.502392344497608, "grad_norm": 0.5316153344749247, "learning_rate": 5.333811533811945e-06, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.1468171775341034, "step": 3450, "valid_targets_mean": 4261.4, "valid_targets_min": 1179 }, { "epoch": 5.5103668261563, "grad_norm": 0.5059201934559844, "learning_rate": 5.2798528751895265e-06, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.16418465971946716, "step": 3455, "valid_targets_mean": 4627.7, "valid_targets_min": 659 }, { "epoch": 5.518341307814992, "grad_norm": 0.5138855686834195, "learning_rate": 5.226127002718984e-06, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.14713597297668457, "step": 3460, "valid_targets_mean": 4193.9, "valid_targets_min": 465 }, { "epoch": 5.526315789473684, "grad_norm": 0.8327422979910104, "learning_rate": 5.1726347660276424e-06, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.12202882766723633, "step": 3465, "valid_targets_mean": 3889.8, "valid_targets_min": 2307 }, { "epoch": 5.5342902711323765, "grad_norm": 0.5417866845035682, "learning_rate": 5.119377011048066e-06, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.15193571150302887, "step": 3470, "valid_targets_mean": 3883.6, "valid_targets_min": 1027 }, { "epoch": 5.542264752791069, "grad_norm": 0.4869683717405225, "learning_rate": 5.066354580004713e-06, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.12537409365177155, "step": 3475, "valid_targets_mean": 4069.8, "valid_targets_min": 1800 }, { "epoch": 5.55023923444976, "grad_norm": 0.4657169670509649, "learning_rate": 5.013568311400599e-06, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.1281999796628952, "step": 3480, "valid_targets_mean": 4824.8, "valid_targets_min": 1840 }, { "epoch": 5.558213716108453, "grad_norm": 0.48908460901251527, "learning_rate": 4.96101904000402e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.14244484901428223, "step": 3485, "valid_targets_mean": 4372.4, "valid_targets_min": 588 }, { "epoch": 5.566188197767145, "grad_norm": 0.5080720826305037, "learning_rate": 4.908707596835396e-06, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.13216745853424072, "step": 3490, "valid_targets_mean": 4219.7, "valid_targets_min": 1831 }, { "epoch": 5.574162679425838, "grad_norm": 0.49012390976455616, "learning_rate": 4.856634809154093e-06, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.1266259402036667, "step": 3495, "valid_targets_mean": 4140.4, "valid_targets_min": 1462 }, { "epoch": 5.582137161084529, "grad_norm": 0.4655698992214377, "learning_rate": 4.804801500445338e-06, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.1438761204481125, "step": 3500, "valid_targets_mean": 5119.6, "valid_targets_min": 1727 }, { "epoch": 5.590111642743222, "grad_norm": 0.47702768130088696, "learning_rate": 4.753208490407233e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.13481447100639343, "step": 3505, "valid_targets_mean": 4350.1, "valid_targets_min": 1564 }, { "epoch": 5.598086124401914, "grad_norm": 0.5869307333733439, "learning_rate": 4.701856594937744e-06, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.13290971517562866, "step": 3510, "valid_targets_mean": 3775.4, "valid_targets_min": 1844 }, { "epoch": 5.606060606060606, "grad_norm": 0.5164996482721174, "learning_rate": 4.650746626121838e-06, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.18071457743644714, "step": 3515, "valid_targets_mean": 4425.1, "valid_targets_min": 1501 }, { "epoch": 5.614035087719298, "grad_norm": 0.5064382852224343, "learning_rate": 4.5998793922186315e-06, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.13357748091220856, "step": 3520, "valid_targets_mean": 4476.5, "valid_targets_min": 311 }, { "epoch": 5.62200956937799, "grad_norm": 0.4774092956312079, "learning_rate": 4.549255697648576e-06, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.13738349080085754, "step": 3525, "valid_targets_mean": 4918.1, "valid_targets_min": 1763 }, { "epoch": 5.629984051036683, "grad_norm": 0.4869106482742091, "learning_rate": 4.498876342980796e-06, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.13851019740104675, "step": 3530, "valid_targets_mean": 4753.4, "valid_targets_min": 2359 }, { "epoch": 5.637958532695375, "grad_norm": 0.5444025100400355, "learning_rate": 4.448742124920368e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.15897592902183533, "step": 3535, "valid_targets_mean": 4504.8, "valid_targets_min": 1086 }, { "epoch": 5.645933014354067, "grad_norm": 0.5202794879141485, "learning_rate": 4.39885383629576e-06, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.12069641053676605, "step": 3540, "valid_targets_mean": 3759.1, "valid_targets_min": 840 }, { "epoch": 5.653907496012759, "grad_norm": 0.4955637184896322, "learning_rate": 4.349212266046285e-06, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.15988540649414062, "step": 3545, "valid_targets_mean": 4708.2, "valid_targets_min": 2546 }, { "epoch": 5.6618819776714515, "grad_norm": 0.5349829325713732, "learning_rate": 4.299818199209629e-06, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.15441840887069702, "step": 3550, "valid_targets_mean": 3981.0, "valid_targets_min": 1162 }, { "epoch": 5.669856459330144, "grad_norm": 0.5752960820375173, "learning_rate": 4.250672416909407e-06, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.1708446890115738, "step": 3555, "valid_targets_mean": 4396.9, "valid_targets_min": 1424 }, { "epoch": 5.6778309409888355, "grad_norm": 0.5751417483583992, "learning_rate": 4.201775696342862e-06, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.18202140927314758, "step": 3560, "valid_targets_mean": 4092.4, "valid_targets_min": 630 }, { "epoch": 5.685805422647528, "grad_norm": 1.1827861103154333, "learning_rate": 4.153128810768517e-06, "loss": 0.1373, "loss_nan_ranks": 0, "loss_rank_avg": 0.14385861158370972, "step": 3565, "valid_targets_mean": 4737.3, "valid_targets_min": 1622 }, { "epoch": 5.69377990430622, "grad_norm": 0.5422374910484713, "learning_rate": 4.104732529493991e-06, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.139515221118927, "step": 3570, "valid_targets_mean": 4079.3, "valid_targets_min": 1344 }, { "epoch": 5.701754385964913, "grad_norm": 0.5363029556528964, "learning_rate": 4.056587617863825e-06, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.1622910350561142, "step": 3575, "valid_targets_mean": 4282.9, "valid_targets_min": 316 }, { "epoch": 5.709728867623604, "grad_norm": 0.4597016933287751, "learning_rate": 4.008694837247345e-06, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.13833516836166382, "step": 3580, "valid_targets_mean": 5463.1, "valid_targets_min": 1688 }, { "epoch": 5.717703349282297, "grad_norm": 0.5063083170748712, "learning_rate": 3.961054945026674e-06, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.15499377250671387, "step": 3585, "valid_targets_mean": 4217.2, "valid_targets_min": 1999 }, { "epoch": 5.725677830940989, "grad_norm": 0.5248353026554393, "learning_rate": 3.913668694584705e-06, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.15698176622390747, "step": 3590, "valid_targets_mean": 4311.0, "valid_targets_min": 1237 }, { "epoch": 5.733652312599681, "grad_norm": 0.5039937842772115, "learning_rate": 3.866536835293227e-06, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.1316099911928177, "step": 3595, "valid_targets_mean": 4095.2, "valid_targets_min": 1637 }, { "epoch": 5.741626794258373, "grad_norm": 0.5325358744438344, "learning_rate": 3.819660112501053e-06, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.14324098825454712, "step": 3600, "valid_targets_mean": 4207.9, "valid_targets_min": 876 }, { "epoch": 5.749601275917065, "grad_norm": 0.47962766801791007, "learning_rate": 3.773039267522227e-06, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.13331088423728943, "step": 3605, "valid_targets_mean": 4672.8, "valid_targets_min": 414 }, { "epoch": 5.757575757575758, "grad_norm": 0.513570541506682, "learning_rate": 3.72667503762433e-06, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.11546094715595245, "step": 3610, "valid_targets_mean": 4141.8, "valid_targets_min": 1381 }, { "epoch": 5.76555023923445, "grad_norm": 0.7010946630275743, "learning_rate": 3.680568156016786e-06, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.14983190596103668, "step": 3615, "valid_targets_mean": 4744.1, "valid_targets_min": 302 }, { "epoch": 5.773524720893142, "grad_norm": 0.5750246801245077, "learning_rate": 3.6347193518392776e-06, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.15094132721424103, "step": 3620, "valid_targets_mean": 3853.7, "valid_targets_min": 1087 }, { "epoch": 5.781499202551834, "grad_norm": 0.4450147099326662, "learning_rate": 3.58912935015024e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.1421867311000824, "step": 3625, "valid_targets_mean": 5715.1, "valid_targets_min": 2194 }, { "epoch": 5.7894736842105265, "grad_norm": 0.539335801690844, "learning_rate": 3.543798871915367e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.14866751432418823, "step": 3630, "valid_targets_mean": 3839.4, "valid_targets_min": 1946 }, { "epoch": 5.797448165869218, "grad_norm": 0.5828493833087499, "learning_rate": 3.498728633996209e-06, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.1669713258743286, "step": 3635, "valid_targets_mean": 5967.7, "valid_targets_min": 1818 }, { "epoch": 5.8054226475279105, "grad_norm": 0.534453291890428, "learning_rate": 3.453919349138859e-06, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.12102772295475006, "step": 3640, "valid_targets_mean": 3891.5, "valid_targets_min": 1323 }, { "epoch": 5.813397129186603, "grad_norm": 0.48171779799429404, "learning_rate": 3.4093717259626514e-06, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.14127930998802185, "step": 3645, "valid_targets_mean": 4453.7, "valid_targets_min": 736 }, { "epoch": 5.821371610845295, "grad_norm": 0.49861046151709937, "learning_rate": 3.365086468948988e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.14490726590156555, "step": 3650, "valid_targets_mean": 4365.1, "valid_targets_min": 1254 }, { "epoch": 5.829346092503988, "grad_norm": 0.5855078575877344, "learning_rate": 3.321064278430175e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.18041715025901794, "step": 3655, "valid_targets_mean": 3792.9, "valid_targets_min": 1380 }, { "epoch": 5.837320574162679, "grad_norm": 0.6060290822284615, "learning_rate": 3.277305850578345e-06, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.14750179648399353, "step": 3660, "valid_targets_mean": 4823.8, "valid_targets_min": 1604 }, { "epoch": 5.845295055821372, "grad_norm": 0.49296159557823577, "learning_rate": 3.2338118773944684e-06, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.16297249495983124, "step": 3665, "valid_targets_mean": 4690.5, "valid_targets_min": 1229 }, { "epoch": 5.853269537480064, "grad_norm": 0.5335159615396101, "learning_rate": 3.1905830466973975e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.13889795541763306, "step": 3670, "valid_targets_mean": 4028.1, "valid_targets_min": 1224 }, { "epoch": 5.861244019138756, "grad_norm": 0.48653483581031726, "learning_rate": 3.14762004211298e-06, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.14789119362831116, "step": 3675, "valid_targets_mean": 4518.0, "valid_targets_min": 1242 }, { "epoch": 5.869218500797448, "grad_norm": 0.44980623299065636, "learning_rate": 3.1049235430632696e-06, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.14088287949562073, "step": 3680, "valid_targets_mean": 5030.7, "valid_targets_min": 2268 }, { "epoch": 5.87719298245614, "grad_norm": 0.5454087979799263, "learning_rate": 3.062494224755759e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.14683279395103455, "step": 3685, "valid_targets_mean": 3636.9, "valid_targets_min": 1406 }, { "epoch": 5.885167464114833, "grad_norm": 0.5284650556492287, "learning_rate": 3.0203327581727195e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.14028066396713257, "step": 3690, "valid_targets_mean": 3733.6, "valid_targets_min": 1271 }, { "epoch": 5.893141945773524, "grad_norm": 1.3422902233127916, "learning_rate": 2.9784398100605937e-06, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.14661850035190582, "step": 3695, "valid_targets_mean": 3551.7, "valid_targets_min": 1107 }, { "epoch": 5.901116427432217, "grad_norm": 0.5040044272291349, "learning_rate": 2.9368160429194127e-06, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.13759127259254456, "step": 3700, "valid_targets_mean": 4007.2, "valid_targets_min": 458 }, { "epoch": 5.909090909090909, "grad_norm": 0.6963247570508141, "learning_rate": 2.895462114992371e-06, "loss": 0.1389, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433190256357193, "step": 3705, "valid_targets_mean": 3502.1, "valid_targets_min": 1281 }, { "epoch": 5.917065390749602, "grad_norm": 0.5251079681315951, "learning_rate": 2.8543786802553943e-06, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.1811850666999817, "step": 3710, "valid_targets_mean": 5324.9, "valid_targets_min": 882 }, { "epoch": 5.925039872408293, "grad_norm": 0.5241665849437455, "learning_rate": 2.813566388406781e-06, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.1358180046081543, "step": 3715, "valid_targets_mean": 3920.8, "valid_targets_min": 599 }, { "epoch": 5.9330143540669855, "grad_norm": 0.49869493382972957, "learning_rate": 2.773025884856957e-06, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.1408381462097168, "step": 3720, "valid_targets_mean": 4674.2, "valid_targets_min": 1306 }, { "epoch": 5.940988835725678, "grad_norm": 0.5711342385096281, "learning_rate": 2.7327578107182585e-06, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.1314079761505127, "step": 3725, "valid_targets_mean": 3162.1, "valid_targets_min": 892 }, { "epoch": 5.94896331738437, "grad_norm": 0.6108334839280424, "learning_rate": 2.692762802794775e-06, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.12222002446651459, "step": 3730, "valid_targets_mean": 3391.4, "valid_targets_min": 961 }, { "epoch": 5.956937799043062, "grad_norm": 0.5027197439334232, "learning_rate": 2.6530414935723104e-06, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.13072869181632996, "step": 3735, "valid_targets_mean": 3994.5, "valid_targets_min": 1639 }, { "epoch": 5.964912280701754, "grad_norm": 0.5075537096649687, "learning_rate": 2.6135945112083506e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.12960845232009888, "step": 3740, "valid_targets_mean": 4494.9, "valid_targets_min": 597 }, { "epoch": 5.972886762360447, "grad_norm": 0.5380248417532908, "learning_rate": 2.574422479522156e-06, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.1744580864906311, "step": 3745, "valid_targets_mean": 4334.4, "valid_targets_min": 1703 }, { "epoch": 5.980861244019139, "grad_norm": 0.5515990373712637, "learning_rate": 2.535526017984884e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.14526067674160004, "step": 3750, "valid_targets_mean": 3798.1, "valid_targets_min": 353 }, { "epoch": 5.988835725677831, "grad_norm": 0.49011701337432784, "learning_rate": 2.4969057417097807e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.15856046974658966, "step": 3755, "valid_targets_mean": 5457.1, "valid_targets_min": 893 }, { "epoch": 5.996810207336523, "grad_norm": 0.5383249113038507, "learning_rate": 2.458562261442483e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.14745956659317017, "step": 3760, "valid_targets_mean": 4042.0, "valid_targets_min": 900 }, { "epoch": 6.0047846889952154, "grad_norm": 0.49430702596220477, "learning_rate": 2.4204961835513263e-06, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.14110133051872253, "step": 3765, "valid_targets_mean": 4544.2, "valid_targets_min": 1362 }, { "epoch": 6.012759170653908, "grad_norm": 0.5009175563097514, "learning_rate": 2.3827081100177797e-06, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.1476556956768036, "step": 3770, "valid_targets_mean": 5110.4, "valid_targets_min": 1185 }, { "epoch": 6.020733652312599, "grad_norm": 0.49313677516660054, "learning_rate": 2.3451986384269266e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.13937491178512573, "step": 3775, "valid_targets_mean": 4621.9, "valid_targets_min": 1624 }, { "epoch": 6.028708133971292, "grad_norm": 0.6860362912088609, "learning_rate": 2.307968361957993e-06, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.187550351023674, "step": 3780, "valid_targets_mean": 4856.3, "valid_targets_min": 1571 }, { "epoch": 6.036682615629984, "grad_norm": 0.5773716723883122, "learning_rate": 2.2710178693749805e-06, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.1661595106124878, "step": 3785, "valid_targets_mean": 3802.4, "valid_targets_min": 1601 }, { "epoch": 6.044657097288677, "grad_norm": 0.497541583677315, "learning_rate": 2.2343477450173665e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.11052682250738144, "step": 3790, "valid_targets_mean": 3915.4, "valid_targets_min": 1388 }, { "epoch": 6.052631578947368, "grad_norm": 0.4960366052870153, "learning_rate": 2.197958568790839e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.14265236258506775, "step": 3795, "valid_targets_mean": 4880.4, "valid_targets_min": 2259 }, { "epoch": 6.0606060606060606, "grad_norm": 0.4925604930180625, "learning_rate": 2.161850916158148e-06, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.13926450908184052, "step": 3800, "valid_targets_mean": 4805.2, "valid_targets_min": 1930 }, { "epoch": 6.068580542264753, "grad_norm": 0.49478746503871057, "learning_rate": 2.1260253581299996e-06, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.1338876485824585, "step": 3805, "valid_targets_mean": 4109.5, "valid_targets_min": 414 }, { "epoch": 6.076555023923445, "grad_norm": 0.5064549765633942, "learning_rate": 2.0904824612560046e-06, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.1764906346797943, "step": 3810, "valid_targets_mean": 4899.3, "valid_targets_min": 1593 }, { "epoch": 6.084529505582137, "grad_norm": 0.5180065700775449, "learning_rate": 2.0552227876157536e-06, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.1284601241350174, "step": 3815, "valid_targets_mean": 3687.7, "valid_targets_min": 732 }, { "epoch": 6.092503987240829, "grad_norm": 0.5259373294338707, "learning_rate": 2.020246894809912e-06, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.13603927195072174, "step": 3820, "valid_targets_mean": 4060.6, "valid_targets_min": 308 }, { "epoch": 6.100478468899522, "grad_norm": 0.5235335460898032, "learning_rate": 1.9855553359513836e-06, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.11099904775619507, "step": 3825, "valid_targets_mean": 4016.0, "valid_targets_min": 1483 }, { "epoch": 6.108452950558214, "grad_norm": 0.6341054094850744, "learning_rate": 1.9511486596566054e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.17271441221237183, "step": 3830, "valid_targets_mean": 3144.9, "valid_targets_min": 1179 }, { "epoch": 6.116427432216906, "grad_norm": 0.5684654706262051, "learning_rate": 1.917027410036825e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.15632422268390656, "step": 3835, "valid_targets_mean": 3489.4, "valid_targets_min": 440 }, { "epoch": 6.124401913875598, "grad_norm": 0.47186770873479894, "learning_rate": 1.8831921266895348e-06, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.12489638477563858, "step": 3840, "valid_targets_mean": 4751.5, "valid_targets_min": 564 }, { "epoch": 6.1323763955342905, "grad_norm": 0.5812261927451817, "learning_rate": 1.8496433446899197e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.11479625850915909, "step": 3845, "valid_targets_mean": 3060.4, "valid_targets_min": 1069 }, { "epoch": 6.140350877192983, "grad_norm": 0.5402386536039824, "learning_rate": 1.8163815945823881e-06, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.1345522552728653, "step": 3850, "valid_targets_mean": 4273.4, "valid_targets_min": 1083 }, { "epoch": 6.148325358851674, "grad_norm": 0.496965598633163, "learning_rate": 1.7834074023722082e-06, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.12266291677951813, "step": 3855, "valid_targets_mean": 4934.3, "valid_targets_min": 1487 }, { "epoch": 6.156299840510367, "grad_norm": 0.5519860673495093, "learning_rate": 1.7507212895171632e-06, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.1321459710597992, "step": 3860, "valid_targets_mean": 3861.4, "valid_targets_min": 686 }, { "epoch": 6.164274322169059, "grad_norm": 0.49076514558644085, "learning_rate": 1.7183237729193081e-06, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.15181314945220947, "step": 3865, "valid_targets_mean": 5045.6, "valid_targets_min": 1188 }, { "epoch": 6.172248803827751, "grad_norm": 0.5372730767695284, "learning_rate": 1.6862153649168211e-06, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.12448375672101974, "step": 3870, "valid_targets_mean": 3875.8, "valid_targets_min": 1162 }, { "epoch": 6.180223285486443, "grad_norm": 0.49684499279704325, "learning_rate": 1.6543965732758737e-06, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.1295873075723648, "step": 3875, "valid_targets_mean": 4275.8, "valid_targets_min": 1810 }, { "epoch": 6.188197767145136, "grad_norm": 0.5504960661897019, "learning_rate": 1.6228679011826032e-06, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.1351630687713623, "step": 3880, "valid_targets_mean": 3684.4, "valid_targets_min": 1036 }, { "epoch": 6.196172248803828, "grad_norm": 0.4995587060471986, "learning_rate": 1.591629847235172e-06, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.12718336284160614, "step": 3885, "valid_targets_mean": 4705.2, "valid_targets_min": 1038 }, { "epoch": 6.2041467304625195, "grad_norm": 0.4959141881965582, "learning_rate": 1.5606829054358686e-06, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.1419508159160614, "step": 3890, "valid_targets_mean": 4684.0, "valid_targets_min": 2001 }, { "epoch": 6.212121212121212, "grad_norm": 0.623950185968585, "learning_rate": 1.5300275651832963e-06, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.13223516941070557, "step": 3895, "valid_targets_mean": 5110.7, "valid_targets_min": 1969 }, { "epoch": 6.220095693779904, "grad_norm": 0.6346640130343832, "learning_rate": 1.499664311264648e-06, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.16367286443710327, "step": 3900, "valid_targets_mean": 3819.8, "valid_targets_min": 860 }, { "epoch": 6.228070175438597, "grad_norm": 0.6122246042123756, "learning_rate": 1.4695936238480135e-06, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.12655913829803467, "step": 3905, "valid_targets_mean": 3684.9, "valid_targets_min": 736 }, { "epoch": 6.236044657097288, "grad_norm": 0.5744548130501511, "learning_rate": 1.4398159784748144e-06, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.16123470664024353, "step": 3910, "valid_targets_mean": 3574.8, "valid_targets_min": 1859 }, { "epoch": 6.244019138755981, "grad_norm": 0.5996106329357315, "learning_rate": 1.4103318460522598e-06, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.1403590589761734, "step": 3915, "valid_targets_mean": 3877.1, "valid_targets_min": 625 }, { "epoch": 6.251993620414673, "grad_norm": 0.5132749502243364, "learning_rate": 1.3811416928459177e-06, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.14636051654815674, "step": 3920, "valid_targets_mean": 4128.2, "valid_targets_min": 465 }, { "epoch": 6.2599681020733655, "grad_norm": 0.5650057439215522, "learning_rate": 1.3522459804723353e-06, "loss": 0.1245, "loss_nan_ranks": 0, "loss_rank_avg": 0.1392631232738495, "step": 3925, "valid_targets_mean": 4433.2, "valid_targets_min": 916 }, { "epoch": 6.267942583732057, "grad_norm": 0.5185553837899172, "learning_rate": 1.3236451658917293e-06, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.13320839405059814, "step": 3930, "valid_targets_mean": 4020.2, "valid_targets_min": 1580 }, { "epoch": 6.2759170653907494, "grad_norm": 0.5525213441195974, "learning_rate": 1.2953397014007728e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.17850124835968018, "step": 3935, "valid_targets_mean": 4348.1, "valid_targets_min": 1432 }, { "epoch": 6.283891547049442, "grad_norm": 0.488391409608166, "learning_rate": 1.2673300346254447e-06, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.15462128818035126, "step": 3940, "valid_targets_mean": 4733.1, "valid_targets_min": 1935 }, { "epoch": 6.291866028708134, "grad_norm": 0.5108981894562138, "learning_rate": 1.239616608513925e-06, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.1496082842350006, "step": 3945, "valid_targets_mean": 4025.8, "valid_targets_min": 535 }, { "epoch": 6.299840510366826, "grad_norm": 0.6093838052506947, "learning_rate": 1.2121998613296259e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.10867314040660858, "step": 3950, "valid_targets_mean": 3494.8, "valid_targets_min": 670 }, { "epoch": 6.307814992025518, "grad_norm": 0.5119509074281289, "learning_rate": 1.1850802266442396e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.16429255902767181, "step": 3955, "valid_targets_mean": 4612.4, "valid_targets_min": 759 }, { "epoch": 6.315789473684211, "grad_norm": 0.5347696760359358, "learning_rate": 1.1582581333308784e-06, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.1720159351825714, "step": 3960, "valid_targets_mean": 4205.4, "valid_targets_min": 515 }, { "epoch": 6.323763955342903, "grad_norm": 0.4852207515725228, "learning_rate": 1.1317340055573122e-06, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.1445663422346115, "step": 3965, "valid_targets_mean": 5052.6, "valid_targets_min": 1283 }, { "epoch": 6.3317384370015946, "grad_norm": 0.507436285150948, "learning_rate": 1.1055082627792357e-06, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.12436027824878693, "step": 3970, "valid_targets_mean": 4297.2, "valid_targets_min": 1663 }, { "epoch": 6.339712918660287, "grad_norm": 0.5368792578229027, "learning_rate": 1.0795813197336602e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.11996762454509735, "step": 3975, "valid_targets_mean": 3953.6, "valid_targets_min": 1257 }, { "epoch": 6.347687400318979, "grad_norm": 0.48044682571789116, "learning_rate": 1.0539535864323391e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.1088440790772438, "step": 3980, "valid_targets_mean": 4750.7, "valid_targets_min": 1344 }, { "epoch": 6.355661881977672, "grad_norm": 0.5329144232637667, "learning_rate": 1.0286254681552777e-06, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.1612853854894638, "step": 3985, "valid_targets_mean": 4179.6, "valid_targets_min": 1229 }, { "epoch": 6.363636363636363, "grad_norm": 0.5748925946370642, "learning_rate": 1.0035973654443466e-06, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.12145799398422241, "step": 3990, "valid_targets_mean": 4831.9, "valid_targets_min": 861 }, { "epoch": 6.371610845295056, "grad_norm": 0.5705983078076705, "learning_rate": 9.788696740969295e-07, "loss": 0.1337, "loss_nan_ranks": 0, "loss_rank_avg": 0.14661964774131775, "step": 3995, "valid_targets_mean": 3695.1, "valid_targets_min": 550 }, { "epoch": 6.379585326953748, "grad_norm": 0.5645513513745306, "learning_rate": 9.544427851596661e-07, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.13105720281600952, "step": 4000, "valid_targets_mean": 3997.6, "valid_targets_min": 287 }, { "epoch": 6.3875598086124405, "grad_norm": 0.5275976634530215, "learning_rate": 9.303170849222764e-07, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15079137682914734, "step": 4005, "valid_targets_mean": 4694.5, "valid_targets_min": 359 }, { "epoch": 6.395534290271132, "grad_norm": 0.5285990530880269, "learning_rate": 9.064929549114421e-07, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.10869532823562622, "step": 4010, "valid_targets_mean": 3649.6, "valid_targets_min": 1504 }, { "epoch": 6.4035087719298245, "grad_norm": 0.7090154333622751, "learning_rate": 8.829707718847835e-07, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.14588609337806702, "step": 4015, "valid_targets_mean": 3740.7, "valid_targets_min": 1132 }, { "epoch": 6.411483253588517, "grad_norm": 0.5137768138489031, "learning_rate": 8.597509078248923e-07, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488763988018036, "step": 4020, "valid_targets_mean": 4146.1, "valid_targets_min": 531 }, { "epoch": 6.419457735247209, "grad_norm": 0.48049275831230703, "learning_rate": 8.368337299334461e-07, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.11516915261745453, "step": 4025, "valid_targets_mean": 4326.6, "valid_targets_min": 1295 }, { "epoch": 6.427432216905901, "grad_norm": 0.5161570168262671, "learning_rate": 8.142196006254144e-07, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.12275591492652893, "step": 4030, "valid_targets_mean": 4094.8, "valid_targets_min": 1898 }, { "epoch": 6.435406698564593, "grad_norm": 0.5362563187603275, "learning_rate": 7.919088775233264e-07, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.13758490979671478, "step": 4035, "valid_targets_mean": 3916.8, "valid_targets_min": 1555 }, { "epoch": 6.443381180223286, "grad_norm": 0.49875755343739087, "learning_rate": 7.699019134515917e-07, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.1160312294960022, "step": 4040, "valid_targets_mean": 4468.5, "valid_targets_min": 2508 }, { "epoch": 6.451355661881978, "grad_norm": 0.5262408222186133, "learning_rate": 7.48199056430956e-07, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.1481764316558838, "step": 4045, "valid_targets_mean": 4616.4, "valid_targets_min": 458 }, { "epoch": 6.45933014354067, "grad_norm": 0.507178503336427, "learning_rate": 7.268006496729762e-07, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.13112816214561462, "step": 4050, "valid_targets_mean": 3990.1, "valid_targets_min": 641 }, { "epoch": 6.467304625199362, "grad_norm": 0.5669657663732001, "learning_rate": 7.057070315745851e-07, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.11124549061059952, "step": 4055, "valid_targets_mean": 3979.8, "valid_targets_min": 1798 }, { "epoch": 6.475279106858054, "grad_norm": 0.5377654564783906, "learning_rate": 6.849185357127686e-07, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.13395267724990845, "step": 4060, "valid_targets_mean": 4332.1, "valid_targets_min": 1825 }, { "epoch": 6.483253588516747, "grad_norm": 0.6589422038099677, "learning_rate": 6.64435490839257e-07, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.12837636470794678, "step": 4065, "valid_targets_mean": 3748.6, "valid_targets_min": 291 }, { "epoch": 6.491228070175438, "grad_norm": 0.46549715916839196, "learning_rate": 6.442582208753578e-07, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.16415579617023468, "step": 4070, "valid_targets_mean": 5833.8, "valid_targets_min": 1597 }, { "epoch": 6.499202551834131, "grad_norm": 0.6622687035422515, "learning_rate": 6.243870449068068e-07, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.1493580937385559, "step": 4075, "valid_targets_mean": 4838.5, "valid_targets_min": 867 }, { "epoch": 6.507177033492823, "grad_norm": 0.5198345078048688, "learning_rate": 6.048222771787382e-07, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.1303584724664688, "step": 4080, "valid_targets_mean": 4566.9, "valid_targets_min": 1867 }, { "epoch": 6.515151515151516, "grad_norm": 0.48509162868152, "learning_rate": 5.85564227090707e-07, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.16224688291549683, "step": 4085, "valid_targets_mean": 5195.4, "valid_targets_min": 1471 }, { "epoch": 6.523125996810207, "grad_norm": 0.5873719255870822, "learning_rate": 5.666131991917989e-07, "loss": 0.1348, "loss_nan_ranks": 0, "loss_rank_avg": 0.13083861768245697, "step": 4090, "valid_targets_mean": 3929.3, "valid_targets_min": 376 }, { "epoch": 6.5311004784688995, "grad_norm": 0.5977724356369237, "learning_rate": 5.479694931758194e-07, "loss": 0.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.13004256784915924, "step": 4095, "valid_targets_mean": 3322.4, "valid_targets_min": 854 }, { "epoch": 6.539074960127592, "grad_norm": 0.5240351703130457, "learning_rate": 5.296334038765483e-07, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.13967791199684143, "step": 4100, "valid_targets_mean": 3777.9, "valid_targets_min": 1111 }, { "epoch": 6.5470494417862835, "grad_norm": 0.5440153780671622, "learning_rate": 5.116052212630696e-07, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.11996950209140778, "step": 4105, "valid_targets_mean": 3631.4, "valid_targets_min": 1837 }, { "epoch": 6.555023923444976, "grad_norm": 0.48914053795353435, "learning_rate": 4.938852304352026e-07, "loss": 0.1245, "loss_nan_ranks": 0, "loss_rank_avg": 0.11675041913986206, "step": 4110, "valid_targets_mean": 4209.9, "valid_targets_min": 1039 }, { "epoch": 6.562998405103668, "grad_norm": 0.5196936360126563, "learning_rate": 4.7647371161898547e-07, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.14445306360721588, "step": 4115, "valid_targets_mean": 4266.6, "valid_targets_min": 1671 }, { "epoch": 6.570972886762361, "grad_norm": 0.6270985256379639, "learning_rate": 4.593709401622359e-07, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.11855871975421906, "step": 4120, "valid_targets_mean": 4256.4, "valid_targets_min": 1403 }, { "epoch": 6.578947368421053, "grad_norm": 0.5513191005216137, "learning_rate": 4.425771865302153e-07, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.16223138570785522, "step": 4125, "valid_targets_mean": 5632.7, "valid_targets_min": 2783 }, { "epoch": 6.586921850079745, "grad_norm": 0.47622414847630423, "learning_rate": 4.2609271630133174e-07, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.15721635520458221, "step": 4130, "valid_targets_mean": 4821.3, "valid_targets_min": 1248 }, { "epoch": 6.594896331738437, "grad_norm": 0.5867580468822079, "learning_rate": 4.099177901629525e-07, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.1569528430700302, "step": 4135, "valid_targets_mean": 4191.9, "valid_targets_min": 351 }, { "epoch": 6.6028708133971294, "grad_norm": 0.5051611881659711, "learning_rate": 3.9405266390727836e-07, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.13498680293560028, "step": 4140, "valid_targets_mean": 4330.7, "valid_targets_min": 338 }, { "epoch": 6.610845295055821, "grad_norm": 0.47853079889882155, "learning_rate": 3.7849758842729344e-07, "loss": 0.1418, "loss_nan_ranks": 0, "loss_rank_avg": 0.12443745136260986, "step": 4145, "valid_targets_mean": 4602.2, "valid_targets_min": 1840 }, { "epoch": 6.618819776714513, "grad_norm": 0.5338550959823287, "learning_rate": 3.632528097128085e-07, "loss": 0.1234, "loss_nan_ranks": 0, "loss_rank_avg": 0.12975472211837769, "step": 4150, "valid_targets_mean": 4234.5, "valid_targets_min": 943 }, { "epoch": 6.626794258373206, "grad_norm": 0.49688890655045326, "learning_rate": 3.48318568846564e-07, "loss": 0.1297, "loss_nan_ranks": 0, "loss_rank_avg": 0.13185477256774902, "step": 4155, "valid_targets_mean": 4626.2, "valid_targets_min": 481 }, { "epoch": 6.634768740031898, "grad_norm": 0.5763693407472297, "learning_rate": 3.336951020004087e-07, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.19649842381477356, "step": 4160, "valid_targets_mean": 4184.9, "valid_targets_min": 1350 }, { "epoch": 6.64274322169059, "grad_norm": 0.5531016551635043, "learning_rate": 3.1938264043158694e-07, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.17289824783802032, "step": 4165, "valid_targets_mean": 4395.6, "valid_targets_min": 1557 }, { "epoch": 6.650717703349282, "grad_norm": 0.47177742265711486, "learning_rate": 3.05381410479062e-07, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.17544347047805786, "step": 4170, "valid_targets_mean": 5182.7, "valid_targets_min": 1911 }, { "epoch": 6.6586921850079746, "grad_norm": 0.5216521849278853, "learning_rate": 2.916916335599407e-07, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.11967335641384125, "step": 4175, "valid_targets_mean": 3633.3, "valid_targets_min": 1290 }, { "epoch": 6.666666666666667, "grad_norm": 0.5244652547649694, "learning_rate": 2.783135261659831e-07, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.14524878561496735, "step": 4180, "valid_targets_mean": 5046.4, "valid_targets_min": 1755 }, { "epoch": 6.6746411483253585, "grad_norm": 0.5242548984299902, "learning_rate": 2.6524729986016293e-07, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.1346084475517273, "step": 4185, "valid_targets_mean": 4556.6, "valid_targets_min": 1156 }, { "epoch": 6.682615629984051, "grad_norm": 0.48588135941150645, "learning_rate": 2.524931612733328e-07, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.12049822509288788, "step": 4190, "valid_targets_mean": 4792.8, "valid_targets_min": 583 }, { "epoch": 6.690590111642743, "grad_norm": 0.5157831592987673, "learning_rate": 2.400513121009529e-07, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.12056033313274384, "step": 4195, "valid_targets_mean": 3902.8, "valid_targets_min": 900 }, { "epoch": 6.698564593301436, "grad_norm": 0.6181941397201824, "learning_rate": 2.279219490998985e-07, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.12805788218975067, "step": 4200, "valid_targets_mean": 4067.9, "valid_targets_min": 448 }, { "epoch": 6.706539074960127, "grad_norm": 0.5411702652574677, "learning_rate": 2.161052640853578e-07, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.13948936760425568, "step": 4205, "valid_targets_mean": 4612.0, "valid_targets_min": 2172 }, { "epoch": 6.71451355661882, "grad_norm": 0.5203767410756568, "learning_rate": 2.0460144392778768e-07, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.14677637815475464, "step": 4210, "valid_targets_mean": 4351.0, "valid_targets_min": 1795 }, { "epoch": 6.722488038277512, "grad_norm": 0.48076115868735375, "learning_rate": 1.9341067054996277e-07, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.12446603178977966, "step": 4215, "valid_targets_mean": 4783.4, "valid_targets_min": 1169 }, { "epoch": 6.7304625199362045, "grad_norm": 0.4938032695536993, "learning_rate": 1.8253312092409992e-07, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.14762309193611145, "step": 4220, "valid_targets_mean": 5270.6, "valid_targets_min": 2308 }, { "epoch": 6.738437001594896, "grad_norm": 0.5073690650738787, "learning_rate": 1.7196896706906273e-07, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.13876202702522278, "step": 4225, "valid_targets_mean": 4535.9, "valid_targets_min": 2133 }, { "epoch": 6.746411483253588, "grad_norm": 0.6239349122520454, "learning_rate": 1.6171837604762597e-07, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.14759038388729095, "step": 4230, "valid_targets_mean": 3153.2, "valid_targets_min": 712 }, { "epoch": 6.754385964912281, "grad_norm": 0.5294503911396128, "learning_rate": 1.5178150996385755e-07, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.14934271574020386, "step": 4235, "valid_targets_mean": 4826.8, "valid_targets_min": 2045 }, { "epoch": 6.762360446570973, "grad_norm": 0.5474589095143887, "learning_rate": 1.421585259605318e-07, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.17565397918224335, "step": 4240, "valid_targets_mean": 3994.0, "valid_targets_min": 811 }, { "epoch": 6.770334928229665, "grad_norm": 0.4968111197576825, "learning_rate": 1.3284957621666039e-07, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.15295177698135376, "step": 4245, "valid_targets_mean": 5280.7, "valid_targets_min": 2153 }, { "epoch": 6.778309409888357, "grad_norm": 0.5712193249343777, "learning_rate": 1.2385480794507853e-07, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.15290597081184387, "step": 4250, "valid_targets_mean": 4323.8, "valid_targets_min": 1528 }, { "epoch": 6.78628389154705, "grad_norm": 0.5387472877772308, "learning_rate": 1.1517436339011589e-07, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.16408362984657288, "step": 4255, "valid_targets_mean": 4533.3, "valid_targets_min": 1733 }, { "epoch": 6.794258373205742, "grad_norm": 0.5262055497554436, "learning_rate": 1.0680837982535607e-07, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.17279741168022156, "step": 4260, "valid_targets_mean": 4844.5, "valid_targets_min": 1115 }, { "epoch": 6.8022328548644335, "grad_norm": 0.5393251228907873, "learning_rate": 9.875698955145174e-08, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.17203345894813538, "step": 4265, "valid_targets_mean": 4560.6, "valid_targets_min": 835 }, { "epoch": 6.810207336523126, "grad_norm": 0.4950986090823543, "learning_rate": 9.102031989404403e-08, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.1278517246246338, "step": 4270, "valid_targets_mean": 4280.2, "valid_targets_min": 271 }, { "epoch": 6.818181818181818, "grad_norm": 0.5322683037430497, "learning_rate": 8.359849320174196e-08, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.14759370684623718, "step": 4275, "valid_targets_mean": 4334.2, "valid_targets_min": 1141 }, { "epoch": 6.826156299840511, "grad_norm": 0.5106524077335042, "learning_rate": 7.649162684419731e-08, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.13630405068397522, "step": 4280, "valid_targets_mean": 5122.1, "valid_targets_min": 1651 }, { "epoch": 6.834130781499202, "grad_norm": 0.48090627611402476, "learning_rate": 6.969983321023499e-08, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.14416742324829102, "step": 4285, "valid_targets_mean": 4816.6, "valid_targets_min": 1821 }, { "epoch": 6.842105263157895, "grad_norm": 0.48778544545536157, "learning_rate": 6.322321970608337e-08, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.1339418888092041, "step": 4290, "valid_targets_mean": 4488.4, "valid_targets_min": 1616 }, { "epoch": 6.850079744816587, "grad_norm": 0.46499159243236704, "learning_rate": 5.7061888753677796e-08, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.14237193763256073, "step": 4295, "valid_targets_mean": 4920.9, "valid_targets_min": 1271 }, { "epoch": 6.858054226475279, "grad_norm": 0.4818822507608203, "learning_rate": 5.121593778903755e-08, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.13319122791290283, "step": 4300, "valid_targets_mean": 4507.4, "valid_targets_min": 2343 }, { "epoch": 6.866028708133971, "grad_norm": 0.5030961917930569, "learning_rate": 4.5685459260722544e-08, "loss": 0.1348, "loss_nan_ranks": 0, "loss_rank_avg": 0.15166345238685608, "step": 4305, "valid_targets_mean": 4678.6, "valid_targets_min": 1154 }, { "epoch": 6.8740031897926634, "grad_norm": 0.5753815923974399, "learning_rate": 4.047054062837452e-08, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.16344240307807922, "step": 4310, "valid_targets_mean": 4398.2, "valid_targets_min": 1732 }, { "epoch": 6.881977671451356, "grad_norm": 0.5355466593328079, "learning_rate": 3.55712643613404e-08, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.14519166946411133, "step": 4315, "valid_targets_mean": 4389.8, "valid_targets_min": 1213 }, { "epoch": 6.889952153110048, "grad_norm": 0.5278125498932654, "learning_rate": 3.0987707937351066e-08, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.13044758141040802, "step": 4320, "valid_targets_mean": 4127.8, "valid_targets_min": 1647 }, { "epoch": 6.89792663476874, "grad_norm": 0.4856712767135322, "learning_rate": 2.6719943841311268e-08, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.13070060312747955, "step": 4325, "valid_targets_mean": 4700.8, "valid_targets_min": 608 }, { "epoch": 6.905901116427432, "grad_norm": 0.6415911642154425, "learning_rate": 2.2768039564151635e-08, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.1640297770500183, "step": 4330, "valid_targets_mean": 3901.8, "valid_targets_min": 655 }, { "epoch": 6.913875598086125, "grad_norm": 0.6626092253360519, "learning_rate": 1.913205760175174e-08, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.1504662036895752, "step": 4335, "valid_targets_mean": 5199.6, "valid_targets_min": 1387 }, { "epoch": 6.921850079744816, "grad_norm": 0.5982491019172199, "learning_rate": 1.5812055453963136e-08, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.14008523523807526, "step": 4340, "valid_targets_mean": 4319.2, "valid_targets_min": 1729 }, { "epoch": 6.9298245614035086, "grad_norm": 0.5104174835877258, "learning_rate": 1.280808562369229e-08, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.133617103099823, "step": 4345, "valid_targets_mean": 4219.4, "valid_targets_min": 1451 }, { "epoch": 6.937799043062201, "grad_norm": 0.4877409631231481, "learning_rate": 1.01201956160768e-08, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.174456387758255, "step": 4350, "valid_targets_mean": 4994.6, "valid_targets_min": 1946 }, { "epoch": 6.945773524720893, "grad_norm": 0.5184348308045106, "learning_rate": 7.74842793772601e-09, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.1534990817308426, "step": 4355, "valid_targets_mean": 4945.9, "valid_targets_min": 1800 }, { "epoch": 6.953748006379586, "grad_norm": 0.5492476418437654, "learning_rate": 5.692820096054874e-09, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.14275865256786346, "step": 4360, "valid_targets_mean": 4028.4, "valid_targets_min": 1148 }, { "epoch": 6.961722488038277, "grad_norm": 0.5057721726447473, "learning_rate": 3.9534045986888706e-09, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.13061657547950745, "step": 4365, "valid_targets_mean": 4621.9, "valid_targets_min": 1483 }, { "epoch": 6.96969696969697, "grad_norm": 0.5165832319676158, "learning_rate": 2.530208952953306e-09, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.15254126489162445, "step": 4370, "valid_targets_mean": 4441.8, "valid_targets_min": 1501 }, { "epoch": 6.977671451355662, "grad_norm": 0.4938874383244835, "learning_rate": 1.4232556654314445e-09, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.12354663759469986, "step": 4375, "valid_targets_mean": 4462.6, "valid_targets_min": 396 }, { "epoch": 6.985645933014354, "grad_norm": 0.5172931781731442, "learning_rate": 6.325622416136767e-10, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.12898609042167664, "step": 4380, "valid_targets_mean": 4070.1, "valid_targets_min": 1645 }, { "epoch": 6.993620414673046, "grad_norm": 0.5813118538526274, "learning_rate": 1.581411856199644e-10, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.12935660779476166, "step": 4385, "valid_targets_mean": 3541.5, "valid_targets_min": 1587 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.12793053686618805, "step": 4389, "total_flos": 1406471795245056.0, "train_loss": 0.18805862067907703, "train_runtime": 23263.3401, "train_samples_per_second": 3.014, "train_steps_per_second": 0.189, "valid_targets_mean": 3981.4, "valid_targets_min": 1669 } ], "logging_steps": 5, "max_steps": 4389, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1406471795245056.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }