{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 6187, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.005659309564233163, "grad_norm": 13.932631974720623, "learning_rate": 2.584814216478191e-07, "loss": 0.6701, "loss_nan_ranks": 0, "loss_rank_avg": 0.3416905999183655, "step": 5, "valid_targets_mean": 7214.4, "valid_targets_min": 4847 }, { "epoch": 0.011318619128466326, "grad_norm": 13.104201365603958, "learning_rate": 5.815831987075929e-07, "loss": 0.6193, "loss_nan_ranks": 0, "loss_rank_avg": 0.30890709161758423, "step": 10, "valid_targets_mean": 6417.1, "valid_targets_min": 4480 }, { "epoch": 0.01697792869269949, "grad_norm": 12.986646595432257, "learning_rate": 9.046849757673668e-07, "loss": 0.6611, "loss_nan_ranks": 0, "loss_rank_avg": 0.3296949863433838, "step": 15, "valid_targets_mean": 7605.4, "valid_targets_min": 5236 }, { "epoch": 0.022637238256932653, "grad_norm": 12.202975712757784, "learning_rate": 1.2277867528271405e-06, "loss": 0.6527, "loss_nan_ranks": 0, "loss_rank_avg": 0.29244548082351685, "step": 20, "valid_targets_mean": 5827.9, "valid_targets_min": 4727 }, { "epoch": 0.028296547821165818, "grad_norm": 8.284738278527138, "learning_rate": 1.5508885298869145e-06, "loss": 0.6323, "loss_nan_ranks": 0, "loss_rank_avg": 0.3284326195716858, "step": 25, "valid_targets_mean": 6448.2, "valid_targets_min": 4211 }, { "epoch": 0.03395585738539898, "grad_norm": 6.699927356351593, "learning_rate": 1.8739903069466882e-06, "loss": 0.5787, "loss_nan_ranks": 0, "loss_rank_avg": 0.3189699649810791, "step": 30, "valid_targets_mean": 6108.1, "valid_targets_min": 4279 }, { "epoch": 0.039615166949632144, "grad_norm": 5.491375033981934, "learning_rate": 2.197092084006462e-06, "loss": 0.5324, "loss_nan_ranks": 0, "loss_rank_avg": 0.2483714073896408, "step": 35, "valid_targets_mean": 5962.4, "valid_targets_min": 4589 }, { "epoch": 0.045274476513865305, "grad_norm": 5.479122606853314, "learning_rate": 2.5201938610662364e-06, "loss": 0.5064, "loss_nan_ranks": 0, "loss_rank_avg": 0.21808978915214539, "step": 40, "valid_targets_mean": 3503.2, "valid_targets_min": 2015 }, { "epoch": 0.050933786078098474, "grad_norm": 2.1266074610168677, "learning_rate": 2.84329563812601e-06, "loss": 0.4299, "loss_nan_ranks": 0, "loss_rank_avg": 0.1883259415626526, "step": 45, "valid_targets_mean": 6102.5, "valid_targets_min": 4778 }, { "epoch": 0.056593095642331635, "grad_norm": 1.5323390515097495, "learning_rate": 3.166397415185784e-06, "loss": 0.4095, "loss_nan_ranks": 0, "loss_rank_avg": 0.19586817920207977, "step": 50, "valid_targets_mean": 5868.2, "valid_targets_min": 4612 }, { "epoch": 0.0622524052065648, "grad_norm": 1.159860405025848, "learning_rate": 3.489499192245558e-06, "loss": 0.4175, "loss_nan_ranks": 0, "loss_rank_avg": 0.21410322189331055, "step": 55, "valid_targets_mean": 6105.8, "valid_targets_min": 4491 }, { "epoch": 0.06791171477079797, "grad_norm": 0.894038373410666, "learning_rate": 3.812600969305332e-06, "loss": 0.3799, "loss_nan_ranks": 0, "loss_rank_avg": 0.17711375653743744, "step": 60, "valid_targets_mean": 6962.0, "valid_targets_min": 4754 }, { "epoch": 0.07357102433503113, "grad_norm": 0.8624955501056109, "learning_rate": 4.1357027463651056e-06, "loss": 0.3707, "loss_nan_ranks": 0, "loss_rank_avg": 0.1949971616268158, "step": 65, "valid_targets_mean": 6035.1, "valid_targets_min": 4787 }, { "epoch": 0.07923033389926429, "grad_norm": 0.7091607001817442, "learning_rate": 4.458804523424879e-06, "loss": 0.361, "loss_nan_ranks": 0, "loss_rank_avg": 0.18302902579307556, "step": 70, "valid_targets_mean": 6028.5, "valid_targets_min": 5213 }, { "epoch": 0.08488964346349745, "grad_norm": 0.585307554413562, "learning_rate": 4.781906300484653e-06, "loss": 0.3432, "loss_nan_ranks": 0, "loss_rank_avg": 0.14917157590389252, "step": 75, "valid_targets_mean": 6814.1, "valid_targets_min": 4664 }, { "epoch": 0.09054895302773061, "grad_norm": 0.6376342595638888, "learning_rate": 5.105008077544427e-06, "loss": 0.3567, "loss_nan_ranks": 0, "loss_rank_avg": 0.16629627346992493, "step": 80, "valid_targets_mean": 6281.5, "valid_targets_min": 4996 }, { "epoch": 0.09620826259196379, "grad_norm": 0.5883660151243281, "learning_rate": 5.4281098546042014e-06, "loss": 0.3411, "loss_nan_ranks": 0, "loss_rank_avg": 0.16139009594917297, "step": 85, "valid_targets_mean": 6628.9, "valid_targets_min": 4582 }, { "epoch": 0.10186757215619695, "grad_norm": 0.5306968778726449, "learning_rate": 5.751211631663974e-06, "loss": 0.3247, "loss_nan_ranks": 0, "loss_rank_avg": 0.1460968554019928, "step": 90, "valid_targets_mean": 6536.6, "valid_targets_min": 5205 }, { "epoch": 0.10752688172043011, "grad_norm": 0.5036303188428934, "learning_rate": 6.074313408723749e-06, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.15533623099327087, "step": 95, "valid_targets_mean": 7031.0, "valid_targets_min": 5098 }, { "epoch": 0.11318619128466327, "grad_norm": 0.516720651939086, "learning_rate": 6.397415185783522e-06, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.1776922047138214, "step": 100, "valid_targets_mean": 6514.2, "valid_targets_min": 5016 }, { "epoch": 0.11884550084889643, "grad_norm": 0.538952735082876, "learning_rate": 6.7205169628432965e-06, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.20050251483917236, "step": 105, "valid_targets_mean": 6330.0, "valid_targets_min": 965 }, { "epoch": 0.1245048104131296, "grad_norm": 0.5135956002010927, "learning_rate": 7.043618739903069e-06, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.15224193036556244, "step": 110, "valid_targets_mean": 6293.1, "valid_targets_min": 5218 }, { "epoch": 0.13016411997736277, "grad_norm": 0.4731793435324797, "learning_rate": 7.366720516962844e-06, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.13703802227973938, "step": 115, "valid_targets_mean": 6957.4, "valid_targets_min": 4213 }, { "epoch": 0.13582342954159593, "grad_norm": 0.5989726776221539, "learning_rate": 7.689822294022618e-06, "loss": 0.3197, "loss_nan_ranks": 0, "loss_rank_avg": 0.16760709881782532, "step": 120, "valid_targets_mean": 5888.5, "valid_targets_min": 4923 }, { "epoch": 0.1414827391058291, "grad_norm": 0.4926854131506727, "learning_rate": 8.012924071082391e-06, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.19979137182235718, "step": 125, "valid_targets_mean": 7822.9, "valid_targets_min": 4993 }, { "epoch": 0.14714204867006225, "grad_norm": 0.6268142920401387, "learning_rate": 8.336025848142165e-06, "loss": 0.3279, "loss_nan_ranks": 0, "loss_rank_avg": 0.16050826013088226, "step": 130, "valid_targets_mean": 6098.6, "valid_targets_min": 4872 }, { "epoch": 0.15280135823429541, "grad_norm": 0.6293607807525029, "learning_rate": 8.659127625201939e-06, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.15364673733711243, "step": 135, "valid_targets_mean": 6892.2, "valid_targets_min": 4706 }, { "epoch": 0.15846066779852858, "grad_norm": 0.6156398588670324, "learning_rate": 8.982229402261713e-06, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.13796129822731018, "step": 140, "valid_targets_mean": 6352.0, "valid_targets_min": 4889 }, { "epoch": 0.16411997736276174, "grad_norm": 0.5767454589802685, "learning_rate": 9.305331179321486e-06, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.13889192044734955, "step": 145, "valid_targets_mean": 5948.9, "valid_targets_min": 3888 }, { "epoch": 0.1697792869269949, "grad_norm": 0.6287336280725723, "learning_rate": 9.62843295638126e-06, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.13580778241157532, "step": 150, "valid_targets_mean": 5846.2, "valid_targets_min": 4051 }, { "epoch": 0.17543859649122806, "grad_norm": 0.4685830287171293, "learning_rate": 9.951534733441036e-06, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.14092932641506195, "step": 155, "valid_targets_mean": 7319.2, "valid_targets_min": 5230 }, { "epoch": 0.18109790605546122, "grad_norm": 0.5282874259897358, "learning_rate": 1.0274636510500808e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.14267754554748535, "step": 160, "valid_targets_mean": 8235.1, "valid_targets_min": 4997 }, { "epoch": 0.1867572156196944, "grad_norm": 0.5395936939838358, "learning_rate": 1.0597738287560582e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.14883150160312653, "step": 165, "valid_targets_mean": 6402.5, "valid_targets_min": 5364 }, { "epoch": 0.19241652518392757, "grad_norm": 0.5333879494600592, "learning_rate": 1.0920840064620357e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.1588222235441208, "step": 170, "valid_targets_mean": 7117.4, "valid_targets_min": 3391 }, { "epoch": 0.19807583474816073, "grad_norm": 0.4867516211322162, "learning_rate": 1.124394184168013e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.1317976713180542, "step": 175, "valid_targets_mean": 7542.8, "valid_targets_min": 4829 }, { "epoch": 0.2037351443123939, "grad_norm": 0.5420891751146504, "learning_rate": 1.1567043618739904e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.1280643194913864, "step": 180, "valid_targets_mean": 6284.4, "valid_targets_min": 5180 }, { "epoch": 0.20939445387662706, "grad_norm": 0.6661403521505342, "learning_rate": 1.1890145395799677e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.14606133103370667, "step": 185, "valid_targets_mean": 5806.2, "valid_targets_min": 5101 }, { "epoch": 0.21505376344086022, "grad_norm": 0.5210883149895804, "learning_rate": 1.2213247172859452e-05, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.12868677079677582, "step": 190, "valid_targets_mean": 6697.9, "valid_targets_min": 4527 }, { "epoch": 0.22071307300509338, "grad_norm": 0.5097320565529695, "learning_rate": 1.2536348949919226e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.15265926718711853, "step": 195, "valid_targets_mean": 6410.4, "valid_targets_min": 3082 }, { "epoch": 0.22637238256932654, "grad_norm": 0.49409646681977326, "learning_rate": 1.2859450726979e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1307762712240219, "step": 200, "valid_targets_mean": 6847.1, "valid_targets_min": 4685 }, { "epoch": 0.2320316921335597, "grad_norm": 0.5881665700498941, "learning_rate": 1.3182552504038773e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.13722704350948334, "step": 205, "valid_targets_mean": 6194.0, "valid_targets_min": 4644 }, { "epoch": 0.23769100169779286, "grad_norm": 0.5147963094755471, "learning_rate": 1.3505654281098549e-05, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.12045536190271378, "step": 210, "valid_targets_mean": 6283.8, "valid_targets_min": 4433 }, { "epoch": 0.24335031126202603, "grad_norm": 1.0878536917736155, "learning_rate": 1.382875605815832e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.12820014357566833, "step": 215, "valid_targets_mean": 5917.2, "valid_targets_min": 4857 }, { "epoch": 0.2490096208262592, "grad_norm": 0.5533070005440421, "learning_rate": 1.4151857835218094e-05, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.1599322259426117, "step": 220, "valid_targets_mean": 6986.4, "valid_targets_min": 5101 }, { "epoch": 0.2546689303904924, "grad_norm": 0.8360192901625697, "learning_rate": 1.4474959612277868e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.1139596477150917, "step": 225, "valid_targets_mean": 5299.5, "valid_targets_min": 4442 }, { "epoch": 0.26032823995472554, "grad_norm": 0.5113052700220211, "learning_rate": 1.4798061389337644e-05, "loss": 0.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.10088923573493958, "step": 230, "valid_targets_mean": 6133.9, "valid_targets_min": 5130 }, { "epoch": 0.2659875495189587, "grad_norm": 0.556777937085549, "learning_rate": 1.5121163166397417e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.13561654090881348, "step": 235, "valid_targets_mean": 6477.4, "valid_targets_min": 4162 }, { "epoch": 0.27164685908319186, "grad_norm": 0.5097652957820101, "learning_rate": 1.544426494345719e-05, "loss": 0.2444, "loss_nan_ranks": 0, "loss_rank_avg": 0.11574803292751312, "step": 240, "valid_targets_mean": 6350.4, "valid_targets_min": 3940 }, { "epoch": 0.277306168647425, "grad_norm": 0.5471177439544483, "learning_rate": 1.5767366720516963e-05, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.14649951457977295, "step": 245, "valid_targets_mean": 6625.1, "valid_targets_min": 4642 }, { "epoch": 0.2829654782116582, "grad_norm": 0.6360629397684805, "learning_rate": 1.609046849757674e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.13972824811935425, "step": 250, "valid_targets_mean": 4907.0, "valid_targets_min": 4431 }, { "epoch": 0.28862478777589134, "grad_norm": 0.5114528328133985, "learning_rate": 1.641357027463651e-05, "loss": 0.2967, "loss_nan_ranks": 0, "loss_rank_avg": 0.13421732187271118, "step": 255, "valid_targets_mean": 6465.0, "valid_targets_min": 5333 }, { "epoch": 0.2942840973401245, "grad_norm": 0.5662488412896973, "learning_rate": 1.6736672051696286e-05, "loss": 0.247, "loss_nan_ranks": 0, "loss_rank_avg": 0.13066646456718445, "step": 260, "valid_targets_mean": 5650.5, "valid_targets_min": 4769 }, { "epoch": 0.29994340690435767, "grad_norm": 0.596415912061785, "learning_rate": 1.7059773828756058e-05, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.1249205470085144, "step": 265, "valid_targets_mean": 5540.0, "valid_targets_min": 4281 }, { "epoch": 0.30560271646859083, "grad_norm": 0.5414221324867248, "learning_rate": 1.7382875605815834e-05, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.1712135374546051, "step": 270, "valid_targets_mean": 6499.0, "valid_targets_min": 4844 }, { "epoch": 0.311262026032824, "grad_norm": 0.4800403021295474, "learning_rate": 1.770597738287561e-05, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.11049605160951614, "step": 275, "valid_targets_mean": 5736.5, "valid_targets_min": 5227 }, { "epoch": 0.31692133559705715, "grad_norm": 0.4602797707086169, "learning_rate": 1.802907915993538e-05, "loss": 0.2484, "loss_nan_ranks": 0, "loss_rank_avg": 0.09841249883174896, "step": 280, "valid_targets_mean": 5857.2, "valid_targets_min": 2461 }, { "epoch": 0.3225806451612903, "grad_norm": 0.5144413634754103, "learning_rate": 1.8352180936995153e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.11220520734786987, "step": 285, "valid_targets_mean": 5793.4, "valid_targets_min": 2815 }, { "epoch": 0.3282399547255235, "grad_norm": 0.518213039234328, "learning_rate": 1.867528271405493e-05, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.10794945061206818, "step": 290, "valid_targets_mean": 6588.8, "valid_targets_min": 4875 }, { "epoch": 0.33389926428975664, "grad_norm": 0.5028338131244561, "learning_rate": 1.8998384491114704e-05, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.11335889995098114, "step": 295, "valid_targets_mean": 5984.8, "valid_targets_min": 4901 }, { "epoch": 0.3395585738539898, "grad_norm": 0.5014172240561889, "learning_rate": 1.9321486268174476e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.11073829233646393, "step": 300, "valid_targets_mean": 6067.4, "valid_targets_min": 3786 }, { "epoch": 0.34521788341822296, "grad_norm": 0.5159175569899495, "learning_rate": 1.9644588045234248e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.12275815010070801, "step": 305, "valid_targets_mean": 5852.5, "valid_targets_min": 5057 }, { "epoch": 0.3508771929824561, "grad_norm": 0.4920285069970866, "learning_rate": 1.9967689822294024e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.13101038336753845, "step": 310, "valid_targets_mean": 6362.2, "valid_targets_min": 3952 }, { "epoch": 0.3565365025466893, "grad_norm": 0.5829499325070455, "learning_rate": 2.0290791599353796e-05, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.12691429257392883, "step": 315, "valid_targets_mean": 5360.2, "valid_targets_min": 4267 }, { "epoch": 0.36219581211092244, "grad_norm": 0.5106185491779682, "learning_rate": 2.0613893376413575e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.14615000784397125, "step": 320, "valid_targets_mean": 6842.1, "valid_targets_min": 4785 }, { "epoch": 0.3678551216751556, "grad_norm": 0.46986873220654096, "learning_rate": 2.0936995153473347e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.11088338494300842, "step": 325, "valid_targets_mean": 6188.5, "valid_targets_min": 5438 }, { "epoch": 0.3735144312393888, "grad_norm": 0.5155604844270958, "learning_rate": 2.1260096930533122e-05, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.12904900312423706, "step": 330, "valid_targets_mean": 5848.6, "valid_targets_min": 4734 }, { "epoch": 0.379173740803622, "grad_norm": 0.5286196270158149, "learning_rate": 2.1583198707592894e-05, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.10007612407207489, "step": 335, "valid_targets_mean": 6278.2, "valid_targets_min": 5636 }, { "epoch": 0.38483305036785515, "grad_norm": 0.6422666761769791, "learning_rate": 2.1906300484652666e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.10531717538833618, "step": 340, "valid_targets_mean": 6168.9, "valid_targets_min": 4206 }, { "epoch": 0.3904923599320883, "grad_norm": 0.4809008293583508, "learning_rate": 2.2229402261712442e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.1038937121629715, "step": 345, "valid_targets_mean": 6226.5, "valid_targets_min": 4535 }, { "epoch": 0.39615166949632147, "grad_norm": 0.4200796846107823, "learning_rate": 2.2552504038772214e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.11499610543251038, "step": 350, "valid_targets_mean": 7821.6, "valid_targets_min": 5471 }, { "epoch": 0.40181097906055463, "grad_norm": 0.46601849681120616, "learning_rate": 2.2875605815831986e-05, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.10218453407287598, "step": 355, "valid_targets_mean": 6843.0, "valid_targets_min": 5243 }, { "epoch": 0.4074702886247878, "grad_norm": 0.5592711031433829, "learning_rate": 2.3198707592891765e-05, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.138760507106781, "step": 360, "valid_targets_mean": 6658.6, "valid_targets_min": 4906 }, { "epoch": 0.41312959818902095, "grad_norm": 0.4764946128159071, "learning_rate": 2.3521809369951537e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.1221180111169815, "step": 365, "valid_targets_mean": 6799.5, "valid_targets_min": 5168 }, { "epoch": 0.4187889077532541, "grad_norm": 0.5633069925985472, "learning_rate": 2.3844911147011312e-05, "loss": 0.2551, "loss_nan_ranks": 0, "loss_rank_avg": 0.13051849603652954, "step": 370, "valid_targets_mean": 5376.2, "valid_targets_min": 3130 }, { "epoch": 0.4244482173174873, "grad_norm": 0.980342272097954, "learning_rate": 2.4168012924071084e-05, "loss": 0.2463, "loss_nan_ranks": 0, "loss_rank_avg": 0.11312370002269745, "step": 375, "valid_targets_mean": 2843.1, "valid_targets_min": 1990 }, { "epoch": 0.43010752688172044, "grad_norm": 0.822944627042817, "learning_rate": 2.449111470113086e-05, "loss": 0.2248, "loss_nan_ranks": 0, "loss_rank_avg": 0.1140211820602417, "step": 380, "valid_targets_mean": 2532.2, "valid_targets_min": 324 }, { "epoch": 0.4357668364459536, "grad_norm": 0.6701905365467292, "learning_rate": 2.4814216478190632e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.08650068193674088, "step": 385, "valid_targets_mean": 2359.2, "valid_targets_min": 982 }, { "epoch": 0.44142614601018676, "grad_norm": 0.5747277053205969, "learning_rate": 2.5137318255250404e-05, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.0882439985871315, "step": 390, "valid_targets_mean": 3640.0, "valid_targets_min": 2479 }, { "epoch": 0.4470854555744199, "grad_norm": 0.5225775305209468, "learning_rate": 2.546042003231018e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.057190995663404465, "step": 395, "valid_targets_mean": 3079.5, "valid_targets_min": 811 }, { "epoch": 0.4527447651386531, "grad_norm": 0.5826735610560169, "learning_rate": 2.5783521809369955e-05, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.0974460318684578, "step": 400, "valid_targets_mean": 3113.4, "valid_targets_min": 1431 }, { "epoch": 0.45840407470288624, "grad_norm": 1.0037976393338115, "learning_rate": 2.610662358642973e-05, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.1623167097568512, "step": 405, "valid_targets_mean": 1990.9, "valid_targets_min": 702 }, { "epoch": 0.4640633842671194, "grad_norm": 0.5191241155436422, "learning_rate": 2.6429725363489502e-05, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.08460583537817001, "step": 410, "valid_targets_mean": 3221.6, "valid_targets_min": 621 }, { "epoch": 0.46972269383135257, "grad_norm": 0.677644881422118, "learning_rate": 2.6752827140549274e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.0884869396686554, "step": 415, "valid_targets_mean": 2591.4, "valid_targets_min": 846 }, { "epoch": 0.47538200339558573, "grad_norm": 0.6341714358056391, "learning_rate": 2.707592891760905e-05, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.10547944158315659, "step": 420, "valid_targets_mean": 3738.9, "valid_targets_min": 1369 }, { "epoch": 0.4810413129598189, "grad_norm": 0.5089106640165426, "learning_rate": 2.7399030694668822e-05, "loss": 0.1232, "loss_nan_ranks": 0, "loss_rank_avg": 0.07162182033061981, "step": 425, "valid_targets_mean": 2715.4, "valid_targets_min": 754 }, { "epoch": 0.48670062252405205, "grad_norm": 0.6511128875447165, "learning_rate": 2.7722132471728597e-05, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.09212324023246765, "step": 430, "valid_targets_mean": 2725.9, "valid_targets_min": 776 }, { "epoch": 0.4923599320882852, "grad_norm": 0.468238315396383, "learning_rate": 2.804523424878837e-05, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.09181820601224899, "step": 435, "valid_targets_mean": 3194.4, "valid_targets_min": 754 }, { "epoch": 0.4980192416525184, "grad_norm": 0.8727612672516372, "learning_rate": 2.8368336025848148e-05, "loss": 0.2077, "loss_nan_ranks": 0, "loss_rank_avg": 0.2480352222919464, "step": 440, "valid_targets_mean": 2053.8, "valid_targets_min": 664 }, { "epoch": 0.5036785512167515, "grad_norm": 0.5210005323173948, "learning_rate": 2.869143780290792e-05, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.08143844455480576, "step": 445, "valid_targets_mean": 3771.4, "valid_targets_min": 2542 }, { "epoch": 0.5093378607809848, "grad_norm": 0.5379047687704024, "learning_rate": 2.9014539579967692e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.09487590193748474, "step": 450, "valid_targets_mean": 3486.2, "valid_targets_min": 2988 }, { "epoch": 0.5149971703452179, "grad_norm": 0.5672323966032542, "learning_rate": 2.9337641357027468e-05, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.08703413605690002, "step": 455, "valid_targets_mean": 3779.4, "valid_targets_min": 3281 }, { "epoch": 0.5206564799094511, "grad_norm": 0.6137232437450363, "learning_rate": 2.966074313408724e-05, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.07755735516548157, "step": 460, "valid_targets_mean": 3471.1, "valid_targets_min": 2189 }, { "epoch": 0.5263157894736842, "grad_norm": 0.5015341485462157, "learning_rate": 2.9983844911147012e-05, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.06586933135986328, "step": 465, "valid_targets_mean": 3483.6, "valid_targets_min": 1788 }, { "epoch": 0.5319750990379174, "grad_norm": 0.7406309314592703, "learning_rate": 3.0306946688206787e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.09322462230920792, "step": 470, "valid_targets_mean": 2562.1, "valid_targets_min": 597 }, { "epoch": 0.5376344086021505, "grad_norm": 0.7033983658453125, "learning_rate": 3.063004846526656e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.07036390900611877, "step": 475, "valid_targets_mean": 2272.8, "valid_targets_min": 701 }, { "epoch": 0.5432937181663837, "grad_norm": 0.6806014114354145, "learning_rate": 3.095315024232634e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.11313560605049133, "step": 480, "valid_targets_mean": 2971.0, "valid_targets_min": 1652 }, { "epoch": 0.5489530277306168, "grad_norm": 0.47880028331211966, "learning_rate": 3.127625201938611e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.07742761820554733, "step": 485, "valid_targets_mean": 3747.4, "valid_targets_min": 1908 }, { "epoch": 0.55461233729485, "grad_norm": 0.6132600376986139, "learning_rate": 3.159935379644588e-05, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.058801814913749695, "step": 490, "valid_targets_mean": 3247.8, "valid_targets_min": 971 }, { "epoch": 0.5602716468590832, "grad_norm": 0.5322542810337509, "learning_rate": 3.1922455573505654e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.0757409855723381, "step": 495, "valid_targets_mean": 3422.2, "valid_targets_min": 2552 }, { "epoch": 0.5659309564233164, "grad_norm": 0.555861116706065, "learning_rate": 3.224555735056543e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.061425432562828064, "step": 500, "valid_targets_mean": 2948.9, "valid_targets_min": 753 }, { "epoch": 0.5715902659875495, "grad_norm": 0.692458977719794, "learning_rate": 3.2568659127625205e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.06144799664616585, "step": 505, "valid_targets_mean": 1090.5, "valid_targets_min": 568 }, { "epoch": 0.5772495755517827, "grad_norm": 0.6074379759592959, "learning_rate": 3.289176090468498e-05, "loss": 0.3801, "loss_nan_ranks": 0, "loss_rank_avg": 0.16443628072738647, "step": 510, "valid_targets_mean": 2921.1, "valid_targets_min": 1070 }, { "epoch": 0.5829088851160158, "grad_norm": 0.7139647841577196, "learning_rate": 3.321486268174475e-05, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.07074105739593506, "step": 515, "valid_targets_mean": 2052.1, "valid_targets_min": 329 }, { "epoch": 0.588568194680249, "grad_norm": 0.9997802597595687, "learning_rate": 3.353796445880453e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.08975844085216522, "step": 520, "valid_targets_mean": 998.2, "valid_targets_min": 608 }, { "epoch": 0.5942275042444821, "grad_norm": 0.5353719487561314, "learning_rate": 3.38610662358643e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.08616983890533447, "step": 525, "valid_targets_mean": 4405.9, "valid_targets_min": 2772 }, { "epoch": 0.5998868138087153, "grad_norm": 0.37012257410615623, "learning_rate": 3.418416801292407e-05, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.03389976918697357, "step": 530, "valid_targets_mean": 5138.2, "valid_targets_min": 3778 }, { "epoch": 0.6055461233729486, "grad_norm": 0.42309989480020843, "learning_rate": 3.450726978998385e-05, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.07327836751937866, "step": 535, "valid_targets_mean": 4641.0, "valid_targets_min": 2336 }, { "epoch": 0.6112054329371817, "grad_norm": 0.4767188679502289, "learning_rate": 3.483037156704362e-05, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.09635117650032043, "step": 540, "valid_targets_mean": 3962.1, "valid_targets_min": 2161 }, { "epoch": 0.6168647425014149, "grad_norm": 0.4625024398234958, "learning_rate": 3.5153473344103395e-05, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.07724954187870026, "step": 545, "valid_targets_mean": 3271.8, "valid_targets_min": 798 }, { "epoch": 0.622524052065648, "grad_norm": 0.5338159680740975, "learning_rate": 3.547657512116317e-05, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.05782943218946457, "step": 550, "valid_targets_mean": 1915.8, "valid_targets_min": 533 }, { "epoch": 0.6281833616298812, "grad_norm": 0.5326298581049448, "learning_rate": 3.579967689822294e-05, "loss": 0.1356, "loss_nan_ranks": 0, "loss_rank_avg": 0.06620592623949051, "step": 555, "valid_targets_mean": 2589.2, "valid_targets_min": 833 }, { "epoch": 0.6338426711941143, "grad_norm": 0.3929364751105547, "learning_rate": 3.612277867528272e-05, "loss": 0.1258, "loss_nan_ranks": 0, "loss_rank_avg": 0.06302763521671295, "step": 560, "valid_targets_mean": 3888.0, "valid_targets_min": 3391 }, { "epoch": 0.6395019807583475, "grad_norm": 0.6449559476750033, "learning_rate": 3.644588045234249e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.0976746454834938, "step": 565, "valid_targets_mean": 1517.1, "valid_targets_min": 732 }, { "epoch": 0.6451612903225806, "grad_norm": 0.7287905778647281, "learning_rate": 3.676898222940227e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.09375546127557755, "step": 570, "valid_targets_mean": 1623.9, "valid_targets_min": 538 }, { "epoch": 0.6508205998868138, "grad_norm": 0.9334597399750638, "learning_rate": 3.709208400646204e-05, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.07705486565828323, "step": 575, "valid_targets_mean": 1158.1, "valid_targets_min": 720 }, { "epoch": 0.656479909451047, "grad_norm": 0.520582326302511, "learning_rate": 3.741518578352181e-05, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.0693022832274437, "step": 580, "valid_targets_mean": 2982.2, "valid_targets_min": 2328 }, { "epoch": 0.6621392190152802, "grad_norm": 0.5193502586396022, "learning_rate": 3.7738287560581585e-05, "loss": 0.1211, "loss_nan_ranks": 0, "loss_rank_avg": 0.05764622613787651, "step": 585, "valid_targets_mean": 2637.0, "valid_targets_min": 684 }, { "epoch": 0.6677985285795133, "grad_norm": 0.5086958802467102, "learning_rate": 3.806138933764136e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.0691675916314125, "step": 590, "valid_targets_mean": 3441.4, "valid_targets_min": 2795 }, { "epoch": 0.6734578381437465, "grad_norm": 0.4850447820432571, "learning_rate": 3.838449111470113e-05, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.07534271478652954, "step": 595, "valid_targets_mean": 3286.4, "valid_targets_min": 744 }, { "epoch": 0.6791171477079796, "grad_norm": 0.48421566338639804, "learning_rate": 3.870759289176091e-05, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.05804857611656189, "step": 600, "valid_targets_mean": 3976.5, "valid_targets_min": 3279 }, { "epoch": 0.6847764572722128, "grad_norm": 0.7226548407603152, "learning_rate": 3.903069466882068e-05, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.07041174173355103, "step": 605, "valid_targets_mean": 1140.4, "valid_targets_min": 536 }, { "epoch": 0.6904357668364459, "grad_norm": 0.571223926526635, "learning_rate": 3.935379644588046e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.06768079102039337, "step": 610, "valid_targets_mean": 2468.8, "valid_targets_min": 853 }, { "epoch": 0.6960950764006791, "grad_norm": 0.5652274695532502, "learning_rate": 3.967689822294023e-05, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.0701763778924942, "step": 615, "valid_targets_mean": 3205.8, "valid_targets_min": 2621 }, { "epoch": 0.7017543859649122, "grad_norm": 0.7631423275049859, "learning_rate": 4e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.07661966979503632, "step": 620, "valid_targets_mean": 1332.4, "valid_targets_min": 728 }, { "epoch": 0.7074136955291455, "grad_norm": 0.7426645119465096, "learning_rate": 3.999992044178504e-05, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.07438753545284271, "step": 625, "valid_targets_mean": 1538.9, "valid_targets_min": 618 }, { "epoch": 0.7130730050933786, "grad_norm": 0.434165182746641, "learning_rate": 3.9999681767773104e-05, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.08520899713039398, "step": 630, "valid_targets_mean": 4142.9, "valid_targets_min": 907 }, { "epoch": 0.7187323146576118, "grad_norm": 0.6276743040350341, "learning_rate": 3.999928397986304e-05, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.11276379972696304, "step": 635, "valid_targets_mean": 3060.4, "valid_targets_min": 577 }, { "epoch": 0.7243916242218449, "grad_norm": 0.4341449304787945, "learning_rate": 3.9998727081219585e-05, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.056107230484485626, "step": 640, "valid_targets_mean": 3732.2, "valid_targets_min": 726 }, { "epoch": 0.7300509337860781, "grad_norm": 0.40263084785984393, "learning_rate": 3.999801107627332e-05, "loss": 0.1153, "loss_nan_ranks": 0, "loss_rank_avg": 0.0675823912024498, "step": 645, "valid_targets_mean": 4288.9, "valid_targets_min": 2252 }, { "epoch": 0.7357102433503112, "grad_norm": 0.5991957808916428, "learning_rate": 3.9997135970720655e-05, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.07685792446136475, "step": 650, "valid_targets_mean": 2427.5, "valid_targets_min": 531 }, { "epoch": 0.7413695529145444, "grad_norm": 0.5224063375277248, "learning_rate": 3.9996101771523766e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.061697687953710556, "step": 655, "valid_targets_mean": 2126.6, "valid_targets_min": 744 }, { "epoch": 0.7470288624787776, "grad_norm": 0.4345176533930879, "learning_rate": 3.999490848691057e-05, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.06378062069416046, "step": 660, "valid_targets_mean": 3755.5, "valid_targets_min": 3024 }, { "epoch": 0.7526881720430108, "grad_norm": 0.4569816247653973, "learning_rate": 3.999355612637461e-05, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.07932804524898529, "step": 665, "valid_targets_mean": 3352.0, "valid_targets_min": 2366 }, { "epoch": 0.758347481607244, "grad_norm": 0.5751225435233932, "learning_rate": 3.999204470067504e-05, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.07831130921840668, "step": 670, "valid_targets_mean": 956.8, "valid_targets_min": 509 }, { "epoch": 0.7640067911714771, "grad_norm": 0.48072853866166537, "learning_rate": 3.9990374221836484e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.06048751622438431, "step": 675, "valid_targets_mean": 3013.6, "valid_targets_min": 1158 }, { "epoch": 0.7696661007357103, "grad_norm": 0.40749695301719024, "learning_rate": 3.998854470314898e-05, "loss": 0.1127, "loss_nan_ranks": 0, "loss_rank_avg": 0.05904872715473175, "step": 680, "valid_targets_mean": 3860.5, "valid_targets_min": 3044 }, { "epoch": 0.7753254102999434, "grad_norm": 0.4479181701407655, "learning_rate": 3.9986556159167846e-05, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.04606478661298752, "step": 685, "valid_targets_mean": 2286.4, "valid_targets_min": 539 }, { "epoch": 0.7809847198641766, "grad_norm": 0.4692149977774639, "learning_rate": 3.998440860571358e-05, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.059417132288217545, "step": 690, "valid_targets_mean": 2865.5, "valid_targets_min": 912 }, { "epoch": 0.7866440294284097, "grad_norm": 0.6595632418113099, "learning_rate": 3.998210205987175e-05, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.08933501690626144, "step": 695, "valid_targets_mean": 2087.4, "valid_targets_min": 872 }, { "epoch": 0.7923033389926429, "grad_norm": 0.43788134024153513, "learning_rate": 3.9979636539992805e-05, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.05341676250100136, "step": 700, "valid_targets_mean": 3380.1, "valid_targets_min": 2254 }, { "epoch": 0.797962648556876, "grad_norm": 0.8001613859076356, "learning_rate": 3.9977012065692e-05, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.09082688391208649, "step": 705, "valid_targets_mean": 1274.0, "valid_targets_min": 605 }, { "epoch": 0.8036219581211093, "grad_norm": 0.5094244900852393, "learning_rate": 3.997422865784916e-05, "loss": 0.1327, "loss_nan_ranks": 0, "loss_rank_avg": 0.07657082378864288, "step": 710, "valid_targets_mean": 2289.0, "valid_targets_min": 1117 }, { "epoch": 0.8092812676853424, "grad_norm": 0.4600031239543275, "learning_rate": 3.99712863386086e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.06370458006858826, "step": 715, "valid_targets_mean": 3169.9, "valid_targets_min": 1132 }, { "epoch": 0.8149405772495756, "grad_norm": 0.5229218472624875, "learning_rate": 3.9968185131378876e-05, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.04839629679918289, "step": 720, "valid_targets_mean": 2107.4, "valid_targets_min": 524 }, { "epoch": 0.8205998868138087, "grad_norm": 0.5010534381484323, "learning_rate": 3.996492506083264e-05, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.05224666744470596, "step": 725, "valid_targets_mean": 1705.8, "valid_targets_min": 516 }, { "epoch": 0.8262591963780419, "grad_norm": 0.5503804393257022, "learning_rate": 3.9961506152906445e-05, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.07331585884094238, "step": 730, "valid_targets_mean": 2088.2, "valid_targets_min": 342 }, { "epoch": 0.831918505942275, "grad_norm": 0.35323711189740525, "learning_rate": 3.995792843480051e-05, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.06214073300361633, "step": 735, "valid_targets_mean": 3528.1, "valid_targets_min": 1935 }, { "epoch": 0.8375778155065082, "grad_norm": 0.5249098117659579, "learning_rate": 3.9954191934978494e-05, "loss": 0.1143, "loss_nan_ranks": 0, "loss_rank_avg": 0.043227165937423706, "step": 740, "valid_targets_mean": 1818.2, "valid_targets_min": 564 }, { "epoch": 0.8432371250707413, "grad_norm": 0.3299099340846902, "learning_rate": 3.995029668316735e-05, "loss": 0.1254, "loss_nan_ranks": 0, "loss_rank_avg": 0.06274382770061493, "step": 745, "valid_targets_mean": 5238.9, "valid_targets_min": 3653 }, { "epoch": 0.8488964346349746, "grad_norm": 0.36575794432079584, "learning_rate": 3.9946242710356994e-05, "loss": 0.1216, "loss_nan_ranks": 0, "loss_rank_avg": 0.040668781846761703, "step": 750, "valid_targets_mean": 2983.4, "valid_targets_min": 684 }, { "epoch": 0.8545557441992077, "grad_norm": 0.5075588125856926, "learning_rate": 3.994203004880012e-05, "loss": 0.1079, "loss_nan_ranks": 0, "loss_rank_avg": 0.06988832354545593, "step": 755, "valid_targets_mean": 3324.8, "valid_targets_min": 726 }, { "epoch": 0.8602150537634409, "grad_norm": 0.39852501254916606, "learning_rate": 3.9937658732011905e-05, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.0661604031920433, "step": 760, "valid_targets_mean": 4154.5, "valid_targets_min": 3469 }, { "epoch": 0.865874363327674, "grad_norm": 0.686455143981827, "learning_rate": 3.993312879476976e-05, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.19141210615634918, "step": 765, "valid_targets_mean": 2561.6, "valid_targets_min": 1536 }, { "epoch": 0.8715336728919072, "grad_norm": 0.43519246110287957, "learning_rate": 3.992844027311307e-05, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.06963059306144714, "step": 770, "valid_targets_mean": 2912.4, "valid_targets_min": 582 }, { "epoch": 0.8771929824561403, "grad_norm": 0.3610697013476402, "learning_rate": 3.992359320434287e-05, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.049161579459905624, "step": 775, "valid_targets_mean": 3388.5, "valid_targets_min": 633 }, { "epoch": 0.8828522920203735, "grad_norm": 0.4253116172505089, "learning_rate": 3.9918587627021566e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.05305824428796768, "step": 780, "valid_targets_mean": 3263.6, "valid_targets_min": 1130 }, { "epoch": 0.8885116015846066, "grad_norm": 0.41320327540238194, "learning_rate": 3.991342358097265e-05, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.0637916624546051, "step": 785, "valid_targets_mean": 2866.5, "valid_targets_min": 492 }, { "epoch": 0.8941709111488398, "grad_norm": 0.828001679310075, "learning_rate": 3.990810110728034e-05, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.10161933302879333, "step": 790, "valid_targets_mean": 2353.8, "valid_targets_min": 1045 }, { "epoch": 0.8998302207130731, "grad_norm": 0.38967894220881866, "learning_rate": 3.99026202482893e-05, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.04142877459526062, "step": 795, "valid_targets_mean": 3043.9, "valid_targets_min": 647 }, { "epoch": 0.9054895302773062, "grad_norm": 0.7579700154789877, "learning_rate": 3.989698104760425e-05, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.11227335035800934, "step": 800, "valid_targets_mean": 2093.0, "valid_targets_min": 806 }, { "epoch": 0.9111488398415394, "grad_norm": 0.6550049745460668, "learning_rate": 3.989118355008968e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.06615293025970459, "step": 805, "valid_targets_mean": 1208.8, "valid_targets_min": 575 }, { "epoch": 0.9168081494057725, "grad_norm": 0.5313531127641108, "learning_rate": 3.988522780186943e-05, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.058285586535930634, "step": 810, "valid_targets_mean": 3447.5, "valid_targets_min": 2784 }, { "epoch": 0.9224674589700057, "grad_norm": 0.42281770147833686, "learning_rate": 3.987911385032638e-05, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.05373559519648552, "step": 815, "valid_targets_mean": 3721.6, "valid_targets_min": 2525 }, { "epoch": 0.9281267685342388, "grad_norm": 0.4127768410682695, "learning_rate": 3.987284174410203e-05, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.05588556081056595, "step": 820, "valid_targets_mean": 2665.2, "valid_targets_min": 767 }, { "epoch": 0.933786078098472, "grad_norm": 0.4894787437319876, "learning_rate": 3.986641153309615e-05, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.052959829568862915, "step": 825, "valid_targets_mean": 2277.6, "valid_targets_min": 870 }, { "epoch": 0.9394453876627051, "grad_norm": 0.7402127878724636, "learning_rate": 3.985982326846634e-05, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.09184592217206955, "step": 830, "valid_targets_mean": 1535.8, "valid_targets_min": 758 }, { "epoch": 0.9451046972269384, "grad_norm": 0.46799832031998007, "learning_rate": 3.985307700262765e-05, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.059100307524204254, "step": 835, "valid_targets_mean": 2024.1, "valid_targets_min": 797 }, { "epoch": 0.9507640067911715, "grad_norm": 0.3657972143765407, "learning_rate": 3.984617278925218e-05, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.05874822288751602, "step": 840, "valid_targets_mean": 3299.5, "valid_targets_min": 1606 }, { "epoch": 0.9564233163554047, "grad_norm": 0.433457585178867, "learning_rate": 3.9839110683268624e-05, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.0675329715013504, "step": 845, "valid_targets_mean": 3055.0, "valid_targets_min": 678 }, { "epoch": 0.9620826259196378, "grad_norm": 0.3318398548480011, "learning_rate": 3.9831890740861826e-05, "loss": 0.1292, "loss_nan_ranks": 0, "loss_rank_avg": 0.06505134701728821, "step": 850, "valid_targets_mean": 4980.6, "valid_targets_min": 1078 }, { "epoch": 0.967741935483871, "grad_norm": 0.3441479953856927, "learning_rate": 3.982451301947236e-05, "loss": 0.1129, "loss_nan_ranks": 0, "loss_rank_avg": 0.04246465489268303, "step": 855, "valid_targets_mean": 2680.8, "valid_targets_min": 706 }, { "epoch": 0.9734012450481041, "grad_norm": 0.6698327188776084, "learning_rate": 3.981697757779606e-05, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.08046382665634155, "step": 860, "valid_targets_mean": 1580.4, "valid_targets_min": 580 }, { "epoch": 0.9790605546123373, "grad_norm": 0.6426747257677874, "learning_rate": 3.980928447578356e-05, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.10326772928237915, "step": 865, "valid_targets_mean": 2592.1, "valid_targets_min": 780 }, { "epoch": 0.9847198641765704, "grad_norm": 0.4076799742075529, "learning_rate": 3.98014337746398e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.04925592988729477, "step": 870, "valid_targets_mean": 3478.2, "valid_targets_min": 2861 }, { "epoch": 0.9903791737408036, "grad_norm": 0.40044366441837925, "learning_rate": 3.9793425536823555e-05, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.06652865558862686, "step": 875, "valid_targets_mean": 3846.5, "valid_targets_min": 2453 }, { "epoch": 0.9960384833050367, "grad_norm": 0.43952559861608015, "learning_rate": 3.978525982604695e-05, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.07187198102474213, "step": 880, "valid_targets_mean": 3881.8, "valid_targets_min": 3389 }, { "epoch": 1.0011318619128466, "grad_norm": 0.6856007855669121, "learning_rate": 3.977693670727491e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.13266420364379883, "step": 885, "valid_targets_mean": 6935.0, "valid_targets_min": 5295 }, { "epoch": 1.0067911714770799, "grad_norm": 0.43379131857748404, "learning_rate": 3.9768456246724675e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.1459798812866211, "step": 890, "valid_targets_mean": 7672.9, "valid_targets_min": 5066 }, { "epoch": 1.0124504810413129, "grad_norm": 0.4683116079781387, "learning_rate": 3.97598185118653e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.12084569036960602, "step": 895, "valid_targets_mean": 7347.6, "valid_targets_min": 4923 }, { "epoch": 1.018109790605546, "grad_norm": 0.48855719634434, "learning_rate": 3.975102357141704e-05, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.11077947914600372, "step": 900, "valid_targets_mean": 5446.8, "valid_targets_min": 3922 }, { "epoch": 1.0237691001697793, "grad_norm": 0.42798402935325797, "learning_rate": 3.974207149535088e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.1109333485364914, "step": 905, "valid_targets_mean": 6924.9, "valid_targets_min": 4797 }, { "epoch": 1.0294284097340125, "grad_norm": 0.4351702732960488, "learning_rate": 3.9732962354887936e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.12490881234407425, "step": 910, "valid_targets_mean": 6443.5, "valid_targets_min": 3853 }, { "epoch": 1.0350877192982457, "grad_norm": 0.47752325780331667, "learning_rate": 3.972369622249891e-05, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.1165180504322052, "step": 915, "valid_targets_mean": 5446.5, "valid_targets_min": 4487 }, { "epoch": 1.0407470288624787, "grad_norm": 0.55468198932523, "learning_rate": 3.9714273171903486e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.11226481199264526, "step": 920, "valid_targets_mean": 6210.2, "valid_targets_min": 4137 }, { "epoch": 1.046406338426712, "grad_norm": 0.5656955802461123, "learning_rate": 3.970469327806978e-05, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.20384201407432556, "step": 925, "valid_targets_mean": 5404.4, "valid_targets_min": 698 }, { "epoch": 1.0520656479909452, "grad_norm": 0.42478256890845617, "learning_rate": 3.969495661721372e-05, "loss": 0.2205, "loss_nan_ranks": 0, "loss_rank_avg": 0.13021141290664673, "step": 930, "valid_targets_mean": 7197.6, "valid_targets_min": 4499 }, { "epoch": 1.0577249575551784, "grad_norm": 0.47440889374120215, "learning_rate": 3.9685063266798434e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.15133237838745117, "step": 935, "valid_targets_mean": 5538.4, "valid_targets_min": 4291 }, { "epoch": 1.0633842671194114, "grad_norm": 0.45853285772484853, "learning_rate": 3.967501330553366e-05, "loss": 0.2201, "loss_nan_ranks": 0, "loss_rank_avg": 0.09450241178274155, "step": 940, "valid_targets_mean": 5531.4, "valid_targets_min": 4050 }, { "epoch": 1.0690435766836446, "grad_norm": 0.4165165821206238, "learning_rate": 3.966480681337508e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.12836091220378876, "step": 945, "valid_targets_mean": 7526.6, "valid_targets_min": 5196 }, { "epoch": 1.0747028862478778, "grad_norm": 0.4439127191876095, "learning_rate": 3.965444387152375e-05, "loss": 0.2109, "loss_nan_ranks": 0, "loss_rank_avg": 0.103563092648983, "step": 950, "valid_targets_mean": 6248.9, "valid_targets_min": 4749 }, { "epoch": 1.080362195812111, "grad_norm": 0.5042962353960474, "learning_rate": 3.9643924562425365e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.05952709913253784, "step": 955, "valid_targets_mean": 3248.5, "valid_targets_min": 1908 }, { "epoch": 1.086021505376344, "grad_norm": 0.4245617765773125, "learning_rate": 3.963324896976968e-05, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.10588788986206055, "step": 960, "valid_targets_mean": 6225.6, "valid_targets_min": 4808 }, { "epoch": 1.0916808149405772, "grad_norm": 0.44302682414413963, "learning_rate": 3.962241717848979e-05, "loss": 0.2233, "loss_nan_ranks": 0, "loss_rank_avg": 0.10773646831512451, "step": 965, "valid_targets_mean": 5383.0, "valid_targets_min": 3774 }, { "epoch": 1.0973401245048104, "grad_norm": 0.4090806507981392, "learning_rate": 3.961142927476151e-05, "loss": 0.2164, "loss_nan_ranks": 0, "loss_rank_avg": 0.11196926236152649, "step": 970, "valid_targets_mean": 6291.4, "valid_targets_min": 5335 }, { "epoch": 1.1029994340690437, "grad_norm": 0.3734040338697041, "learning_rate": 3.960028534600264e-05, "loss": 0.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.11295393109321594, "step": 975, "valid_targets_mean": 7749.1, "valid_targets_min": 6205 }, { "epoch": 1.1086587436332767, "grad_norm": 0.3906381278203426, "learning_rate": 3.9588985480872275e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.10481761395931244, "step": 980, "valid_targets_mean": 6882.1, "valid_targets_min": 4428 }, { "epoch": 1.1143180531975099, "grad_norm": 0.4456420223942386, "learning_rate": 3.9577529769270137e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.11185906827449799, "step": 985, "valid_targets_mean": 5751.8, "valid_targets_min": 4458 }, { "epoch": 1.119977362761743, "grad_norm": 0.4397561377985395, "learning_rate": 3.9565918302335816e-05, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.09672285616397858, "step": 990, "valid_targets_mean": 6003.9, "valid_targets_min": 4458 }, { "epoch": 1.1256366723259763, "grad_norm": 0.4329998383462111, "learning_rate": 3.955415117244807e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.09833373129367828, "step": 995, "valid_targets_mean": 6033.8, "valid_targets_min": 4066 }, { "epoch": 1.1312959818902093, "grad_norm": 0.41841572645344943, "learning_rate": 3.9542228473224086e-05, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.11922608315944672, "step": 1000, "valid_targets_mean": 6601.0, "valid_targets_min": 4708 }, { "epoch": 1.1369552914544425, "grad_norm": 0.4315438341662908, "learning_rate": 3.953015029951874e-05, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.12108911573886871, "step": 1005, "valid_targets_mean": 6092.1, "valid_targets_min": 4789 }, { "epoch": 1.1426146010186757, "grad_norm": 0.40535781524675796, "learning_rate": 3.9517916747423804e-05, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.12264654040336609, "step": 1010, "valid_targets_mean": 6474.6, "valid_targets_min": 4224 }, { "epoch": 1.148273910582909, "grad_norm": 0.41571559354767595, "learning_rate": 3.9505527914267255e-05, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.11821147054433823, "step": 1015, "valid_targets_mean": 6312.4, "valid_targets_min": 4617 }, { "epoch": 1.1539332201471422, "grad_norm": 0.40714327444148485, "learning_rate": 3.949298389861243e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.11297283321619034, "step": 1020, "valid_targets_mean": 6333.8, "valid_targets_min": 4783 }, { "epoch": 1.1595925297113752, "grad_norm": 0.45247118108391804, "learning_rate": 3.948028480025728e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.11267365515232086, "step": 1025, "valid_targets_mean": 7380.1, "valid_targets_min": 6020 }, { "epoch": 1.1652518392756084, "grad_norm": 0.4357879080967964, "learning_rate": 3.9467430720233555e-05, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.11564698815345764, "step": 1030, "valid_targets_mean": 6009.0, "valid_targets_min": 3049 }, { "epoch": 1.1709111488398416, "grad_norm": 0.4468978613451375, "learning_rate": 3.945442176080604e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.10168086737394333, "step": 1035, "valid_targets_mean": 5973.1, "valid_targets_min": 4822 }, { "epoch": 1.1765704584040746, "grad_norm": 0.4644751057173812, "learning_rate": 3.944125802547168e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.104912169277668, "step": 1040, "valid_targets_mean": 5754.9, "valid_targets_min": 2910 }, { "epoch": 1.1822297679683078, "grad_norm": 0.4750656628065809, "learning_rate": 3.942793961895881e-05, "loss": 0.2282, "loss_nan_ranks": 0, "loss_rank_avg": 0.12494048476219177, "step": 1045, "valid_targets_mean": 6414.6, "valid_targets_min": 4791 }, { "epoch": 1.187889077532541, "grad_norm": 0.46661891824647705, "learning_rate": 3.941446664722629e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.11205330491065979, "step": 1050, "valid_targets_mean": 5675.9, "valid_targets_min": 3983 }, { "epoch": 1.1935483870967742, "grad_norm": 0.3693476342351284, "learning_rate": 3.940083921746268e-05, "loss": 0.2021, "loss_nan_ranks": 0, "loss_rank_avg": 0.08969860523939133, "step": 1055, "valid_targets_mean": 6975.5, "valid_targets_min": 4383 }, { "epoch": 1.1992076966610075, "grad_norm": 0.3893171784380533, "learning_rate": 3.938705743808538e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.1054840236902237, "step": 1060, "valid_targets_mean": 6417.1, "valid_targets_min": 3182 }, { "epoch": 1.2048670062252405, "grad_norm": 0.4534363275965842, "learning_rate": 3.9373121418739765e-05, "loss": 0.2265, "loss_nan_ranks": 0, "loss_rank_avg": 0.11998751014471054, "step": 1065, "valid_targets_mean": 6218.6, "valid_targets_min": 5077 }, { "epoch": 1.2105263157894737, "grad_norm": 0.49747070693615936, "learning_rate": 3.935903127029832e-05, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.11035722494125366, "step": 1070, "valid_targets_mean": 4774.9, "valid_targets_min": 3663 }, { "epoch": 1.216185625353707, "grad_norm": 0.4539470299738808, "learning_rate": 3.934478710485975e-05, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.11278726160526276, "step": 1075, "valid_targets_mean": 6316.8, "valid_targets_min": 4105 }, { "epoch": 1.22184493491794, "grad_norm": 0.4150450186888815, "learning_rate": 3.9330389035748086e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.09741287678480148, "step": 1080, "valid_targets_mean": 6528.9, "valid_targets_min": 4537 }, { "epoch": 1.227504244482173, "grad_norm": 0.4102218195249173, "learning_rate": 3.9315837177511816e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.09937061369419098, "step": 1085, "valid_targets_mean": 6416.8, "valid_targets_min": 2494 }, { "epoch": 1.2331635540464063, "grad_norm": 0.4554765624706927, "learning_rate": 3.93011316459229e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.1132006049156189, "step": 1090, "valid_targets_mean": 6070.9, "valid_targets_min": 4921 }, { "epoch": 1.2388228636106395, "grad_norm": 0.46305531026666913, "learning_rate": 3.928627255797593e-05, "loss": 0.2189, "loss_nan_ranks": 0, "loss_rank_avg": 0.11665916442871094, "step": 1095, "valid_targets_mean": 6701.4, "valid_targets_min": 5285 }, { "epoch": 1.2444821731748728, "grad_norm": 0.4177211742532018, "learning_rate": 3.927126003188717e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.10000447928905487, "step": 1100, "valid_targets_mean": 6273.9, "valid_targets_min": 4464 }, { "epoch": 1.2501414827391057, "grad_norm": 0.4227921157715367, "learning_rate": 3.925609418709358e-05, "loss": 0.2249, "loss_nan_ranks": 0, "loss_rank_avg": 0.09662619233131409, "step": 1105, "valid_targets_mean": 5554.8, "valid_targets_min": 4439 }, { "epoch": 1.255800792303339, "grad_norm": 0.39346061104081265, "learning_rate": 3.924077514425193e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.09001141786575317, "step": 1110, "valid_targets_mean": 6043.0, "valid_targets_min": 4686 }, { "epoch": 1.2614601018675722, "grad_norm": 0.4138966359666768, "learning_rate": 3.922530302523779e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.09198030829429626, "step": 1115, "valid_targets_mean": 5912.5, "valid_targets_min": 3381 }, { "epoch": 1.2671194114318054, "grad_norm": 0.379265006887859, "learning_rate": 3.920967795314456e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.09785998612642288, "step": 1120, "valid_targets_mean": 6495.5, "valid_targets_min": 5309 }, { "epoch": 1.2727787209960386, "grad_norm": 0.41391321836622774, "learning_rate": 3.919390005228254e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.10846744477748871, "step": 1125, "valid_targets_mean": 6483.9, "valid_targets_min": 5161 }, { "epoch": 1.2784380305602716, "grad_norm": 0.49875136898167355, "learning_rate": 3.9177969448177884e-05, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.10463844239711761, "step": 1130, "valid_targets_mean": 5958.9, "valid_targets_min": 4666 }, { "epoch": 1.2840973401245048, "grad_norm": 0.6505825282340078, "learning_rate": 3.916188626757164e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.125363290309906, "step": 1135, "valid_targets_mean": 1691.5, "valid_targets_min": 1440 }, { "epoch": 1.289756649688738, "grad_norm": 0.4550942995720742, "learning_rate": 3.9145650638418724e-05, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.09323972463607788, "step": 1140, "valid_targets_mean": 5299.1, "valid_targets_min": 4547 }, { "epoch": 1.295415959252971, "grad_norm": 0.48730645845105025, "learning_rate": 3.91292626898869e-05, "loss": 0.2021, "loss_nan_ranks": 0, "loss_rank_avg": 0.10699446499347687, "step": 1145, "valid_targets_mean": 6003.5, "valid_targets_min": 5031 }, { "epoch": 1.3010752688172043, "grad_norm": 0.36627880501682747, "learning_rate": 3.911272255235576e-05, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.09872409701347351, "step": 1150, "valid_targets_mean": 8169.6, "valid_targets_min": 5487 }, { "epoch": 1.3067345783814375, "grad_norm": 0.39046063875124754, "learning_rate": 3.909603035741568e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.10074116289615631, "step": 1155, "valid_targets_mean": 6474.9, "valid_targets_min": 4253 }, { "epoch": 1.3123938879456707, "grad_norm": 0.4056457954329597, "learning_rate": 3.90791862378668e-05, "loss": 0.2265, "loss_nan_ranks": 0, "loss_rank_avg": 0.1214001476764679, "step": 1160, "valid_targets_mean": 7021.0, "valid_targets_min": 4990 }, { "epoch": 1.318053197509904, "grad_norm": 0.4295987244796204, "learning_rate": 3.906219032771791e-05, "loss": 0.2086, "loss_nan_ranks": 0, "loss_rank_avg": 0.1252824068069458, "step": 1165, "valid_targets_mean": 6356.0, "valid_targets_min": 4385 }, { "epoch": 1.323712507074137, "grad_norm": 0.38071643326705473, "learning_rate": 3.904504276218545e-05, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.11139969527721405, "step": 1170, "valid_targets_mean": 6815.1, "valid_targets_min": 5164 }, { "epoch": 1.3293718166383701, "grad_norm": 0.4511869701543047, "learning_rate": 3.902774367769238e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.07966958731412888, "step": 1175, "valid_targets_mean": 5588.5, "valid_targets_min": 4098 }, { "epoch": 1.3350311262026033, "grad_norm": 0.40443974143086536, "learning_rate": 3.901029321186715e-05, "loss": 0.1942, "loss_nan_ranks": 0, "loss_rank_avg": 0.10711172968149185, "step": 1180, "valid_targets_mean": 6167.6, "valid_targets_min": 4801 }, { "epoch": 1.3406904357668363, "grad_norm": 0.5025063120071397, "learning_rate": 3.8992691503542526e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.22311510145664215, "step": 1185, "valid_targets_mean": 6224.9, "valid_targets_min": 4772 }, { "epoch": 1.3463497453310695, "grad_norm": 0.43096078673252874, "learning_rate": 3.8974938692754565e-05, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.11844121664762497, "step": 1190, "valid_targets_mean": 6549.2, "valid_targets_min": 5025 }, { "epoch": 1.3520090548953028, "grad_norm": 0.4411764049541238, "learning_rate": 3.895703492074147e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.1157045066356659, "step": 1195, "valid_targets_mean": 6680.8, "valid_targets_min": 4818 }, { "epoch": 1.357668364459536, "grad_norm": 0.4327381745312927, "learning_rate": 3.893898032994244e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.10466340184211731, "step": 1200, "valid_targets_mean": 5835.1, "valid_targets_min": 4111 }, { "epoch": 1.3633276740237692, "grad_norm": 0.41626129249832783, "learning_rate": 3.892077506399659e-05, "loss": 0.2134, "loss_nan_ranks": 0, "loss_rank_avg": 0.10042882710695267, "step": 1205, "valid_targets_mean": 7029.9, "valid_targets_min": 2275 }, { "epoch": 1.3689869835880022, "grad_norm": 0.3941078540715684, "learning_rate": 3.890241926774176e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.08970265835523605, "step": 1210, "valid_targets_mean": 5621.2, "valid_targets_min": 4826 }, { "epoch": 1.3746462931522354, "grad_norm": 0.4328651679860648, "learning_rate": 3.888391308721339e-05, "loss": 0.1998, "loss_nan_ranks": 0, "loss_rank_avg": 0.09326186776161194, "step": 1215, "valid_targets_mean": 6858.8, "valid_targets_min": 4710 }, { "epoch": 1.3803056027164686, "grad_norm": 0.3858063007563162, "learning_rate": 3.8865256669643345e-05, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.13152405619621277, "step": 1220, "valid_targets_mean": 7012.5, "valid_targets_min": 5421 }, { "epoch": 1.3859649122807016, "grad_norm": 0.3744177832844025, "learning_rate": 3.884645016345876e-05, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.09377632290124893, "step": 1225, "valid_targets_mean": 6967.6, "valid_targets_min": 4949 }, { "epoch": 1.3916242218449348, "grad_norm": 0.3859158266030199, "learning_rate": 3.882749371828084e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.10139726847410202, "step": 1230, "valid_targets_mean": 6348.5, "valid_targets_min": 4831 }, { "epoch": 1.397283531409168, "grad_norm": 0.40628323849120285, "learning_rate": 3.880838748492367e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.12447110563516617, "step": 1235, "valid_targets_mean": 6597.2, "valid_targets_min": 4018 }, { "epoch": 1.4029428409734013, "grad_norm": 0.3728400695414987, "learning_rate": 3.878913161539304e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.07373258471488953, "step": 1240, "valid_targets_mean": 6420.9, "valid_targets_min": 5034 }, { "epoch": 1.4086021505376345, "grad_norm": 0.41679011568104735, "learning_rate": 3.876972626288521e-05, "loss": 0.1989, "loss_nan_ranks": 0, "loss_rank_avg": 0.11582024395465851, "step": 1245, "valid_targets_mean": 6962.4, "valid_targets_min": 5442 }, { "epoch": 1.4142614601018675, "grad_norm": 0.44005462344702845, "learning_rate": 3.87501715817857e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.1077890619635582, "step": 1250, "valid_targets_mean": 5610.9, "valid_targets_min": 4609 }, { "epoch": 1.4199207696661007, "grad_norm": 0.46782563125127635, "learning_rate": 3.873046772766806e-05, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.10515996068716049, "step": 1255, "valid_targets_mean": 5038.4, "valid_targets_min": 2301 }, { "epoch": 1.425580079230334, "grad_norm": 0.6393525154542397, "learning_rate": 3.871061485729264e-05, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.11196956783533096, "step": 1260, "valid_targets_mean": 1449.8, "valid_targets_min": 363 }, { "epoch": 1.4312393887945671, "grad_norm": 0.3961715756785153, "learning_rate": 3.8690613128605325e-05, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.07758249342441559, "step": 1265, "valid_targets_mean": 3729.8, "valid_targets_min": 3074 }, { "epoch": 1.4368986983588004, "grad_norm": 0.514411411172113, "learning_rate": 3.867046270073631e-05, "loss": 0.1211, "loss_nan_ranks": 0, "loss_rank_avg": 0.06430846452713013, "step": 1270, "valid_targets_mean": 2272.8, "valid_targets_min": 700 }, { "epoch": 1.4425580079230333, "grad_norm": 0.4844248582697401, "learning_rate": 3.8650163733998796e-05, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.057508524507284164, "step": 1275, "valid_targets_mean": 2997.5, "valid_targets_min": 803 }, { "epoch": 1.4482173174872666, "grad_norm": 0.4495056164678961, "learning_rate": 3.862971638988774e-05, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.06564734131097794, "step": 1280, "valid_targets_mean": 2655.5, "valid_targets_min": 920 }, { "epoch": 1.4538766270514998, "grad_norm": 0.4256726932838878, "learning_rate": 3.860912083107856e-05, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.06890624016523361, "step": 1285, "valid_targets_mean": 3263.8, "valid_targets_min": 806 }, { "epoch": 1.4595359366157328, "grad_norm": 0.7987833397224602, "learning_rate": 3.8588377221425846e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.10396931320428848, "step": 1290, "valid_targets_mean": 1644.4, "valid_targets_min": 718 }, { "epoch": 1.465195246179966, "grad_norm": 0.41071930776105053, "learning_rate": 3.8567485725962054e-05, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.0699780210852623, "step": 1295, "valid_targets_mean": 3399.4, "valid_targets_min": 1133 }, { "epoch": 1.4708545557441992, "grad_norm": 0.4669417191292071, "learning_rate": 3.8546446510896196e-05, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.052286192774772644, "step": 1300, "valid_targets_mean": 1808.9, "valid_targets_min": 859 }, { "epoch": 1.4765138653084324, "grad_norm": 0.279190024858727, "learning_rate": 3.8525259743612504e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.04190339148044586, "step": 1305, "valid_targets_mean": 5541.4, "valid_targets_min": 5150 }, { "epoch": 1.4821731748726656, "grad_norm": 0.3783760567491969, "learning_rate": 3.850392559266912e-05, "loss": 0.1072, "loss_nan_ranks": 0, "loss_rank_avg": 0.07370060682296753, "step": 1310, "valid_targets_mean": 4000.1, "valid_targets_min": 502 }, { "epoch": 1.4878324844368986, "grad_norm": 0.37009657456448125, "learning_rate": 3.848244422779675e-05, "loss": 0.114, "loss_nan_ranks": 0, "loss_rank_avg": 0.06480339169502258, "step": 1315, "valid_targets_mean": 3906.9, "valid_targets_min": 600 }, { "epoch": 1.4934917940011319, "grad_norm": 0.4432314283510275, "learning_rate": 3.8460815819897275e-05, "loss": 0.1126, "loss_nan_ranks": 0, "loss_rank_avg": 0.05141071975231171, "step": 1320, "valid_targets_mean": 2979.5, "valid_targets_min": 518 }, { "epoch": 1.499151103565365, "grad_norm": 0.4118835024522952, "learning_rate": 3.8439040541042477e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.06730692833662033, "step": 1325, "valid_targets_mean": 3522.5, "valid_targets_min": 549 }, { "epoch": 1.504810413129598, "grad_norm": 0.3453526365894916, "learning_rate": 3.8417118564472566e-05, "loss": 0.1057, "loss_nan_ranks": 0, "loss_rank_avg": 0.04490172117948532, "step": 1330, "valid_targets_mean": 3878.5, "valid_targets_min": 3170 }, { "epoch": 1.5104697226938315, "grad_norm": 0.5973143983949719, "learning_rate": 3.8395050064594886e-05, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.07379209250211716, "step": 1335, "valid_targets_mean": 1656.0, "valid_targets_min": 644 }, { "epoch": 1.5161290322580645, "grad_norm": 0.3322282229333689, "learning_rate": 3.8372835216982474e-05, "loss": 0.0988, "loss_nan_ranks": 0, "loss_rank_avg": 0.030613193288445473, "step": 1340, "valid_targets_mean": 2891.8, "valid_targets_min": 720 }, { "epoch": 1.5217883418222977, "grad_norm": 0.4763357740709184, "learning_rate": 3.83504741983727e-05, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.05212488770484924, "step": 1345, "valid_targets_mean": 1775.6, "valid_targets_min": 516 }, { "epoch": 1.527447651386531, "grad_norm": 0.5616103799879494, "learning_rate": 3.832796718666583e-05, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.0769435241818428, "step": 1350, "valid_targets_mean": 2018.6, "valid_targets_min": 557 }, { "epoch": 1.533106960950764, "grad_norm": 0.43822923169816463, "learning_rate": 3.830531436092363e-05, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.07701824605464935, "step": 1355, "valid_targets_mean": 3398.1, "valid_targets_min": 1086 }, { "epoch": 1.5387662705149971, "grad_norm": 0.4317930795508292, "learning_rate": 3.828251590136795e-05, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.07521131634712219, "step": 1360, "valid_targets_mean": 2532.9, "valid_targets_min": 1008 }, { "epoch": 1.5444255800792304, "grad_norm": 0.5245145698637755, "learning_rate": 3.8259571989379256e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.046158429235219955, "step": 1365, "valid_targets_mean": 3481.1, "valid_targets_min": 2756 }, { "epoch": 1.5500848896434634, "grad_norm": 0.3296178101522478, "learning_rate": 3.8236482807495214e-05, "loss": 0.1105, "loss_nan_ranks": 0, "loss_rank_avg": 0.04727683216333389, "step": 1370, "valid_targets_mean": 4113.5, "valid_targets_min": 3798 }, { "epoch": 1.5557441992076968, "grad_norm": 0.8548617148468368, "learning_rate": 3.8213248539409236e-05, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.11022968590259552, "step": 1375, "valid_targets_mean": 1058.6, "valid_targets_min": 598 }, { "epoch": 1.5614035087719298, "grad_norm": 0.41271716216436005, "learning_rate": 3.8189869369969016e-05, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.04818184673786163, "step": 1380, "valid_targets_mean": 2403.5, "valid_targets_min": 754 }, { "epoch": 1.567062818336163, "grad_norm": 0.34511489195605416, "learning_rate": 3.816634548517505e-05, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.06006976217031479, "step": 1385, "valid_targets_mean": 4045.8, "valid_targets_min": 3390 }, { "epoch": 1.5727221279003962, "grad_norm": 0.6490300241903905, "learning_rate": 3.814267707217917e-05, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.16865617036819458, "step": 1390, "valid_targets_mean": 2255.9, "valid_targets_min": 1052 }, { "epoch": 1.5783814374646292, "grad_norm": 0.4099557009711887, "learning_rate": 3.8118864319283025e-05, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.07171247899532318, "step": 1395, "valid_targets_mean": 3214.0, "valid_targets_min": 2176 }, { "epoch": 1.5840407470288624, "grad_norm": 0.48507846475715394, "learning_rate": 3.809490741593665e-05, "loss": 0.1303, "loss_nan_ranks": 0, "loss_rank_avg": 0.057411808520555496, "step": 1400, "valid_targets_mean": 2396.0, "valid_targets_min": 1074 }, { "epoch": 1.5897000565930957, "grad_norm": 0.46213090035219073, "learning_rate": 3.807080655273689e-05, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.06575348228216171, "step": 1405, "valid_targets_mean": 3271.8, "valid_targets_min": 1212 }, { "epoch": 1.5953593661573287, "grad_norm": 0.4504573910708974, "learning_rate": 3.8046561921425895e-05, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.07250872254371643, "step": 1410, "valid_targets_mean": 3990.8, "valid_targets_min": 2258 }, { "epoch": 1.601018675721562, "grad_norm": 0.31830121418698293, "learning_rate": 3.802217371488964e-05, "loss": 0.0989, "loss_nan_ranks": 0, "loss_rank_avg": 0.06969204545021057, "step": 1415, "valid_targets_mean": 3730.2, "valid_targets_min": 1466 }, { "epoch": 1.606677985285795, "grad_norm": 0.38404044511110647, "learning_rate": 3.799764212715633e-05, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.06129370257258415, "step": 1420, "valid_targets_mean": 3557.1, "valid_targets_min": 560 }, { "epoch": 1.6123372948500283, "grad_norm": 0.3782342128182197, "learning_rate": 3.7972967353394906e-05, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.06335802376270294, "step": 1425, "valid_targets_mean": 3222.9, "valid_targets_min": 1189 }, { "epoch": 1.6179966044142615, "grad_norm": 0.3631388391112149, "learning_rate": 3.794814958991346e-05, "loss": 0.1072, "loss_nan_ranks": 0, "loss_rank_avg": 0.048005443066358566, "step": 1430, "valid_targets_mean": 3665.2, "valid_targets_min": 2257 }, { "epoch": 1.6236559139784945, "grad_norm": 0.36678907072924855, "learning_rate": 3.792318903415769e-05, "loss": 0.1066, "loss_nan_ranks": 0, "loss_rank_avg": 0.04388028010725975, "step": 1435, "valid_targets_mean": 3314.4, "valid_targets_min": 886 }, { "epoch": 1.629315223542728, "grad_norm": 0.3876337194785037, "learning_rate": 3.789808588470932e-05, "loss": 0.113, "loss_nan_ranks": 0, "loss_rank_avg": 0.05543633550405502, "step": 1440, "valid_targets_mean": 3377.5, "valid_targets_min": 2409 }, { "epoch": 1.634974533106961, "grad_norm": 0.37020115100592305, "learning_rate": 3.787284034128453e-05, "loss": 0.1046, "loss_nan_ranks": 0, "loss_rank_avg": 0.04897238314151764, "step": 1445, "valid_targets_mean": 3241.8, "valid_targets_min": 820 }, { "epoch": 1.6406338426711942, "grad_norm": 0.9398974150849458, "learning_rate": 3.784745260473235e-05, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.13083994388580322, "step": 1450, "valid_targets_mean": 2264.2, "valid_targets_min": 813 }, { "epoch": 1.6462931522354274, "grad_norm": 0.3455411095404806, "learning_rate": 3.782192287703309e-05, "loss": 0.1016, "loss_nan_ranks": 0, "loss_rank_avg": 0.0457475408911705, "step": 1455, "valid_targets_mean": 3651.9, "valid_targets_min": 2877 }, { "epoch": 1.6519524617996604, "grad_norm": 0.5320280185554186, "learning_rate": 3.7796251361296695e-05, "loss": 0.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.06856375932693481, "step": 1460, "valid_targets_mean": 2384.0, "valid_targets_min": 667 }, { "epoch": 1.6576117713638936, "grad_norm": 0.33107100848601195, "learning_rate": 3.777043826176117e-05, "loss": 0.0984, "loss_nan_ranks": 0, "loss_rank_avg": 0.046754010021686554, "step": 1465, "valid_targets_mean": 3488.6, "valid_targets_min": 2353 }, { "epoch": 1.6632710809281268, "grad_norm": 0.3889838725270318, "learning_rate": 3.7744483783790924e-05, "loss": 0.1037, "loss_nan_ranks": 0, "loss_rank_avg": 0.0684385597705841, "step": 1470, "valid_targets_mean": 3189.9, "valid_targets_min": 549 }, { "epoch": 1.6689303904923598, "grad_norm": 0.3441656776900516, "learning_rate": 3.771838813387516e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.048582062125205994, "step": 1475, "valid_targets_mean": 3826.5, "valid_targets_min": 3340 }, { "epoch": 1.6745897000565932, "grad_norm": 0.4277143254856908, "learning_rate": 3.7692151519626196e-05, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.0704786479473114, "step": 1480, "valid_targets_mean": 2178.2, "valid_targets_min": 647 }, { "epoch": 1.6802490096208262, "grad_norm": 0.47124270373672383, "learning_rate": 3.766577414977786e-05, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.06369224935770035, "step": 1485, "valid_targets_mean": 1558.9, "valid_targets_min": 804 }, { "epoch": 1.6859083191850595, "grad_norm": 0.753103958134033, "learning_rate": 3.763925623418379e-05, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.12379364669322968, "step": 1490, "valid_targets_mean": 1855.1, "valid_targets_min": 702 }, { "epoch": 1.6915676287492927, "grad_norm": 0.48046832764275127, "learning_rate": 3.7612597983815797e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.08387649059295654, "step": 1495, "valid_targets_mean": 2858.1, "valid_targets_min": 945 }, { "epoch": 1.6972269383135257, "grad_norm": 0.49583149151554834, "learning_rate": 3.7585799610762166e-05, "loss": 0.1184, "loss_nan_ranks": 0, "loss_rank_avg": 0.07928980141878128, "step": 1500, "valid_targets_mean": 2879.5, "valid_targets_min": 703 }, { "epoch": 1.7028862478777589, "grad_norm": 0.42423476563437235, "learning_rate": 3.755886132822596e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.06221155822277069, "step": 1505, "valid_targets_mean": 3950.5, "valid_targets_min": 3051 }, { "epoch": 1.708545557441992, "grad_norm": 0.5882449890510761, "learning_rate": 3.753178335052335e-05, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.08767211437225342, "step": 1510, "valid_targets_mean": 1759.8, "valid_targets_min": 523 }, { "epoch": 1.714204867006225, "grad_norm": 0.3446555532092815, "learning_rate": 3.750456589308189e-05, "loss": 0.1097, "loss_nan_ranks": 0, "loss_rank_avg": 0.05195833742618561, "step": 1515, "valid_targets_mean": 2138.2, "valid_targets_min": 468 }, { "epoch": 1.7198641765704585, "grad_norm": 0.25061409519259453, "learning_rate": 3.7477209172438824e-05, "loss": 0.1152, "loss_nan_ranks": 0, "loss_rank_avg": 0.03194167837500572, "step": 1520, "valid_targets_mean": 4428.1, "valid_targets_min": 885 }, { "epoch": 1.7255234861346915, "grad_norm": 0.369656846375251, "learning_rate": 3.744971340623932e-05, "loss": 0.1044, "loss_nan_ranks": 0, "loss_rank_avg": 0.04173450544476509, "step": 1525, "valid_targets_mean": 2478.5, "valid_targets_min": 546 }, { "epoch": 1.7311827956989247, "grad_norm": 0.33231186695325116, "learning_rate": 3.74220788132348e-05, "loss": 0.1024, "loss_nan_ranks": 0, "loss_rank_avg": 0.05705367028713226, "step": 1530, "valid_targets_mean": 3910.5, "valid_targets_min": 981 }, { "epoch": 1.736842105263158, "grad_norm": 0.48276957868170417, "learning_rate": 3.739430561328116e-05, "loss": 0.1193, "loss_nan_ranks": 0, "loss_rank_avg": 0.06112513691186905, "step": 1535, "valid_targets_mean": 1519.9, "valid_targets_min": 697 }, { "epoch": 1.742501414827391, "grad_norm": 0.41746150621793054, "learning_rate": 3.736639402733699e-05, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.05486248433589935, "step": 1540, "valid_targets_mean": 3473.4, "valid_targets_min": 2777 }, { "epoch": 1.7481607243916242, "grad_norm": 0.42139772843391654, "learning_rate": 3.733834427746192e-05, "loss": 0.1234, "loss_nan_ranks": 0, "loss_rank_avg": 0.061300329864025116, "step": 1545, "valid_targets_mean": 3932.4, "valid_targets_min": 3061 }, { "epoch": 1.7538200339558574, "grad_norm": 0.340496756363664, "learning_rate": 3.7310156586814736e-05, "loss": 0.1077, "loss_nan_ranks": 0, "loss_rank_avg": 0.054317034780979156, "step": 1550, "valid_targets_mean": 2882.2, "valid_targets_min": 868 }, { "epoch": 1.7594793435200904, "grad_norm": 0.437913008532826, "learning_rate": 3.7281831179651674e-05, "loss": 0.1112, "loss_nan_ranks": 0, "loss_rank_avg": 0.04469527676701546, "step": 1555, "valid_targets_mean": 2506.6, "valid_targets_min": 752 }, { "epoch": 1.7651386530843238, "grad_norm": 0.4597022925107832, "learning_rate": 3.725336828132462e-05, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.055792104452848434, "step": 1560, "valid_targets_mean": 3418.9, "valid_targets_min": 1141 }, { "epoch": 1.7707979626485568, "grad_norm": 0.3140091225890798, "learning_rate": 3.722476811827931e-05, "loss": 0.0944, "loss_nan_ranks": 0, "loss_rank_avg": 0.052371345460414886, "step": 1565, "valid_targets_mean": 3901.2, "valid_targets_min": 3540 }, { "epoch": 1.77645727221279, "grad_norm": 0.3873586711176246, "learning_rate": 3.719603091805354e-05, "loss": 0.1227, "loss_nan_ranks": 0, "loss_rank_avg": 0.048507675528526306, "step": 1570, "valid_targets_mean": 2808.2, "valid_targets_min": 773 }, { "epoch": 1.7821165817770233, "grad_norm": 0.4072289949420176, "learning_rate": 3.716715690927534e-05, "loss": 0.1174, "loss_nan_ranks": 0, "loss_rank_avg": 0.03962133452296257, "step": 1575, "valid_targets_mean": 3550.5, "valid_targets_min": 2587 }, { "epoch": 1.7877758913412563, "grad_norm": 0.423490356907719, "learning_rate": 3.713814632166117e-05, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.05531451851129532, "step": 1580, "valid_targets_mean": 2700.6, "valid_targets_min": 773 }, { "epoch": 1.7934352009054897, "grad_norm": 0.4459507286833836, "learning_rate": 3.7108999386014094e-05, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.06484959274530411, "step": 1585, "valid_targets_mean": 3615.9, "valid_targets_min": 2962 }, { "epoch": 1.7990945104697227, "grad_norm": 0.5974029415055255, "learning_rate": 3.707971633422192e-05, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.06666037440299988, "step": 1590, "valid_targets_mean": 1766.6, "valid_targets_min": 649 }, { "epoch": 1.804753820033956, "grad_norm": 0.5371457964206325, "learning_rate": 3.705029739925539e-05, "loss": 0.1221, "loss_nan_ranks": 0, "loss_rank_avg": 0.06027115881443024, "step": 1595, "valid_targets_mean": 1668.4, "valid_targets_min": 708 }, { "epoch": 1.8104131295981891, "grad_norm": 0.4105963034912273, "learning_rate": 3.702074281516629e-05, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.051896438002586365, "step": 1600, "valid_targets_mean": 2129.5, "valid_targets_min": 617 }, { "epoch": 1.8160724391624221, "grad_norm": 0.4304740098082602, "learning_rate": 3.699105281708562e-05, "loss": 0.1141, "loss_nan_ranks": 0, "loss_rank_avg": 0.05431009829044342, "step": 1605, "valid_targets_mean": 2495.0, "valid_targets_min": 720 }, { "epoch": 1.8217317487266553, "grad_norm": 0.5735926965861751, "learning_rate": 3.69612276412217e-05, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.06785906851291656, "step": 1610, "valid_targets_mean": 1537.8, "valid_targets_min": 628 }, { "epoch": 1.8273910582908885, "grad_norm": 0.5898530064935896, "learning_rate": 3.693126752485833e-05, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.10182633996009827, "step": 1615, "valid_targets_mean": 2155.2, "valid_targets_min": 821 }, { "epoch": 1.8330503678551215, "grad_norm": 0.30947250284869365, "learning_rate": 3.6901172706352804e-05, "loss": 0.1045, "loss_nan_ranks": 0, "loss_rank_avg": 0.03451775759458542, "step": 1620, "valid_targets_mean": 3628.1, "valid_targets_min": 2863 }, { "epoch": 1.838709677419355, "grad_norm": 0.3690235938558517, "learning_rate": 3.687094342513416e-05, "loss": 0.1025, "loss_nan_ranks": 0, "loss_rank_avg": 0.03967660665512085, "step": 1625, "valid_targets_mean": 3585.2, "valid_targets_min": 1773 }, { "epoch": 1.844368986983588, "grad_norm": 0.4516985285671224, "learning_rate": 3.6840579921701155e-05, "loss": 0.1156, "loss_nan_ranks": 0, "loss_rank_avg": 0.06410881876945496, "step": 1630, "valid_targets_mean": 2356.6, "valid_targets_min": 721 }, { "epoch": 1.8500282965478212, "grad_norm": 0.359767615703714, "learning_rate": 3.68100824376204e-05, "loss": 0.0951, "loss_nan_ranks": 0, "loss_rank_avg": 0.06105772778391838, "step": 1635, "valid_targets_mean": 5092.5, "valid_targets_min": 4222 }, { "epoch": 1.8556876061120544, "grad_norm": 0.34713169199052546, "learning_rate": 3.6779451215524425e-05, "loss": 0.0952, "loss_nan_ranks": 0, "loss_rank_avg": 0.05121070519089699, "step": 1640, "valid_targets_mean": 4604.0, "valid_targets_min": 2020 }, { "epoch": 1.8613469156762874, "grad_norm": 0.3719471726084662, "learning_rate": 3.6748686499109784e-05, "loss": 0.1164, "loss_nan_ranks": 0, "loss_rank_avg": 0.04059560224413872, "step": 1645, "valid_targets_mean": 3097.9, "valid_targets_min": 739 }, { "epoch": 1.8670062252405206, "grad_norm": 0.4061457385537339, "learning_rate": 3.6717788533135056e-05, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.058897800743579865, "step": 1650, "valid_targets_mean": 3696.1, "valid_targets_min": 2945 }, { "epoch": 1.8726655348047538, "grad_norm": 0.3617521099651027, "learning_rate": 3.6686757563418945e-05, "loss": 0.1112, "loss_nan_ranks": 0, "loss_rank_avg": 0.061327625066041946, "step": 1655, "valid_targets_mean": 3112.8, "valid_targets_min": 704 }, { "epoch": 1.8783248443689868, "grad_norm": 0.3604517782802872, "learning_rate": 3.665559383683832e-05, "loss": 0.1148, "loss_nan_ranks": 0, "loss_rank_avg": 0.05376065522432327, "step": 1660, "valid_targets_mean": 2490.9, "valid_targets_min": 774 }, { "epoch": 1.8839841539332203, "grad_norm": 0.33553954553952914, "learning_rate": 3.6624297601326205e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.043106965720653534, "step": 1665, "valid_targets_mean": 2570.2, "valid_targets_min": 485 }, { "epoch": 1.8896434634974533, "grad_norm": 0.3897113819731708, "learning_rate": 3.659286910586988e-05, "loss": 0.1074, "loss_nan_ranks": 0, "loss_rank_avg": 0.04850570484995842, "step": 1670, "valid_targets_mean": 3087.4, "valid_targets_min": 1048 }, { "epoch": 1.8953027730616865, "grad_norm": 0.37895239456846863, "learning_rate": 3.656130860050883e-05, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.052234359085559845, "step": 1675, "valid_targets_mean": 2753.6, "valid_targets_min": 722 }, { "epoch": 1.9009620826259197, "grad_norm": 0.5106105258979503, "learning_rate": 3.652961633633282e-05, "loss": 0.1193, "loss_nan_ranks": 0, "loss_rank_avg": 0.06938277184963226, "step": 1680, "valid_targets_mean": 1836.2, "valid_targets_min": 865 }, { "epoch": 1.9066213921901527, "grad_norm": 0.521228149558116, "learning_rate": 3.649779256547984e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.060481246560811996, "step": 1685, "valid_targets_mean": 2377.5, "valid_targets_min": 675 }, { "epoch": 1.912280701754386, "grad_norm": 0.39880685753741063, "learning_rate": 3.6465837541134114e-05, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.0540006123483181, "step": 1690, "valid_targets_mean": 3323.0, "valid_targets_min": 782 }, { "epoch": 1.9179400113186191, "grad_norm": 0.42108885956864084, "learning_rate": 3.643375151752414e-05, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.05214047059416771, "step": 1695, "valid_targets_mean": 2581.8, "valid_targets_min": 795 }, { "epoch": 1.9235993208828521, "grad_norm": 0.4156569687453574, "learning_rate": 3.6401534749920566e-05, "loss": 0.1122, "loss_nan_ranks": 0, "loss_rank_avg": 0.0582006499171257, "step": 1700, "valid_targets_mean": 3264.6, "valid_targets_min": 2017 }, { "epoch": 1.9292586304470856, "grad_norm": 0.3723182247552374, "learning_rate": 3.636918749463426e-05, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.04763641208410263, "step": 1705, "valid_targets_mean": 2319.6, "valid_targets_min": 798 }, { "epoch": 1.9349179400113186, "grad_norm": 0.3569396345560108, "learning_rate": 3.633671000901422e-05, "loss": 0.0985, "loss_nan_ranks": 0, "loss_rank_avg": 0.05561841279268265, "step": 1710, "valid_targets_mean": 3299.6, "valid_targets_min": 860 }, { "epoch": 1.9405772495755518, "grad_norm": 0.4168083888615434, "learning_rate": 3.63041025514455e-05, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.0583263598382473, "step": 1715, "valid_targets_mean": 3302.4, "valid_targets_min": 878 }, { "epoch": 1.946236559139785, "grad_norm": 0.3357389283054348, "learning_rate": 3.627136538134723e-05, "loss": 0.0957, "loss_nan_ranks": 0, "loss_rank_avg": 0.039092086255550385, "step": 1720, "valid_targets_mean": 3832.2, "valid_targets_min": 2602 }, { "epoch": 1.951895868704018, "grad_norm": 0.4848350300498934, "learning_rate": 3.623849875917049e-05, "loss": 0.1133, "loss_nan_ranks": 0, "loss_rank_avg": 0.06840664148330688, "step": 1725, "valid_targets_mean": 2736.5, "valid_targets_min": 945 }, { "epoch": 1.9575551782682514, "grad_norm": 0.4192988003009786, "learning_rate": 3.620550294639625e-05, "loss": 0.1105, "loss_nan_ranks": 0, "loss_rank_avg": 0.06918597221374512, "step": 1730, "valid_targets_mean": 3831.1, "valid_targets_min": 3128 }, { "epoch": 1.9632144878324844, "grad_norm": 0.346024934816044, "learning_rate": 3.6172378205533316e-05, "loss": 0.1109, "loss_nan_ranks": 0, "loss_rank_avg": 0.05582546442747116, "step": 1735, "valid_targets_mean": 3966.2, "valid_targets_min": 2529 }, { "epoch": 1.9688737973967176, "grad_norm": 0.3488468452500612, "learning_rate": 3.613912480011621e-05, "loss": 0.0953, "loss_nan_ranks": 0, "loss_rank_avg": 0.06639085710048676, "step": 1740, "valid_targets_mean": 4704.8, "valid_targets_min": 892 }, { "epoch": 1.9745331069609509, "grad_norm": 0.27640089567785464, "learning_rate": 3.610574299470308e-05, "loss": 0.1067, "loss_nan_ranks": 0, "loss_rank_avg": 0.03565194457769394, "step": 1745, "valid_targets_mean": 4471.1, "valid_targets_min": 1657 }, { "epoch": 1.9801924165251839, "grad_norm": 0.557304325917542, "learning_rate": 3.6072233054873634e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.14241379499435425, "step": 1750, "valid_targets_mean": 1989.8, "valid_targets_min": 709 }, { "epoch": 1.985851726089417, "grad_norm": 0.3099094861639918, "learning_rate": 3.6038595247226946e-05, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.04021911323070526, "step": 1755, "valid_targets_mean": 3226.5, "valid_targets_min": 527 }, { "epoch": 1.9915110356536503, "grad_norm": 0.3484031043449807, "learning_rate": 3.600482983937943e-05, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.06430061161518097, "step": 1760, "valid_targets_mean": 3531.0, "valid_targets_min": 2318 }, { "epoch": 1.9971703452178833, "grad_norm": 0.3315201233960109, "learning_rate": 3.597093709996263e-05, "loss": 0.1027, "loss_nan_ranks": 0, "loss_rank_avg": 0.05331774055957794, "step": 1765, "valid_targets_mean": 3520.9, "valid_targets_min": 2883 }, { "epoch": 2.0022637238256933, "grad_norm": 0.4650942658007115, "learning_rate": 3.593691729862114e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.10227910429239273, "step": 1770, "valid_targets_mean": 5904.0, "valid_targets_min": 4967 }, { "epoch": 2.0079230333899263, "grad_norm": 0.3688430969903834, "learning_rate": 3.5902770706010414e-05, "loss": 0.201, "loss_nan_ranks": 0, "loss_rank_avg": 0.11695493757724762, "step": 1775, "valid_targets_mean": 8641.4, "valid_targets_min": 5164 }, { "epoch": 2.0135823429541597, "grad_norm": 0.36292308857695155, "learning_rate": 3.586849759379466e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.09385283291339874, "step": 1780, "valid_targets_mean": 6838.2, "valid_targets_min": 5200 }, { "epoch": 2.0192416525183927, "grad_norm": 0.3826950676721889, "learning_rate": 3.583409823464464e-05, "loss": 0.1912, "loss_nan_ranks": 0, "loss_rank_avg": 0.07843857258558273, "step": 1785, "valid_targets_mean": 5411.6, "valid_targets_min": 3853 }, { "epoch": 2.0249009620826257, "grad_norm": 0.39590639769636465, "learning_rate": 3.5799572902235506e-05, "loss": 0.1969, "loss_nan_ranks": 0, "loss_rank_avg": 0.10466514527797699, "step": 1790, "valid_targets_mean": 5598.0, "valid_targets_min": 4669 }, { "epoch": 2.030560271646859, "grad_norm": 0.42021932727305517, "learning_rate": 3.576492187124465e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.10257241129875183, "step": 1795, "valid_targets_mean": 5953.0, "valid_targets_min": 4216 }, { "epoch": 2.036219581211092, "grad_norm": 0.3824309948575738, "learning_rate": 3.5730145417349486e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.10280093550682068, "step": 1800, "valid_targets_mean": 5914.0, "valid_targets_min": 4589 }, { "epoch": 2.0418788907753256, "grad_norm": 0.3774424672724206, "learning_rate": 3.569524381722527e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.09702812880277634, "step": 1805, "valid_targets_mean": 6515.4, "valid_targets_min": 4588 }, { "epoch": 2.0475382003395586, "grad_norm": 0.3463163873793305, "learning_rate": 3.5660217348542905e-05, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.09045751392841339, "step": 1810, "valid_targets_mean": 7015.2, "valid_targets_min": 4530 }, { "epoch": 2.0531975099037916, "grad_norm": 0.38005898031225666, "learning_rate": 3.562506628996672e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.10554981231689453, "step": 1815, "valid_targets_mean": 6202.6, "valid_targets_min": 4837 }, { "epoch": 2.058856819468025, "grad_norm": 0.49281621300824496, "learning_rate": 3.558979092115227e-05, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.062259264290332794, "step": 1820, "valid_targets_mean": 1720.9, "valid_targets_min": 229 }, { "epoch": 2.064516129032258, "grad_norm": 0.38979368137302145, "learning_rate": 3.555439152274408e-05, "loss": 0.1908, "loss_nan_ranks": 0, "loss_rank_avg": 0.09573017060756683, "step": 1825, "valid_targets_mean": 5963.8, "valid_targets_min": 4216 }, { "epoch": 2.0701754385964914, "grad_norm": 0.37983119309515756, "learning_rate": 3.551886837637346e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.09074237197637558, "step": 1830, "valid_targets_mean": 5973.9, "valid_targets_min": 4835 }, { "epoch": 2.0758347481607244, "grad_norm": 0.3558752312487743, "learning_rate": 3.548322176465622e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.0832388773560524, "step": 1835, "valid_targets_mean": 6669.8, "valid_targets_min": 4995 }, { "epoch": 2.0814940577249574, "grad_norm": 0.44946142448140997, "learning_rate": 3.544745197119042e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.12601280212402344, "step": 1840, "valid_targets_mean": 5705.5, "valid_targets_min": 4108 }, { "epoch": 2.087153367289191, "grad_norm": 0.4096707797369472, "learning_rate": 3.541155928055418e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.1199854165315628, "step": 1845, "valid_targets_mean": 6594.0, "valid_targets_min": 4527 }, { "epoch": 2.092812676853424, "grad_norm": 0.4480155154525078, "learning_rate": 3.537554397830331e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.10273626446723938, "step": 1850, "valid_targets_mean": 3100.9, "valid_targets_min": 2104 }, { "epoch": 2.098471986417657, "grad_norm": 0.376634058661012, "learning_rate": 3.533940635096915e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.08255627006292343, "step": 1855, "valid_targets_mean": 5817.8, "valid_targets_min": 4757 }, { "epoch": 2.1041312959818903, "grad_norm": 0.40073821404298404, "learning_rate": 3.530314668605621e-05, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.11327770352363586, "step": 1860, "valid_targets_mean": 6333.0, "valid_targets_min": 5056 }, { "epoch": 2.1097906055461233, "grad_norm": 0.3734001545981099, "learning_rate": 3.5266765272039895e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.08531501889228821, "step": 1865, "valid_targets_mean": 5956.0, "valid_targets_min": 2834 }, { "epoch": 2.1154499151103567, "grad_norm": 0.3967893930386219, "learning_rate": 3.523026239836426e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.12767675518989563, "step": 1870, "valid_targets_mean": 6984.6, "valid_targets_min": 5744 }, { "epoch": 2.1211092246745897, "grad_norm": 0.4034811625677781, "learning_rate": 3.5193638355439635e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.08648249506950378, "step": 1875, "valid_targets_mean": 7290.2, "valid_targets_min": 5640 }, { "epoch": 2.1267685342388227, "grad_norm": 0.4225969920586299, "learning_rate": 3.515689343464038e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.09000758826732635, "step": 1880, "valid_targets_mean": 7036.0, "valid_targets_min": 5210 }, { "epoch": 2.132427843803056, "grad_norm": 0.4180663507921894, "learning_rate": 3.512002792830252e-05, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.1279435157775879, "step": 1885, "valid_targets_mean": 7138.5, "valid_targets_min": 5292 }, { "epoch": 2.138087153367289, "grad_norm": 0.4082154228625417, "learning_rate": 3.508304212972145e-05, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.10258790850639343, "step": 1890, "valid_targets_mean": 6134.2, "valid_targets_min": 3531 }, { "epoch": 2.143746462931522, "grad_norm": 0.4001627333855726, "learning_rate": 3.504593633314957e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.1019192785024643, "step": 1895, "valid_targets_mean": 5968.2, "valid_targets_min": 4640 }, { "epoch": 2.1494057724957556, "grad_norm": 0.3939812237785384, "learning_rate": 3.500871083379398e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.0974932610988617, "step": 1900, "valid_targets_mean": 6249.6, "valid_targets_min": 4328 }, { "epoch": 2.1550650820599886, "grad_norm": 0.425061630606132, "learning_rate": 3.497136592781411e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.10714038461446762, "step": 1905, "valid_targets_mean": 6002.4, "valid_targets_min": 3123 }, { "epoch": 2.160724391624222, "grad_norm": 0.3909594756495503, "learning_rate": 3.493390191231937e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.09464001655578613, "step": 1910, "valid_targets_mean": 6372.2, "valid_targets_min": 4256 }, { "epoch": 2.166383701188455, "grad_norm": 0.4753346300038162, "learning_rate": 3.4896319085366764e-05, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.10602079331874847, "step": 1915, "valid_targets_mean": 5927.8, "valid_targets_min": 4753 }, { "epoch": 2.172043010752688, "grad_norm": 0.40365757025068216, "learning_rate": 3.485861774595857e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.09577983617782593, "step": 1920, "valid_targets_mean": 6106.1, "valid_targets_min": 5370 }, { "epoch": 2.1777023203169215, "grad_norm": 0.4429082540303591, "learning_rate": 3.482079819403991e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.10737248510122299, "step": 1925, "valid_targets_mean": 6240.6, "valid_targets_min": 4608 }, { "epoch": 2.1833616298811545, "grad_norm": 0.4604460702396511, "learning_rate": 3.4782860730496385e-05, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.09162674099206924, "step": 1930, "valid_targets_mean": 5733.2, "valid_targets_min": 3801 }, { "epoch": 2.1890209394453874, "grad_norm": 0.38939580594223905, "learning_rate": 3.474480565715168e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.10398145765066147, "step": 1935, "valid_targets_mean": 6430.1, "valid_targets_min": 4754 }, { "epoch": 2.194680249009621, "grad_norm": 0.33698859572698064, "learning_rate": 3.470663327676517e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.0752083882689476, "step": 1940, "valid_targets_mean": 7375.2, "valid_targets_min": 6417 }, { "epoch": 2.200339558573854, "grad_norm": 0.4562817386757838, "learning_rate": 3.466834389302951e-05, "loss": 0.1843, "loss_nan_ranks": 0, "loss_rank_avg": 0.1071748435497284, "step": 1945, "valid_targets_mean": 6281.0, "valid_targets_min": 3468 }, { "epoch": 2.2059988681380873, "grad_norm": 0.4019776315767542, "learning_rate": 3.4629937810568185e-05, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.09497380256652832, "step": 1950, "valid_targets_mean": 6532.4, "valid_targets_min": 5221 }, { "epoch": 2.2116581777023203, "grad_norm": 0.49926857648549444, "learning_rate": 3.459141533493315e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.08050023019313812, "step": 1955, "valid_targets_mean": 5552.6, "valid_targets_min": 4438 }, { "epoch": 2.2173174872665533, "grad_norm": 0.4249799624141297, "learning_rate": 3.455277677260231e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.10170389711856842, "step": 1960, "valid_targets_mean": 5878.1, "valid_targets_min": 3915 }, { "epoch": 2.2229767968307867, "grad_norm": 0.3284937764800396, "learning_rate": 3.451402243097721e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.07613489031791687, "step": 1965, "valid_targets_mean": 7082.6, "valid_targets_min": 4135 }, { "epoch": 2.2286361063950197, "grad_norm": 0.4244872944881361, "learning_rate": 3.4475152618380456e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.0987371951341629, "step": 1970, "valid_targets_mean": 5936.4, "valid_targets_min": 3947 }, { "epoch": 2.234295415959253, "grad_norm": 0.40889945828872726, "learning_rate": 3.443616764405334e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.12065830081701279, "step": 1975, "valid_targets_mean": 6836.2, "valid_targets_min": 4865 }, { "epoch": 2.239954725523486, "grad_norm": 0.5840265740345978, "learning_rate": 3.4397067818153345e-05, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.09379205107688904, "step": 1980, "valid_targets_mean": 6539.4, "valid_targets_min": 4643 }, { "epoch": 2.245614035087719, "grad_norm": 0.37861827661541286, "learning_rate": 3.435785345175173e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.09451638907194138, "step": 1985, "valid_targets_mean": 6613.6, "valid_targets_min": 4959 }, { "epoch": 2.2512733446519526, "grad_norm": 0.39489041786405854, "learning_rate": 3.431852485683098e-05, "loss": 0.2048, "loss_nan_ranks": 0, "loss_rank_avg": 0.10732698440551758, "step": 1990, "valid_targets_mean": 6044.1, "valid_targets_min": 4652 }, { "epoch": 2.2569326542161856, "grad_norm": 0.38898383798039116, "learning_rate": 3.4279082346282396e-05, "loss": 0.1693, "loss_nan_ranks": 0, "loss_rank_avg": 0.0827295109629631, "step": 1995, "valid_targets_mean": 5893.9, "valid_targets_min": 4938 }, { "epoch": 2.2625919637804186, "grad_norm": 0.376704751319281, "learning_rate": 3.423952623390352e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.07669830322265625, "step": 2000, "valid_targets_mean": 5849.6, "valid_targets_min": 4546 }, { "epoch": 2.268251273344652, "grad_norm": 0.3910964440500796, "learning_rate": 3.419985683439574e-05, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.08727534115314484, "step": 2005, "valid_targets_mean": 5751.5, "valid_targets_min": 3200 }, { "epoch": 2.273910582908885, "grad_norm": 0.37774305187779456, "learning_rate": 3.416007446336172e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.09513689577579498, "step": 2010, "valid_targets_mean": 6149.6, "valid_targets_min": 5010 }, { "epoch": 2.279569892473118, "grad_norm": 0.7245046622730861, "learning_rate": 3.4120179437302885e-05, "loss": 0.1942, "loss_nan_ranks": 0, "loss_rank_avg": 0.10477955639362335, "step": 2015, "valid_targets_mean": 6551.2, "valid_targets_min": 4904 }, { "epoch": 2.2852292020373515, "grad_norm": 0.43974321457580223, "learning_rate": 3.408017207361696e-05, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.13391438126564026, "step": 2020, "valid_targets_mean": 5728.9, "valid_targets_min": 4812 }, { "epoch": 2.2908885116015845, "grad_norm": 0.4190046872972955, "learning_rate": 3.4040052690595376e-05, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.07912546396255493, "step": 2025, "valid_targets_mean": 5047.9, "valid_targets_min": 3629 }, { "epoch": 2.296547821165818, "grad_norm": 0.4117794454695208, "learning_rate": 3.399982160742079e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.09514860808849335, "step": 2030, "valid_targets_mean": 6260.0, "valid_targets_min": 4324 }, { "epoch": 2.302207130730051, "grad_norm": 0.3485537640844097, "learning_rate": 3.3959479144164515e-05, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.08208595216274261, "step": 2035, "valid_targets_mean": 7853.1, "valid_targets_min": 4920 }, { "epoch": 2.3078664402942843, "grad_norm": 0.40215304288985815, "learning_rate": 3.3919025621783996e-05, "loss": 0.1973, "loss_nan_ranks": 0, "loss_rank_avg": 0.08957590162754059, "step": 2040, "valid_targets_mean": 6231.0, "valid_targets_min": 4882 }, { "epoch": 2.3135257498585173, "grad_norm": 0.3994007707086233, "learning_rate": 3.387846136212022e-05, "loss": 0.2007, "loss_nan_ranks": 0, "loss_rank_avg": 0.08934713900089264, "step": 2045, "valid_targets_mean": 7472.9, "valid_targets_min": 3943 }, { "epoch": 2.3191850594227503, "grad_norm": 0.39411875696086646, "learning_rate": 3.3837786687895214e-05, "loss": 0.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.09899666160345078, "step": 2050, "valid_targets_mean": 6840.2, "valid_targets_min": 5034 }, { "epoch": 2.3248443689869838, "grad_norm": 0.41432286699353016, "learning_rate": 3.3797001922709416e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.09966832399368286, "step": 2055, "valid_targets_mean": 6458.5, "valid_targets_min": 4461 }, { "epoch": 2.3305036785512168, "grad_norm": 0.3696592168950713, "learning_rate": 3.375610739103913e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.0865120217204094, "step": 2060, "valid_targets_mean": 6645.4, "valid_targets_min": 5188 }, { "epoch": 2.3361629881154498, "grad_norm": 0.38218748203757885, "learning_rate": 3.371510341823396e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.09908951073884964, "step": 2065, "valid_targets_mean": 6002.9, "valid_targets_min": 5009 }, { "epoch": 2.341822297679683, "grad_norm": 0.4216291403746872, "learning_rate": 3.3673990330514197e-05, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.10168929398059845, "step": 2070, "valid_targets_mean": 6025.9, "valid_targets_min": 4551 }, { "epoch": 2.347481607243916, "grad_norm": 0.38801428996393683, "learning_rate": 3.363276845496822e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.09701313078403473, "step": 2075, "valid_targets_mean": 7210.0, "valid_targets_min": 4492 }, { "epoch": 2.353140916808149, "grad_norm": 0.38850555570599626, "learning_rate": 3.359143811954992e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.09031613916158676, "step": 2080, "valid_targets_mean": 7051.4, "valid_targets_min": 4718 }, { "epoch": 2.3588002263723826, "grad_norm": 0.38719154647188286, "learning_rate": 3.354999965307606e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.09918487071990967, "step": 2085, "valid_targets_mean": 6686.0, "valid_targets_min": 4827 }, { "epoch": 2.3644595359366156, "grad_norm": 0.36238981373390344, "learning_rate": 3.3508453385223684e-05, "loss": 0.1879, "loss_nan_ranks": 0, "loss_rank_avg": 0.0751459077000618, "step": 2090, "valid_targets_mean": 5311.9, "valid_targets_min": 3828 }, { "epoch": 2.370118845500849, "grad_norm": 0.39766759905835697, "learning_rate": 3.346679964652749e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.07942270487546921, "step": 2095, "valid_targets_mean": 7078.9, "valid_targets_min": 4594 }, { "epoch": 2.375778155065082, "grad_norm": 0.39459968327080425, "learning_rate": 3.342503876837718e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.07656831294298172, "step": 2100, "valid_targets_mean": 6393.8, "valid_targets_min": 4509 }, { "epoch": 2.381437464629315, "grad_norm": 0.3758001299296689, "learning_rate": 3.3383171083014856e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.10427580773830414, "step": 2105, "valid_targets_mean": 7848.9, "valid_targets_min": 5649 }, { "epoch": 2.3870967741935485, "grad_norm": 0.3903744879220785, "learning_rate": 3.3341196923532336e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.07996858656406403, "step": 2110, "valid_targets_mean": 6623.4, "valid_targets_min": 4343 }, { "epoch": 2.3927560837577815, "grad_norm": 0.3953141794689289, "learning_rate": 3.329911662386855e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.08288268744945526, "step": 2115, "valid_targets_mean": 6255.9, "valid_targets_min": 4660 }, { "epoch": 2.398415393322015, "grad_norm": 0.34363852176252085, "learning_rate": 3.3256930518806845e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.09071113914251328, "step": 2120, "valid_targets_mean": 8243.0, "valid_targets_min": 6281 }, { "epoch": 2.404074702886248, "grad_norm": 0.360214785751071, "learning_rate": 3.321463894397235e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.08923101425170898, "step": 2125, "valid_targets_mean": 7083.5, "valid_targets_min": 4657 }, { "epoch": 2.409734012450481, "grad_norm": 0.4200445006113312, "learning_rate": 3.317224223582927e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.10604465007781982, "step": 2130, "valid_targets_mean": 6399.8, "valid_targets_min": 5098 }, { "epoch": 2.4153933220147144, "grad_norm": 0.46264235033494944, "learning_rate": 3.312974073167825e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.10362359136343002, "step": 2135, "valid_targets_mean": 5257.4, "valid_targets_min": 1879 }, { "epoch": 2.4210526315789473, "grad_norm": 0.43111753430771954, "learning_rate": 3.30871347696537e-05, "loss": 0.192, "loss_nan_ranks": 0, "loss_rank_avg": 0.10390962660312653, "step": 2140, "valid_targets_mean": 5260.5, "valid_targets_min": 3619 }, { "epoch": 2.4267119411431803, "grad_norm": 0.41865096806641583, "learning_rate": 3.3044424688721016e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.06864843517541885, "step": 2145, "valid_targets_mean": 3976.1, "valid_targets_min": 3545 }, { "epoch": 2.432371250707414, "grad_norm": 0.3573869762021644, "learning_rate": 3.300161082867398e-05, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.04815223067998886, "step": 2150, "valid_targets_mean": 3099.4, "valid_targets_min": 1024 }, { "epoch": 2.4380305602716468, "grad_norm": 0.34190173531670653, "learning_rate": 3.295869353013204e-05, "loss": 0.0982, "loss_nan_ranks": 0, "loss_rank_avg": 0.02967439591884613, "step": 2155, "valid_targets_mean": 3441.1, "valid_targets_min": 2927 }, { "epoch": 2.44368986983588, "grad_norm": 0.43983243600032806, "learning_rate": 3.291567313453754e-05, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.07892259210348129, "step": 2160, "valid_targets_mean": 3442.0, "valid_targets_min": 2213 }, { "epoch": 2.449349179400113, "grad_norm": 0.46751571452574264, "learning_rate": 3.287254998415308e-05, "loss": 0.0987, "loss_nan_ranks": 0, "loss_rank_avg": 0.060992803424596786, "step": 2165, "valid_targets_mean": 2907.4, "valid_targets_min": 1134 }, { "epoch": 2.455008488964346, "grad_norm": 0.4395489284393833, "learning_rate": 3.282932442205875e-05, "loss": 0.1062, "loss_nan_ranks": 0, "loss_rank_avg": 0.06305012106895447, "step": 2170, "valid_targets_mean": 2523.4, "valid_targets_min": 663 }, { "epoch": 2.4606677985285796, "grad_norm": 0.6628613828680201, "learning_rate": 3.2785996792149397e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.07510661333799362, "step": 2175, "valid_targets_mean": 1893.8, "valid_targets_min": 535 }, { "epoch": 2.4663271080928126, "grad_norm": 0.4089669303969591, "learning_rate": 3.274256743913192e-05, "loss": 0.1036, "loss_nan_ranks": 0, "loss_rank_avg": 0.04284790903329849, "step": 2180, "valid_targets_mean": 1971.8, "valid_targets_min": 811 }, { "epoch": 2.471986417657046, "grad_norm": 0.4732750376584821, "learning_rate": 3.2699036708522486e-05, "loss": 0.1234, "loss_nan_ranks": 0, "loss_rank_avg": 0.07278202474117279, "step": 2185, "valid_targets_mean": 2785.5, "valid_targets_min": 2392 }, { "epoch": 2.477645727221279, "grad_norm": 0.2586276180787425, "learning_rate": 3.265540494664383e-05, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.032237522304058075, "step": 2190, "valid_targets_mean": 4540.6, "valid_targets_min": 3285 }, { "epoch": 2.483305036785512, "grad_norm": 0.373237775006757, "learning_rate": 3.261167250062246e-05, "loss": 0.097, "loss_nan_ranks": 0, "loss_rank_avg": 0.0476677343249321, "step": 2195, "valid_targets_mean": 2926.8, "valid_targets_min": 764 }, { "epoch": 2.4889643463497455, "grad_norm": 0.3674744465113664, "learning_rate": 3.25678397183859e-05, "loss": 0.1021, "loss_nan_ranks": 0, "loss_rank_avg": 0.056619517505168915, "step": 2200, "valid_targets_mean": 3378.6, "valid_targets_min": 1290 }, { "epoch": 2.4946236559139785, "grad_norm": 0.4594754544351409, "learning_rate": 3.252390694865995e-05, "loss": 0.0997, "loss_nan_ranks": 0, "loss_rank_avg": 0.057963818311691284, "step": 2205, "valid_targets_mean": 2432.4, "valid_targets_min": 720 }, { "epoch": 2.5002829654782115, "grad_norm": 0.3192949581204995, "learning_rate": 3.247987454096588e-05, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.04614349454641342, "step": 2210, "valid_targets_mean": 3896.0, "valid_targets_min": 2336 }, { "epoch": 2.505942275042445, "grad_norm": 0.33644471032634066, "learning_rate": 3.2435742845617664e-05, "loss": 0.0947, "loss_nan_ranks": 0, "loss_rank_avg": 0.04669766128063202, "step": 2215, "valid_targets_mean": 2912.5, "valid_targets_min": 1049 }, { "epoch": 2.511601584606678, "grad_norm": 0.34479623408810645, "learning_rate": 3.2391512213719195e-05, "loss": 0.1078, "loss_nan_ranks": 0, "loss_rank_avg": 0.0345931239426136, "step": 2220, "valid_targets_mean": 3087.8, "valid_targets_min": 1086 }, { "epoch": 2.517260894170911, "grad_norm": 0.36688535674523926, "learning_rate": 3.23471829971615e-05, "loss": 0.0884, "loss_nan_ranks": 0, "loss_rank_avg": 0.04897375777363777, "step": 2225, "valid_targets_mean": 3296.5, "valid_targets_min": 732 }, { "epoch": 2.5229202037351444, "grad_norm": 0.5957001879370355, "learning_rate": 3.230275554861988e-05, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.07079662382602692, "step": 2230, "valid_targets_mean": 1688.5, "valid_targets_min": 770 }, { "epoch": 2.5285795132993774, "grad_norm": 0.43461041178958076, "learning_rate": 3.2258230221551216e-05, "loss": 0.1105, "loss_nan_ranks": 0, "loss_rank_avg": 0.04917736351490021, "step": 2235, "valid_targets_mean": 2574.8, "valid_targets_min": 592 }, { "epoch": 2.534238822863611, "grad_norm": 0.42565232202035636, "learning_rate": 3.221360737019105e-05, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.055679723620414734, "step": 2240, "valid_targets_mean": 3089.1, "valid_targets_min": 2224 }, { "epoch": 2.539898132427844, "grad_norm": 0.4171403916689987, "learning_rate": 3.216888734955082e-05, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.042909517884254456, "step": 2245, "valid_targets_mean": 2364.5, "valid_targets_min": 511 }, { "epoch": 2.5455574419920772, "grad_norm": 0.4453123084365863, "learning_rate": 3.2124070515415026e-05, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.06102481111884117, "step": 2250, "valid_targets_mean": 3775.5, "valid_targets_min": 2328 }, { "epoch": 2.5512167515563102, "grad_norm": 0.3935444374091009, "learning_rate": 3.20791572243384e-05, "loss": 0.0943, "loss_nan_ranks": 0, "loss_rank_avg": 0.043448153883218765, "step": 2255, "valid_targets_mean": 2867.1, "valid_targets_min": 669 }, { "epoch": 2.556876061120543, "grad_norm": 0.6248731534527211, "learning_rate": 3.2034147833643085e-05, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.07770198583602905, "step": 2260, "valid_targets_mean": 1722.5, "valid_targets_min": 802 }, { "epoch": 2.5625353706847767, "grad_norm": 0.6695756417777585, "learning_rate": 3.1989042701415735e-05, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.07981681078672409, "step": 2265, "valid_targets_mean": 1527.9, "valid_targets_min": 357 }, { "epoch": 2.5681946802490097, "grad_norm": 0.37224281178132096, "learning_rate": 3.194384218650475e-05, "loss": 0.112, "loss_nan_ranks": 0, "loss_rank_avg": 0.05012982338666916, "step": 2270, "valid_targets_mean": 3831.6, "valid_targets_min": 2808 }, { "epoch": 2.5738539898132426, "grad_norm": 0.500568844305321, "learning_rate": 3.1898546648517344e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.13740640878677368, "step": 2275, "valid_targets_mean": 2953.2, "valid_targets_min": 652 }, { "epoch": 2.579513299377476, "grad_norm": 0.3736709958108341, "learning_rate": 3.185315644781674e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.05496054142713547, "step": 2280, "valid_targets_mean": 3963.6, "valid_targets_min": 3573 }, { "epoch": 2.585172608941709, "grad_norm": 0.5090649187854307, "learning_rate": 3.1807671945519275e-05, "loss": 0.1208, "loss_nan_ranks": 0, "loss_rank_avg": 0.06333998590707779, "step": 2285, "valid_targets_mean": 2137.1, "valid_targets_min": 822 }, { "epoch": 2.590831918505942, "grad_norm": 0.5165232888652537, "learning_rate": 3.1762093503491515e-05, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.16781306266784668, "step": 2290, "valid_targets_mean": 2582.1, "valid_targets_min": 965 }, { "epoch": 2.5964912280701755, "grad_norm": 0.3296689482507935, "learning_rate": 3.171642148434743e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.043995440006256104, "step": 2295, "valid_targets_mean": 4182.0, "valid_targets_min": 636 }, { "epoch": 2.6021505376344085, "grad_norm": 0.399676787291068, "learning_rate": 3.167065625144544e-05, "loss": 0.0972, "loss_nan_ranks": 0, "loss_rank_avg": 0.07242860645055771, "step": 2300, "valid_targets_mean": 4735.0, "valid_targets_min": 2733 }, { "epoch": 2.6078098471986415, "grad_norm": 0.3909386303098651, "learning_rate": 3.1624798168885566e-05, "loss": 0.1069, "loss_nan_ranks": 0, "loss_rank_avg": 0.0652426928281784, "step": 2305, "valid_targets_mean": 4307.1, "valid_targets_min": 2571 }, { "epoch": 2.613469156762875, "grad_norm": 0.30890902026855777, "learning_rate": 3.157884760150653e-05, "loss": 0.1045, "loss_nan_ranks": 0, "loss_rank_avg": 0.03641439974308014, "step": 2310, "valid_targets_mean": 3207.2, "valid_targets_min": 970 }, { "epoch": 2.619128466327108, "grad_norm": 0.41688683844062174, "learning_rate": 3.153280491488285e-05, "loss": 0.0973, "loss_nan_ranks": 0, "loss_rank_avg": 0.038325291126966476, "step": 2315, "valid_targets_mean": 2923.8, "valid_targets_min": 748 }, { "epoch": 2.6247877758913414, "grad_norm": 0.4141664805039355, "learning_rate": 3.148667047532191e-05, "loss": 0.099, "loss_nan_ranks": 0, "loss_rank_avg": 0.06093056499958038, "step": 2320, "valid_targets_mean": 3834.1, "valid_targets_min": 3568 }, { "epoch": 2.6304470854555744, "grad_norm": 0.5296100301519969, "learning_rate": 3.1440444649861084e-05, "loss": 0.1014, "loss_nan_ranks": 0, "loss_rank_avg": 0.05555908381938934, "step": 2325, "valid_targets_mean": 2406.8, "valid_targets_min": 1820 }, { "epoch": 2.636106395019808, "grad_norm": 0.4344050252582694, "learning_rate": 3.139412780626478e-05, "loss": 0.0865, "loss_nan_ranks": 0, "loss_rank_avg": 0.0589946024119854, "step": 2330, "valid_targets_mean": 2587.6, "valid_targets_min": 772 }, { "epoch": 2.641765704584041, "grad_norm": 0.4764837983611368, "learning_rate": 3.134772031302156e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.07396160066127777, "step": 2335, "valid_targets_mean": 3260.0, "valid_targets_min": 1289 }, { "epoch": 2.647425014148274, "grad_norm": 0.37816499084386906, "learning_rate": 3.130122253934113e-05, "loss": 0.08, "loss_nan_ranks": 0, "loss_rank_avg": 0.045197054743766785, "step": 2340, "valid_targets_mean": 3723.0, "valid_targets_min": 3122 }, { "epoch": 2.6530843237125072, "grad_norm": 0.3706727023566082, "learning_rate": 3.125463485515149e-05, "loss": 0.0921, "loss_nan_ranks": 0, "loss_rank_avg": 0.049566566944122314, "step": 2345, "valid_targets_mean": 3712.5, "valid_targets_min": 1451 }, { "epoch": 2.6587436332767402, "grad_norm": 0.3661474166395112, "learning_rate": 3.1207957631095944e-05, "loss": 0.0876, "loss_nan_ranks": 0, "loss_rank_avg": 0.04905054345726967, "step": 2350, "valid_targets_mean": 3632.8, "valid_targets_min": 792 }, { "epoch": 2.6644029428409732, "grad_norm": 0.47433911573934034, "learning_rate": 3.116119123853014e-05, "loss": 0.1083, "loss_nan_ranks": 0, "loss_rank_avg": 0.044324200600385666, "step": 2355, "valid_targets_mean": 1992.4, "valid_targets_min": 795 }, { "epoch": 2.6700622524052067, "grad_norm": 0.3405483587292372, "learning_rate": 3.1114336049519165e-05, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.048648297786712646, "step": 2360, "valid_targets_mean": 3431.4, "valid_targets_min": 1196 }, { "epoch": 2.6757215619694397, "grad_norm": 0.528089751667171, "learning_rate": 3.106739243683453e-05, "loss": 0.1259, "loss_nan_ranks": 0, "loss_rank_avg": 0.05340038612484932, "step": 2365, "valid_targets_mean": 1836.1, "valid_targets_min": 575 }, { "epoch": 2.6813808715336727, "grad_norm": 0.655807946929079, "learning_rate": 3.1020360773951225e-05, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.08533156663179398, "step": 2370, "valid_targets_mean": 1908.8, "valid_targets_min": 609 }, { "epoch": 2.687040181097906, "grad_norm": 0.479137600509888, "learning_rate": 3.097324143504479e-05, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.0396895632147789, "step": 2375, "valid_targets_mean": 1497.2, "valid_targets_min": 542 }, { "epoch": 2.692699490662139, "grad_norm": 0.35572554367136605, "learning_rate": 3.092603479498826e-05, "loss": 0.1389, "loss_nan_ranks": 0, "loss_rank_avg": 0.046362824738025665, "step": 2380, "valid_targets_mean": 3701.8, "valid_targets_min": 2440 }, { "epoch": 2.6983588002263725, "grad_norm": 0.4294308993861767, "learning_rate": 3.087874122934924e-05, "loss": 0.1059, "loss_nan_ranks": 0, "loss_rank_avg": 0.03990578651428223, "step": 2385, "valid_targets_mean": 1648.2, "valid_targets_min": 629 }, { "epoch": 2.7040181097906055, "grad_norm": 0.5487991767733832, "learning_rate": 3.0831361114386905e-05, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.05739689990878105, "step": 2390, "valid_targets_mean": 3953.0, "valid_targets_min": 3701 }, { "epoch": 2.709677419354839, "grad_norm": 0.42836710916085596, "learning_rate": 3.078389482704897e-05, "loss": 0.1096, "loss_nan_ranks": 0, "loss_rank_avg": 0.05183224380016327, "step": 2395, "valid_targets_mean": 1700.9, "valid_targets_min": 485 }, { "epoch": 2.715336728919072, "grad_norm": 0.47163155795442635, "learning_rate": 3.0736342744968764e-05, "loss": 0.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.0850541889667511, "step": 2400, "valid_targets_mean": 2381.9, "valid_targets_min": 605 }, { "epoch": 2.720996038483305, "grad_norm": 0.3348814947703484, "learning_rate": 3.068870524646215e-05, "loss": 0.0907, "loss_nan_ranks": 0, "loss_rank_avg": 0.03373149782419205, "step": 2405, "valid_targets_mean": 2713.5, "valid_targets_min": 848 }, { "epoch": 2.7266553480475384, "grad_norm": 0.31717139487830104, "learning_rate": 3.064098271052457e-05, "loss": 0.0912, "loss_nan_ranks": 0, "loss_rank_avg": 0.04711340367794037, "step": 2410, "valid_targets_mean": 5106.4, "valid_targets_min": 4456 }, { "epoch": 2.7323146576117714, "grad_norm": 0.37159333535295175, "learning_rate": 3.059317551682801e-05, "loss": 0.0948, "loss_nan_ranks": 0, "loss_rank_avg": 0.05447401478886604, "step": 2415, "valid_targets_mean": 3905.5, "valid_targets_min": 1864 }, { "epoch": 2.7379739671760044, "grad_norm": 0.36008589768281596, "learning_rate": 3.0545284045717956e-05, "loss": 0.1091, "loss_nan_ranks": 0, "loss_rank_avg": 0.04373928904533386, "step": 2420, "valid_targets_mean": 3313.8, "valid_targets_min": 1361 }, { "epoch": 2.743633276740238, "grad_norm": 0.41946488267172877, "learning_rate": 3.0497308678210413e-05, "loss": 0.1078, "loss_nan_ranks": 0, "loss_rank_avg": 0.05137067288160324, "step": 2425, "valid_targets_mean": 3500.1, "valid_targets_min": 1814 }, { "epoch": 2.749292586304471, "grad_norm": 0.4741519627348511, "learning_rate": 3.044924979598882e-05, "loss": 0.1162, "loss_nan_ranks": 0, "loss_rank_avg": 0.049934521317481995, "step": 2430, "valid_targets_mean": 1559.0, "valid_targets_min": 759 }, { "epoch": 2.754951895868704, "grad_norm": 0.3075634231736509, "learning_rate": 3.0401107781401092e-05, "loss": 0.0835, "loss_nan_ranks": 0, "loss_rank_avg": 0.039611075073480606, "step": 2435, "valid_targets_mean": 3942.6, "valid_targets_min": 2719 }, { "epoch": 2.7606112054329373, "grad_norm": 0.5009109914391133, "learning_rate": 3.0352883017456497e-05, "loss": 0.1061, "loss_nan_ranks": 0, "loss_rank_avg": 0.040671542286872864, "step": 2440, "valid_targets_mean": 1133.4, "valid_targets_min": 664 }, { "epoch": 2.7662705149971702, "grad_norm": 0.35783834790167424, "learning_rate": 3.0304575887822635e-05, "loss": 0.1039, "loss_nan_ranks": 0, "loss_rank_avg": 0.03562743961811066, "step": 2445, "valid_targets_mean": 2489.8, "valid_targets_min": 1584 }, { "epoch": 2.7719298245614032, "grad_norm": 0.36757407384846696, "learning_rate": 3.0256186776822415e-05, "loss": 0.0836, "loss_nan_ranks": 0, "loss_rank_avg": 0.0379403755068779, "step": 2450, "valid_targets_mean": 2685.4, "valid_targets_min": 1003 }, { "epoch": 2.7775891341256367, "grad_norm": 0.3558843724226644, "learning_rate": 3.0207716069430968e-05, "loss": 0.1064, "loss_nan_ranks": 0, "loss_rank_avg": 0.04235576093196869, "step": 2455, "valid_targets_mean": 3180.8, "valid_targets_min": 560 }, { "epoch": 2.7832484436898697, "grad_norm": 0.36637576971355346, "learning_rate": 3.015916415127259e-05, "loss": 0.1036, "loss_nan_ranks": 0, "loss_rank_avg": 0.05197940021753311, "step": 2460, "valid_targets_mean": 3285.9, "valid_targets_min": 1049 }, { "epoch": 2.788907753254103, "grad_norm": 0.48073478238853684, "learning_rate": 3.011053140861768e-05, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.06219557300209999, "step": 2465, "valid_targets_mean": 2464.9, "valid_targets_min": 771 }, { "epoch": 2.794567062818336, "grad_norm": 0.4222816152964138, "learning_rate": 3.006181822837964e-05, "loss": 0.1025, "loss_nan_ranks": 0, "loss_rank_avg": 0.0535898320376873, "step": 2470, "valid_targets_mean": 2959.5, "valid_targets_min": 825 }, { "epoch": 2.8002263723825696, "grad_norm": 0.5137217888589967, "learning_rate": 3.0013024998111856e-05, "loss": 0.116, "loss_nan_ranks": 0, "loss_rank_avg": 0.06423379480838776, "step": 2475, "valid_targets_mean": 2602.1, "valid_targets_min": 829 }, { "epoch": 2.8058856819468025, "grad_norm": 0.6608430897923827, "learning_rate": 2.9964152106004546e-05, "loss": 0.1102, "loss_nan_ranks": 0, "loss_rank_avg": 0.062066759914159775, "step": 2480, "valid_targets_mean": 2106.1, "valid_targets_min": 650 }, { "epoch": 2.8115449915110355, "grad_norm": 0.4491563125079627, "learning_rate": 2.9915199940881723e-05, "loss": 0.1081, "loss_nan_ranks": 0, "loss_rank_avg": 0.060543835163116455, "step": 2485, "valid_targets_mean": 2946.0, "valid_targets_min": 729 }, { "epoch": 2.817204301075269, "grad_norm": 0.2901989643151657, "learning_rate": 2.9866168892198067e-05, "loss": 0.0935, "loss_nan_ranks": 0, "loss_rank_avg": 0.03691372275352478, "step": 2490, "valid_targets_mean": 3853.5, "valid_targets_min": 3152 }, { "epoch": 2.822863610639502, "grad_norm": 0.31715286077111987, "learning_rate": 2.9817059350035858e-05, "loss": 0.0958, "loss_nan_ranks": 0, "loss_rank_avg": 0.03336600959300995, "step": 2495, "valid_targets_mean": 3448.2, "valid_targets_min": 2543 }, { "epoch": 2.828522920203735, "grad_norm": 0.44423757895685106, "learning_rate": 2.9767871705101834e-05, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.05750303715467453, "step": 2500, "valid_targets_mean": 2674.9, "valid_targets_min": 446 }, { "epoch": 2.8341822297679684, "grad_norm": 0.3714047560342441, "learning_rate": 2.9718606348724135e-05, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.042779020965099335, "step": 2505, "valid_targets_mean": 2807.6, "valid_targets_min": 681 }, { "epoch": 2.8398415393322014, "grad_norm": 0.45565095764546504, "learning_rate": 2.966926367284913e-05, "loss": 0.0975, "loss_nan_ranks": 0, "loss_rank_avg": 0.06783543527126312, "step": 2510, "valid_targets_mean": 5567.5, "valid_targets_min": 3772 }, { "epoch": 2.8455008488964344, "grad_norm": 0.31870357464902527, "learning_rate": 2.9619844070038336e-05, "loss": 0.0965, "loss_nan_ranks": 0, "loss_rank_avg": 0.04572061821818352, "step": 2515, "valid_targets_mean": 3662.4, "valid_targets_min": 484 }, { "epoch": 2.851160158460668, "grad_norm": 0.28353049541003644, "learning_rate": 2.957034793346531e-05, "loss": 0.0819, "loss_nan_ranks": 0, "loss_rank_avg": 0.035324037075042725, "step": 2520, "valid_targets_mean": 3900.0, "valid_targets_min": 861 }, { "epoch": 2.856819468024901, "grad_norm": 0.41454732495960667, "learning_rate": 2.9520775656912467e-05, "loss": 0.0969, "loss_nan_ranks": 0, "loss_rank_avg": 0.07399703562259674, "step": 2525, "valid_targets_mean": 4100.8, "valid_targets_min": 3268 }, { "epoch": 2.8624787775891343, "grad_norm": 0.3594007437946367, "learning_rate": 2.9471127634767992e-05, "loss": 0.097, "loss_nan_ranks": 0, "loss_rank_avg": 0.04679866135120392, "step": 2530, "valid_targets_mean": 3277.8, "valid_targets_min": 559 }, { "epoch": 2.8681380871533673, "grad_norm": 0.38766671277978854, "learning_rate": 2.9421404262022687e-05, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.044593460857868195, "step": 2535, "valid_targets_mean": 2986.2, "valid_targets_min": 689 }, { "epoch": 2.8737973967176007, "grad_norm": 0.5541215791435989, "learning_rate": 2.9371605934266826e-05, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.06732194870710373, "step": 2540, "valid_targets_mean": 1831.6, "valid_targets_min": 616 }, { "epoch": 2.8794567062818337, "grad_norm": 0.4653944890140849, "learning_rate": 2.9321733047687028e-05, "loss": 0.0785, "loss_nan_ranks": 0, "loss_rank_avg": 0.052152834832668304, "step": 2545, "valid_targets_mean": 2087.0, "valid_targets_min": 602 }, { "epoch": 2.8851160158460667, "grad_norm": 0.3697902152532082, "learning_rate": 2.9271785999063058e-05, "loss": 0.1201, "loss_nan_ranks": 0, "loss_rank_avg": 0.05232277512550354, "step": 2550, "valid_targets_mean": 3992.1, "valid_targets_min": 3551 }, { "epoch": 2.8907753254103, "grad_norm": 0.4102298567601552, "learning_rate": 2.922176518576473e-05, "loss": 0.0956, "loss_nan_ranks": 0, "loss_rank_avg": 0.03710225224494934, "step": 2555, "valid_targets_mean": 2115.1, "valid_targets_min": 596 }, { "epoch": 2.896434634974533, "grad_norm": 0.3506315433787024, "learning_rate": 2.9171671005748705e-05, "loss": 0.1021, "loss_nan_ranks": 0, "loss_rank_avg": 0.04065260291099548, "step": 2560, "valid_targets_mean": 3488.0, "valid_targets_min": 799 }, { "epoch": 2.902093944538766, "grad_norm": 0.43876156646589926, "learning_rate": 2.9121503857555337e-05, "loss": 0.1146, "loss_nan_ranks": 0, "loss_rank_avg": 0.0732661634683609, "step": 2565, "valid_targets_mean": 3078.9, "valid_targets_min": 706 }, { "epoch": 2.9077532541029996, "grad_norm": 0.4989205776297815, "learning_rate": 2.9071264140305504e-05, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.05086730048060417, "step": 2570, "valid_targets_mean": 1957.6, "valid_targets_min": 710 }, { "epoch": 2.9134125636672326, "grad_norm": 0.411276296598042, "learning_rate": 2.9020952253697417e-05, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.045306913554668427, "step": 2575, "valid_targets_mean": 3112.4, "valid_targets_min": 647 }, { "epoch": 2.9190718732314656, "grad_norm": 0.5328660391020346, "learning_rate": 2.8970568598003485e-05, "loss": 0.1019, "loss_nan_ranks": 0, "loss_rank_avg": 0.047358643263578415, "step": 2580, "valid_targets_mean": 1494.9, "valid_targets_min": 716 }, { "epoch": 2.924731182795699, "grad_norm": 0.3852799501619404, "learning_rate": 2.8920113574067063e-05, "loss": 0.0956, "loss_nan_ranks": 0, "loss_rank_avg": 0.05453154444694519, "step": 2585, "valid_targets_mean": 3669.5, "valid_targets_min": 3122 }, { "epoch": 2.930390492359932, "grad_norm": 0.4503646099363286, "learning_rate": 2.8869587583299315e-05, "loss": 0.0979, "loss_nan_ranks": 0, "loss_rank_avg": 0.051441676914691925, "step": 2590, "valid_targets_mean": 2399.1, "valid_targets_min": 832 }, { "epoch": 2.936049801924165, "grad_norm": 0.5372867608649338, "learning_rate": 2.8818991027676014e-05, "loss": 0.0854, "loss_nan_ranks": 0, "loss_rank_avg": 0.04305317997932434, "step": 2595, "valid_targets_mean": 1216.9, "valid_targets_min": 635 }, { "epoch": 2.9417091114883984, "grad_norm": 0.40304566483129606, "learning_rate": 2.876832430973432e-05, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.048321161419153214, "step": 2600, "valid_targets_mean": 3078.1, "valid_targets_min": 756 }, { "epoch": 2.9473684210526314, "grad_norm": 0.4502755032894269, "learning_rate": 2.8717587832569598e-05, "loss": 0.0881, "loss_nan_ranks": 0, "loss_rank_avg": 0.059124238789081573, "step": 2605, "valid_targets_mean": 2387.1, "valid_targets_min": 744 }, { "epoch": 2.953027730616865, "grad_norm": 0.3427640277748679, "learning_rate": 2.8666781999832198e-05, "loss": 0.0946, "loss_nan_ranks": 0, "loss_rank_avg": 0.03376740589737892, "step": 2610, "valid_targets_mean": 2088.4, "valid_targets_min": 529 }, { "epoch": 2.958687040181098, "grad_norm": 0.44946510033221493, "learning_rate": 2.8615907215724266e-05, "loss": 0.1061, "loss_nan_ranks": 0, "loss_rank_avg": 0.06872159242630005, "step": 2615, "valid_targets_mean": 3932.1, "valid_targets_min": 2017 }, { "epoch": 2.9643463497453313, "grad_norm": 0.2666267217286435, "learning_rate": 2.8564963884996494e-05, "loss": 0.0894, "loss_nan_ranks": 0, "loss_rank_avg": 0.03546273708343506, "step": 2620, "valid_targets_mean": 4790.0, "valid_targets_min": 516 }, { "epoch": 2.9700056593095643, "grad_norm": 0.364616438660843, "learning_rate": 2.851395241294493e-05, "loss": 0.088, "loss_nan_ranks": 0, "loss_rank_avg": 0.041498977690935135, "step": 2625, "valid_targets_mean": 2245.1, "valid_targets_min": 772 }, { "epoch": 2.9756649688737973, "grad_norm": 0.348973673917049, "learning_rate": 2.8462873205407747e-05, "loss": 0.0944, "loss_nan_ranks": 0, "loss_rank_avg": 0.046205684542655945, "step": 2630, "valid_targets_mean": 3851.0, "valid_targets_min": 2196 }, { "epoch": 2.9813242784380307, "grad_norm": 0.46190471072869965, "learning_rate": 2.8411726668761998e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.13584215939044952, "step": 2635, "valid_targets_mean": 3094.1, "valid_targets_min": 2759 }, { "epoch": 2.9869835880022637, "grad_norm": 0.3227746990944905, "learning_rate": 2.8360513209920388e-05, "loss": 0.1048, "loss_nan_ranks": 0, "loss_rank_avg": 0.03658788651227951, "step": 2640, "valid_targets_mean": 3760.2, "valid_targets_min": 3175 }, { "epoch": 2.9926428975664967, "grad_norm": 0.3837603633008106, "learning_rate": 2.8309233236328074e-05, "loss": 0.1043, "loss_nan_ranks": 0, "loss_rank_avg": 0.03533530980348587, "step": 2645, "valid_targets_mean": 2446.5, "valid_targets_min": 759 }, { "epoch": 2.99830220713073, "grad_norm": 0.4993258903053454, "learning_rate": 2.8257887155959352e-05, "loss": 0.1022, "loss_nan_ranks": 0, "loss_rank_avg": 0.10851038992404938, "step": 2650, "valid_targets_mean": 2332.5, "valid_targets_min": 927 }, { "epoch": 3.0033955857385397, "grad_norm": 0.4474466581519664, "learning_rate": 2.8206475377314486e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.08224907517433167, "step": 2655, "valid_targets_mean": 6116.6, "valid_targets_min": 4858 }, { "epoch": 3.009054895302773, "grad_norm": 0.3834057659347809, "learning_rate": 2.8154998309416404e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.08942107111215591, "step": 2660, "valid_targets_mean": 6616.0, "valid_targets_min": 4759 }, { "epoch": 3.014714204867006, "grad_norm": 0.38251126769579447, "learning_rate": 2.8103456361807473e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.08066676557064056, "step": 2665, "valid_targets_mean": 5258.1, "valid_targets_min": 4373 }, { "epoch": 3.0203735144312396, "grad_norm": 0.400000478072429, "learning_rate": 2.8051849944546225e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.09580092132091522, "step": 2670, "valid_targets_mean": 5849.6, "valid_targets_min": 4813 }, { "epoch": 3.0260328239954726, "grad_norm": 0.43763746681992655, "learning_rate": 2.80001794682041e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.09335286170244217, "step": 2675, "valid_targets_mean": 5604.5, "valid_targets_min": 3983 }, { "epoch": 3.0316921335597056, "grad_norm": 0.48759592075455604, "learning_rate": 2.7948445343862188e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.08601689338684082, "step": 2680, "valid_targets_mean": 6438.2, "valid_targets_min": 5154 }, { "epoch": 3.037351443123939, "grad_norm": 0.4005248763640473, "learning_rate": 2.7896647983107952e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.07797376066446304, "step": 2685, "valid_targets_mean": 5509.6, "valid_targets_min": 5040 }, { "epoch": 3.043010752688172, "grad_norm": 0.4567820303407952, "learning_rate": 2.784478779803194e-05, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.11923784762620926, "step": 2690, "valid_targets_mean": 6410.5, "valid_targets_min": 5066 }, { "epoch": 3.048670062252405, "grad_norm": 0.4018410434737254, "learning_rate": 2.7792865201224536e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.07983622699975967, "step": 2695, "valid_targets_mean": 6616.2, "valid_targets_min": 4500 }, { "epoch": 3.0543293718166384, "grad_norm": 0.42280164910105855, "learning_rate": 2.7740880605772644e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.10148809850215912, "step": 2700, "valid_targets_mean": 7507.6, "valid_targets_min": 5455 }, { "epoch": 3.0599886813808714, "grad_norm": 0.40674098351312155, "learning_rate": 2.7688834425256426e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.09895728528499603, "step": 2705, "valid_targets_mean": 7383.8, "valid_targets_min": 4715 }, { "epoch": 3.065647990945105, "grad_norm": 0.36990046485579053, "learning_rate": 2.7636727073746015e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.0861731767654419, "step": 2710, "valid_targets_mean": 6624.9, "valid_targets_min": 5315 }, { "epoch": 3.071307300509338, "grad_norm": 0.3662529670090019, "learning_rate": 2.7584558965798183e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.09385193884372711, "step": 2715, "valid_targets_mean": 7394.5, "valid_targets_min": 4353 }, { "epoch": 3.076966610073571, "grad_norm": 0.476285721677575, "learning_rate": 2.7532330516453094e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.08194148540496826, "step": 2720, "valid_targets_mean": 6296.0, "valid_targets_min": 4890 }, { "epoch": 3.0826259196378043, "grad_norm": 0.4001613005928641, "learning_rate": 2.7480042141230963e-05, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.0721985325217247, "step": 2725, "valid_targets_mean": 5848.5, "valid_targets_min": 4560 }, { "epoch": 3.0882852292020373, "grad_norm": 0.4520142971167075, "learning_rate": 2.7427694256128776e-05, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.09193578362464905, "step": 2730, "valid_targets_mean": 5550.9, "valid_targets_min": 3640 }, { "epoch": 3.0939445387662703, "grad_norm": 0.5140528274529098, "learning_rate": 2.737528727761696e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.09765416383743286, "step": 2735, "valid_targets_mean": 5894.4, "valid_targets_min": 3967 }, { "epoch": 3.0996038483305037, "grad_norm": 0.3994772187194201, "learning_rate": 2.7322821622636077e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.08106030523777008, "step": 2740, "valid_targets_mean": 6153.9, "valid_targets_min": 4521 }, { "epoch": 3.1052631578947367, "grad_norm": 0.4273215647315338, "learning_rate": 2.7270297708593517e-05, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.08103308826684952, "step": 2745, "valid_targets_mean": 6440.5, "valid_targets_min": 5067 }, { "epoch": 3.11092246745897, "grad_norm": 0.4133850486345733, "learning_rate": 2.7217715953360166e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.07770150154829025, "step": 2750, "valid_targets_mean": 6049.2, "valid_targets_min": 4385 }, { "epoch": 3.116581777023203, "grad_norm": 0.34763851050877514, "learning_rate": 2.716507677526707e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.07968132197856903, "step": 2755, "valid_targets_mean": 7771.6, "valid_targets_min": 4566 }, { "epoch": 3.122241086587436, "grad_norm": 0.3658412345569811, "learning_rate": 2.711238059310215e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.08296516537666321, "step": 2760, "valid_targets_mean": 6633.6, "valid_targets_min": 5067 }, { "epoch": 3.1279003961516696, "grad_norm": 0.4022203908775496, "learning_rate": 2.7059627826106817e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.08426246792078018, "step": 2765, "valid_targets_mean": 6862.6, "valid_targets_min": 5178 }, { "epoch": 3.1335597057159026, "grad_norm": 0.36101301045305095, "learning_rate": 2.700681889397267e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.08576173335313797, "step": 2770, "valid_targets_mean": 6075.1, "valid_targets_min": 3854 }, { "epoch": 3.139219015280136, "grad_norm": 0.38940482167263113, "learning_rate": 2.6953954216838148e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.103759765625, "step": 2775, "valid_targets_mean": 6840.1, "valid_targets_min": 4743 }, { "epoch": 3.144878324844369, "grad_norm": 0.42119432839413173, "learning_rate": 2.6901034215285182e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.11053457856178284, "step": 2780, "valid_targets_mean": 6480.9, "valid_targets_min": 4761 }, { "epoch": 3.150537634408602, "grad_norm": 0.38769543749848867, "learning_rate": 2.684805931033586e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.08253707736730576, "step": 2785, "valid_targets_mean": 6224.5, "valid_targets_min": 4789 }, { "epoch": 3.1561969439728355, "grad_norm": 0.4282214287537209, "learning_rate": 2.679502992344907e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.08985629677772522, "step": 2790, "valid_targets_mean": 6686.4, "valid_targets_min": 5403 }, { "epoch": 3.1618562535370685, "grad_norm": 0.41290216643054406, "learning_rate": 2.6741946476517146e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.08517882227897644, "step": 2795, "valid_targets_mean": 6285.0, "valid_targets_min": 4970 }, { "epoch": 3.1675155631013014, "grad_norm": 0.3814241100551298, "learning_rate": 2.6688809391862523e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.09944672882556915, "step": 2800, "valid_targets_mean": 6926.9, "valid_targets_min": 5299 }, { "epoch": 3.173174872665535, "grad_norm": 0.3698913524612867, "learning_rate": 2.663561909223435e-05, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.08579894155263901, "step": 2805, "valid_targets_mean": 6121.8, "valid_targets_min": 4951 }, { "epoch": 3.178834182229768, "grad_norm": 0.37507158309419764, "learning_rate": 2.6582376000805165e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.08966280519962311, "step": 2810, "valid_targets_mean": 8113.1, "valid_targets_min": 4794 }, { "epoch": 3.1844934917940013, "grad_norm": 0.41938823779454215, "learning_rate": 2.6529080541167495e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.09570719301700592, "step": 2815, "valid_targets_mean": 5281.6, "valid_targets_min": 593 }, { "epoch": 3.1901528013582343, "grad_norm": 0.3576745054687525, "learning_rate": 2.6475733137330507e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.07610517740249634, "step": 2820, "valid_targets_mean": 7339.1, "valid_targets_min": 4595 }, { "epoch": 3.1958121109224673, "grad_norm": 0.37485748388357865, "learning_rate": 2.6422334213716624e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.07846750319004059, "step": 2825, "valid_targets_mean": 6674.0, "valid_targets_min": 5411 }, { "epoch": 3.2014714204867007, "grad_norm": 0.39479740390012996, "learning_rate": 2.6368884195158143e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.0896659716963768, "step": 2830, "valid_targets_mean": 6596.2, "valid_targets_min": 4451 }, { "epoch": 3.2071307300509337, "grad_norm": 0.40341629615302077, "learning_rate": 2.6315383506893876e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.09459621459245682, "step": 2835, "valid_targets_mean": 7159.2, "valid_targets_min": 5568 }, { "epoch": 3.212790039615167, "grad_norm": 0.3918402890328763, "learning_rate": 2.6261832574565752e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.10028786957263947, "step": 2840, "valid_targets_mean": 6923.1, "valid_targets_min": 4839 }, { "epoch": 3.2184493491794, "grad_norm": 0.44570531285265286, "learning_rate": 2.6208231824215417e-05, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.07951401174068451, "step": 2845, "valid_targets_mean": 4921.4, "valid_targets_min": 3517 }, { "epoch": 3.224108658743633, "grad_norm": 0.39736569597017907, "learning_rate": 2.6154581682280892e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.07940314710140228, "step": 2850, "valid_targets_mean": 5929.9, "valid_targets_min": 3551 }, { "epoch": 3.2297679683078666, "grad_norm": 0.43576786309433435, "learning_rate": 2.610088257559311e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.07687495648860931, "step": 2855, "valid_targets_mean": 5854.9, "valid_targets_min": 4614 }, { "epoch": 3.2354272778720996, "grad_norm": 0.39667426144543194, "learning_rate": 2.604713493137259e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.0954388827085495, "step": 2860, "valid_targets_mean": 6779.1, "valid_targets_min": 5050 }, { "epoch": 3.2410865874363326, "grad_norm": 0.39211282940314196, "learning_rate": 2.5993339177226002e-05, "loss": 0.1676, "loss_nan_ranks": 0, "loss_rank_avg": 0.08446860313415527, "step": 2865, "valid_targets_mean": 5993.4, "valid_targets_min": 4734 }, { "epoch": 3.246745897000566, "grad_norm": 0.37180973272400625, "learning_rate": 2.593949574114274e-05, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.08481285721063614, "step": 2870, "valid_targets_mean": 6826.9, "valid_targets_min": 4966 }, { "epoch": 3.252405206564799, "grad_norm": 0.38890138005202446, "learning_rate": 2.5885605051491592e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.076046884059906, "step": 2875, "valid_targets_mean": 6366.5, "valid_targets_min": 4510 }, { "epoch": 3.258064516129032, "grad_norm": 0.3764722912174805, "learning_rate": 2.583166753701725e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.06771224737167358, "step": 2880, "valid_targets_mean": 5248.9, "valid_targets_min": 4430 }, { "epoch": 3.2637238256932655, "grad_norm": 0.3707213763979597, "learning_rate": 2.5777683626836964e-05, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.07067465782165527, "step": 2885, "valid_targets_mean": 5854.6, "valid_targets_min": 4701 }, { "epoch": 3.2693831352574985, "grad_norm": 0.38176253383761427, "learning_rate": 2.5723653750437083e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.08251985907554626, "step": 2890, "valid_targets_mean": 6520.2, "valid_targets_min": 4501 }, { "epoch": 3.275042444821732, "grad_norm": 0.3696783228124919, "learning_rate": 2.5669578337669653e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.08970288187265396, "step": 2895, "valid_targets_mean": 6796.4, "valid_targets_min": 3640 }, { "epoch": 3.280701754385965, "grad_norm": 0.5997009652550589, "learning_rate": 2.5615457818749007e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.08683329820632935, "step": 2900, "valid_targets_mean": 6024.8, "valid_targets_min": 5024 }, { "epoch": 3.286361063950198, "grad_norm": 0.3970354064915422, "learning_rate": 2.5561292624248344e-05, "loss": 0.2036, "loss_nan_ranks": 0, "loss_rank_avg": 0.09823933243751526, "step": 2905, "valid_targets_mean": 6549.4, "valid_targets_min": 4715 }, { "epoch": 3.2920203735144313, "grad_norm": 0.4040600633209962, "learning_rate": 2.5507083185096267e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.0729404091835022, "step": 2910, "valid_targets_mean": 5681.1, "valid_targets_min": 4730 }, { "epoch": 3.2976796830786643, "grad_norm": 0.40529122982296795, "learning_rate": 2.545282993257341e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.08735214918851852, "step": 2915, "valid_targets_mean": 5787.6, "valid_targets_min": 4657 }, { "epoch": 3.3033389926428978, "grad_norm": 0.38732883346244273, "learning_rate": 2.5398533298308956e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.08877654373645782, "step": 2920, "valid_targets_mean": 6862.9, "valid_targets_min": 5599 }, { "epoch": 3.3089983022071308, "grad_norm": 0.5611570775932486, "learning_rate": 2.534419371427724e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.11140226572751999, "step": 2925, "valid_targets_mean": 6471.2, "valid_targets_min": 4948 }, { "epoch": 3.3146576117713638, "grad_norm": 0.43561660126955126, "learning_rate": 2.5289811612794297e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.09498600661754608, "step": 2930, "valid_targets_mean": 7644.9, "valid_targets_min": 4876 }, { "epoch": 3.320316921335597, "grad_norm": 0.39243379533926886, "learning_rate": 2.5235387426514405e-05, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.07330992817878723, "step": 2935, "valid_targets_mean": 5750.1, "valid_targets_min": 3599 }, { "epoch": 3.32597623089983, "grad_norm": 0.3950361179379625, "learning_rate": 2.5180921588426693e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.10302229225635529, "step": 2940, "valid_targets_mean": 7335.2, "valid_targets_min": 4800 }, { "epoch": 3.331635540464063, "grad_norm": 0.34118533977997895, "learning_rate": 2.5126414531851634e-05, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.06809462606906891, "step": 2945, "valid_targets_mean": 7088.9, "valid_targets_min": 4228 }, { "epoch": 3.3372948500282966, "grad_norm": 0.40089882561464724, "learning_rate": 2.507186669043764e-05, "loss": 0.167, "loss_nan_ranks": 0, "loss_rank_avg": 0.08894894272089005, "step": 2950, "valid_targets_mean": 6421.2, "valid_targets_min": 5314 }, { "epoch": 3.3429541595925296, "grad_norm": 0.3809360499548981, "learning_rate": 2.5017278498157608e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.08135772496461868, "step": 2955, "valid_targets_mean": 6345.4, "valid_targets_min": 4634 }, { "epoch": 3.348613469156763, "grad_norm": 0.401319262721283, "learning_rate": 2.496265038930545e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.07413016259670258, "step": 2960, "valid_targets_mean": 5758.2, "valid_targets_min": 4521 }, { "epoch": 3.354272778720996, "grad_norm": 0.4181749873395065, "learning_rate": 2.4907982798492647e-05, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.07992276549339294, "step": 2965, "valid_targets_mean": 5346.1, "valid_targets_min": 4180 }, { "epoch": 3.359932088285229, "grad_norm": 0.37821898461591213, "learning_rate": 2.485327616064479e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.09109698235988617, "step": 2970, "valid_targets_mean": 7561.1, "valid_targets_min": 4791 }, { "epoch": 3.3655913978494625, "grad_norm": 0.42463483961812915, "learning_rate": 2.4798530910998126e-05, "loss": 0.1693, "loss_nan_ranks": 0, "loss_rank_avg": 0.07687358558177948, "step": 2975, "valid_targets_mean": 6135.1, "valid_targets_min": 4670 }, { "epoch": 3.3712507074136955, "grad_norm": 0.4168973212704639, "learning_rate": 2.474374748509609e-05, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.08751700818538666, "step": 2980, "valid_targets_mean": 6526.8, "valid_targets_min": 4806 }, { "epoch": 3.376910016977929, "grad_norm": 0.4377975902513151, "learning_rate": 2.4688926318785845e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.07013484835624695, "step": 2985, "valid_targets_mean": 5486.9, "valid_targets_min": 4453 }, { "epoch": 3.382569326542162, "grad_norm": 0.37451008367015687, "learning_rate": 2.4634067848214797e-05, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.09076303988695145, "step": 2990, "valid_targets_mean": 7182.4, "valid_targets_min": 5687 }, { "epoch": 3.388228636106395, "grad_norm": 0.39214339758244726, "learning_rate": 2.4579172509827146e-05, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.07283439487218857, "step": 2995, "valid_targets_mean": 6945.2, "valid_targets_min": 4964 }, { "epoch": 3.3938879456706283, "grad_norm": 0.34687787029362777, "learning_rate": 2.4524240740360404e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.08273832499980927, "step": 3000, "valid_targets_mean": 7281.2, "valid_targets_min": 5625 }, { "epoch": 3.3995472552348613, "grad_norm": 0.39512915127755643, "learning_rate": 2.4469272976841925e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.07421189546585083, "step": 3005, "valid_targets_mean": 6706.9, "valid_targets_min": 5006 }, { "epoch": 3.4052065647990943, "grad_norm": 0.3837267214169814, "learning_rate": 2.441426965658543e-05, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.08413764834403992, "step": 3010, "valid_targets_mean": 6947.8, "valid_targets_min": 5252 }, { "epoch": 3.4108658743633278, "grad_norm": 0.3987996482159172, "learning_rate": 2.4359231217187508e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.08512748777866364, "step": 3015, "valid_targets_mean": 6373.1, "valid_targets_min": 5071 }, { "epoch": 3.4165251839275608, "grad_norm": 0.42740405345315763, "learning_rate": 2.430415809652416e-05, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.09217800945043564, "step": 3020, "valid_targets_mean": 6664.0, "valid_targets_min": 3440 }, { "epoch": 3.4221844934917938, "grad_norm": 0.4565520082770164, "learning_rate": 2.4249050732747302e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.05961686745285988, "step": 3025, "valid_targets_mean": 3621.8, "valid_targets_min": 393 }, { "epoch": 3.427843803056027, "grad_norm": 0.46328547075081156, "learning_rate": 2.4193909564281288e-05, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.04435160011053085, "step": 3030, "valid_targets_mean": 2602.0, "valid_targets_min": 816 }, { "epoch": 3.43350311262026, "grad_norm": 0.37137173861478123, "learning_rate": 2.4138735029819418e-05, "loss": 0.0901, "loss_nan_ranks": 0, "loss_rank_avg": 0.04348450154066086, "step": 3035, "valid_targets_mean": 3217.9, "valid_targets_min": 2461 }, { "epoch": 3.4391624221844936, "grad_norm": 0.39992157414840956, "learning_rate": 2.408352756832042e-05, "loss": 0.0875, "loss_nan_ranks": 0, "loss_rank_avg": 0.04790376126766205, "step": 3040, "valid_targets_mean": 3767.2, "valid_targets_min": 2571 }, { "epoch": 3.4448217317487266, "grad_norm": 0.35293050494196204, "learning_rate": 2.402828761900502e-05, "loss": 0.1059, "loss_nan_ranks": 0, "loss_rank_avg": 0.042876340448856354, "step": 3045, "valid_targets_mean": 3830.4, "valid_targets_min": 2582 }, { "epoch": 3.4504810413129596, "grad_norm": 0.5742800954287768, "learning_rate": 2.3973015621352382e-05, "loss": 0.0869, "loss_nan_ranks": 0, "loss_rank_avg": 0.036809295415878296, "step": 3050, "valid_targets_mean": 3032.0, "valid_targets_min": 1198 }, { "epoch": 3.456140350877193, "grad_norm": 0.7703852038293989, "learning_rate": 2.3917712015096664e-05, "loss": 0.1064, "loss_nan_ranks": 0, "loss_rank_avg": 0.06168600916862488, "step": 3055, "valid_targets_mean": 974.9, "valid_targets_min": 525 }, { "epoch": 3.461799660441426, "grad_norm": 0.4488567722071903, "learning_rate": 2.386237724022348e-05, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.052345506846904755, "step": 3060, "valid_targets_mean": 3010.8, "valid_targets_min": 954 }, { "epoch": 3.4674589700056595, "grad_norm": 0.4394392338230334, "learning_rate": 2.3807011736966414e-05, "loss": 0.095, "loss_nan_ranks": 0, "loss_rank_avg": 0.0646510049700737, "step": 3065, "valid_targets_mean": 3078.4, "valid_targets_min": 863 }, { "epoch": 3.4731182795698925, "grad_norm": 0.33509251616177965, "learning_rate": 2.3751615945803547e-05, "loss": 0.1027, "loss_nan_ranks": 0, "loss_rank_avg": 0.04230031371116638, "step": 3070, "valid_targets_mean": 2921.1, "valid_targets_min": 540 }, { "epoch": 3.4787775891341255, "grad_norm": 0.2933598862510744, "learning_rate": 2.3696190307453883e-05, "loss": 0.1109, "loss_nan_ranks": 0, "loss_rank_avg": 0.03300682455301285, "step": 3075, "valid_targets_mean": 4658.5, "valid_targets_min": 1008 }, { "epoch": 3.484436898698359, "grad_norm": 0.3443708556168441, "learning_rate": 2.364073526287392e-05, "loss": 0.0871, "loss_nan_ranks": 0, "loss_rank_avg": 0.042443834245204926, "step": 3080, "valid_targets_mean": 3757.0, "valid_targets_min": 818 }, { "epoch": 3.490096208262592, "grad_norm": 0.32342934598558776, "learning_rate": 2.358525125325409e-05, "loss": 0.0911, "loss_nan_ranks": 0, "loss_rank_avg": 0.03649405390024185, "step": 3085, "valid_targets_mean": 4063.0, "valid_targets_min": 2642 }, { "epoch": 3.495755517826825, "grad_norm": 0.5233099293331086, "learning_rate": 2.352973872001527e-05, "loss": 0.1005, "loss_nan_ranks": 0, "loss_rank_avg": 0.09330583363771439, "step": 3090, "valid_targets_mean": 2844.0, "valid_targets_min": 614 }, { "epoch": 3.5014148273910584, "grad_norm": 0.3713693899571308, "learning_rate": 2.347419810480527e-05, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.03937401995062828, "step": 3095, "valid_targets_mean": 3617.4, "valid_targets_min": 2537 }, { "epoch": 3.5070741369552914, "grad_norm": 0.5342177275371015, "learning_rate": 2.34186298494953e-05, "loss": 0.0902, "loss_nan_ranks": 0, "loss_rank_avg": 0.05524876341223717, "step": 3100, "valid_targets_mean": 1941.8, "valid_targets_min": 674 }, { "epoch": 3.5127334465195243, "grad_norm": 0.32478754183719977, "learning_rate": 2.3363034396176486e-05, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.03607283532619476, "step": 3105, "valid_targets_mean": 3252.2, "valid_targets_min": 987 }, { "epoch": 3.518392756083758, "grad_norm": 0.34568450638192383, "learning_rate": 2.3307412187156334e-05, "loss": 0.0796, "loss_nan_ranks": 0, "loss_rank_avg": 0.036379989236593246, "step": 3110, "valid_targets_mean": 3654.8, "valid_targets_min": 2616 }, { "epoch": 3.524052065647991, "grad_norm": 0.446074380238172, "learning_rate": 2.3251763664955208e-05, "loss": 0.1069, "loss_nan_ranks": 0, "loss_rank_avg": 0.040246620774269104, "step": 3115, "valid_targets_mean": 2054.1, "valid_targets_min": 714 }, { "epoch": 3.5297113752122242, "grad_norm": 0.46251594514856853, "learning_rate": 2.3196089272302813e-05, "loss": 0.1032, "loss_nan_ranks": 0, "loss_rank_avg": 0.047611210495233536, "step": 3120, "valid_targets_mean": 2018.1, "valid_targets_min": 893 }, { "epoch": 3.535370684776457, "grad_norm": 0.43018554505934625, "learning_rate": 2.3140389452134677e-05, "loss": 0.1043, "loss_nan_ranks": 0, "loss_rank_avg": 0.053366247564554214, "step": 3125, "valid_targets_mean": 3815.4, "valid_targets_min": 3061 }, { "epoch": 3.5410299943406907, "grad_norm": 0.38989614452081606, "learning_rate": 2.3084664647588636e-05, "loss": 0.1001, "loss_nan_ranks": 0, "loss_rank_avg": 0.05068257078528404, "step": 3130, "valid_targets_mean": 3584.0, "valid_targets_min": 1810 }, { "epoch": 3.5466893039049237, "grad_norm": 0.33899258716770153, "learning_rate": 2.3028915302001286e-05, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.03708091750741005, "step": 3135, "valid_targets_mean": 3354.2, "valid_targets_min": 902 }, { "epoch": 3.5523486134691566, "grad_norm": 0.479265531070496, "learning_rate": 2.297314185890446e-05, "loss": 0.0872, "loss_nan_ranks": 0, "loss_rank_avg": 0.04440346360206604, "step": 3140, "valid_targets_mean": 2775.8, "valid_targets_min": 711 }, { "epoch": 3.55800792303339, "grad_norm": 0.670543564360072, "learning_rate": 2.291734476202173e-05, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.05753045901656151, "step": 3145, "valid_targets_mean": 1493.0, "valid_targets_min": 643 }, { "epoch": 3.563667232597623, "grad_norm": 0.5391448054021986, "learning_rate": 2.286152445526482e-05, "loss": 0.1134, "loss_nan_ranks": 0, "loss_rank_avg": 0.04792678728699684, "step": 3150, "valid_targets_mean": 2481.8, "valid_targets_min": 538 }, { "epoch": 3.569326542161856, "grad_norm": 0.4195015177774701, "learning_rate": 2.2805681382730142e-05, "loss": 0.0912, "loss_nan_ranks": 0, "loss_rank_avg": 0.028936494141817093, "step": 3155, "valid_targets_mean": 2257.2, "valid_targets_min": 664 }, { "epoch": 3.5749858517260895, "grad_norm": 0.5865427341283793, "learning_rate": 2.2749815988695208e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.09612908959388733, "step": 3160, "valid_targets_mean": 2451.9, "valid_targets_min": 1180 }, { "epoch": 3.5806451612903225, "grad_norm": 0.4682729700077621, "learning_rate": 2.2693928717615118e-05, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.03941601514816284, "step": 3165, "valid_targets_mean": 1885.5, "valid_targets_min": 756 }, { "epoch": 3.5863044708545555, "grad_norm": 0.342242583693858, "learning_rate": 2.2638020014119033e-05, "loss": 0.1034, "loss_nan_ranks": 0, "loss_rank_avg": 0.03896958753466606, "step": 3170, "valid_targets_mean": 3355.1, "valid_targets_min": 2963 }, { "epoch": 3.591963780418789, "grad_norm": 0.6921453617996776, "learning_rate": 2.2582090323006603e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.1678619682788849, "step": 3175, "valid_targets_mean": 2357.1, "valid_targets_min": 1153 }, { "epoch": 3.597623089983022, "grad_norm": 0.31611802316350174, "learning_rate": 2.2526140089244483e-05, "loss": 0.108, "loss_nan_ranks": 0, "loss_rank_avg": 0.04150187224149704, "step": 3180, "valid_targets_mean": 4602.2, "valid_targets_min": 3507 }, { "epoch": 3.6032823995472554, "grad_norm": 0.3350914314311627, "learning_rate": 2.247016975796274e-05, "loss": 0.0901, "loss_nan_ranks": 0, "loss_rank_avg": 0.04903364181518555, "step": 3185, "valid_targets_mean": 4597.1, "valid_targets_min": 3835 }, { "epoch": 3.6089417091114884, "grad_norm": 0.40270627304143364, "learning_rate": 2.2414179774451333e-05, "loss": 0.1007, "loss_nan_ranks": 0, "loss_rank_avg": 0.04972846806049347, "step": 3190, "valid_targets_mean": 3571.6, "valid_targets_min": 784 }, { "epoch": 3.614601018675722, "grad_norm": 0.415917999569666, "learning_rate": 2.2358170584156577e-05, "loss": 0.0865, "loss_nan_ranks": 0, "loss_rank_avg": 0.034407228231430054, "step": 3195, "valid_targets_mean": 1951.9, "valid_targets_min": 779 }, { "epoch": 3.620260328239955, "grad_norm": 0.5217860854709225, "learning_rate": 2.2302142632677605e-05, "loss": 0.0919, "loss_nan_ranks": 0, "loss_rank_avg": 0.042375870048999786, "step": 3200, "valid_targets_mean": 2124.8, "valid_targets_min": 674 }, { "epoch": 3.625919637804188, "grad_norm": 0.44254199276435036, "learning_rate": 2.2246096365762782e-05, "loss": 0.0831, "loss_nan_ranks": 0, "loss_rank_avg": 0.04500596970319748, "step": 3205, "valid_targets_mean": 2388.5, "valid_targets_min": 712 }, { "epoch": 3.6315789473684212, "grad_norm": 0.3665353563421478, "learning_rate": 2.2190032229306215e-05, "loss": 0.0894, "loss_nan_ranks": 0, "loss_rank_avg": 0.04064202308654785, "step": 3210, "valid_targets_mean": 3521.6, "valid_targets_min": 2422 }, { "epoch": 3.6372382569326542, "grad_norm": 0.34605379460700103, "learning_rate": 2.2133950669344156e-05, "loss": 0.0767, "loss_nan_ranks": 0, "loss_rank_avg": 0.02806910313665867, "step": 3215, "valid_targets_mean": 3248.5, "valid_targets_min": 576 }, { "epoch": 3.6428975664968872, "grad_norm": 0.30931044690920806, "learning_rate": 2.207785213205149e-05, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.023745758458971977, "step": 3220, "valid_targets_mean": 3581.9, "valid_targets_min": 772 }, { "epoch": 3.6485568760611207, "grad_norm": 0.43922432142537926, "learning_rate": 2.202173706373817e-05, "loss": 0.0751, "loss_nan_ranks": 0, "loss_rank_avg": 0.03783226013183594, "step": 3225, "valid_targets_mean": 2654.1, "valid_targets_min": 722 }, { "epoch": 3.6542161856253537, "grad_norm": 0.3477209012773255, "learning_rate": 2.1965605910845654e-05, "loss": 0.0779, "loss_nan_ranks": 0, "loss_rank_avg": 0.04104755073785782, "step": 3230, "valid_targets_mean": 3685.9, "valid_targets_min": 2788 }, { "epoch": 3.6598754951895867, "grad_norm": 0.3768374199903355, "learning_rate": 2.1909459119943384e-05, "loss": 0.0805, "loss_nan_ranks": 0, "loss_rank_avg": 0.0392816886305809, "step": 3235, "valid_targets_mean": 2503.4, "valid_targets_min": 614 }, { "epoch": 3.66553480475382, "grad_norm": 0.6007344213267962, "learning_rate": 2.1853297137725204e-05, "loss": 0.1136, "loss_nan_ranks": 0, "loss_rank_avg": 0.11411529779434204, "step": 3240, "valid_targets_mean": 1719.4, "valid_targets_min": 608 }, { "epoch": 3.671194114318053, "grad_norm": 0.3754157879242706, "learning_rate": 2.1797120411005807e-05, "loss": 0.0982, "loss_nan_ranks": 0, "loss_rank_avg": 0.042109765112400055, "step": 3245, "valid_targets_mean": 3966.6, "valid_targets_min": 3150 }, { "epoch": 3.676853423882286, "grad_norm": 0.5445762559868512, "learning_rate": 2.1740929386717222e-05, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.05597252771258354, "step": 3250, "valid_targets_mean": 2366.1, "valid_targets_min": 718 }, { "epoch": 3.6825127334465195, "grad_norm": 0.42769001995635586, "learning_rate": 2.1684724511905193e-05, "loss": 0.0934, "loss_nan_ranks": 0, "loss_rank_avg": 0.04565860331058502, "step": 3255, "valid_targets_mean": 3555.2, "valid_targets_min": 1333 }, { "epoch": 3.688172043010753, "grad_norm": 0.44318255157550557, "learning_rate": 2.1628506233725678e-05, "loss": 0.1119, "loss_nan_ranks": 0, "loss_rank_avg": 0.041587576270103455, "step": 3260, "valid_targets_mean": 2041.2, "valid_targets_min": 693 }, { "epoch": 3.693831352574986, "grad_norm": 0.4537669446711333, "learning_rate": 2.1572274999441265e-05, "loss": 0.1235, "loss_nan_ranks": 0, "loss_rank_avg": 0.036606110632419586, "step": 3265, "valid_targets_mean": 1494.2, "valid_targets_min": 803 }, { "epoch": 3.699490662139219, "grad_norm": 0.38686037920354616, "learning_rate": 2.151603125641761e-05, "loss": 0.0984, "loss_nan_ranks": 0, "loss_rank_avg": 0.07212714850902557, "step": 3270, "valid_targets_mean": 2762.1, "valid_targets_min": 902 }, { "epoch": 3.7051499717034524, "grad_norm": 0.47568407094967713, "learning_rate": 2.1459775452119898e-05, "loss": 0.1123, "loss_nan_ranks": 0, "loss_rank_avg": 0.04315885156393051, "step": 3275, "valid_targets_mean": 3572.5, "valid_targets_min": 2393 }, { "epoch": 3.7108092812676854, "grad_norm": 0.35866653739893223, "learning_rate": 2.1403508034109262e-05, "loss": 0.0951, "loss_nan_ranks": 0, "loss_rank_avg": 0.030487315729260445, "step": 3280, "valid_targets_mean": 3086.6, "valid_targets_min": 804 }, { "epoch": 3.7164685908319184, "grad_norm": 0.344859782354928, "learning_rate": 2.1347229450039237e-05, "loss": 0.0932, "loss_nan_ranks": 0, "loss_rank_avg": 0.0409947969019413, "step": 3285, "valid_targets_mean": 5223.5, "valid_targets_min": 4147 }, { "epoch": 3.722127900396152, "grad_norm": 0.39780389555566287, "learning_rate": 2.12909401476522e-05, "loss": 0.0808, "loss_nan_ranks": 0, "loss_rank_avg": 0.052354902029037476, "step": 3290, "valid_targets_mean": 4369.2, "valid_targets_min": 871 }, { "epoch": 3.727787209960385, "grad_norm": 0.28502767625047915, "learning_rate": 2.1234640574775783e-05, "loss": 0.0771, "loss_nan_ranks": 0, "loss_rank_avg": 0.02787552773952484, "step": 3295, "valid_targets_mean": 4207.1, "valid_targets_min": 896 }, { "epoch": 3.733446519524618, "grad_norm": 0.35279233295246115, "learning_rate": 2.1178331179319336e-05, "loss": 0.088, "loss_nan_ranks": 0, "loss_rank_avg": 0.043562762439250946, "step": 3300, "valid_targets_mean": 3603.9, "valid_targets_min": 2862 }, { "epoch": 3.7391058290888513, "grad_norm": 0.6045679331388665, "learning_rate": 2.112201240927037e-05, "loss": 0.1066, "loss_nan_ranks": 0, "loss_rank_avg": 0.06445741653442383, "step": 3305, "valid_targets_mean": 1776.4, "valid_targets_min": 497 }, { "epoch": 3.7447651386530842, "grad_norm": 0.41700082787673637, "learning_rate": 2.1065684712690954e-05, "loss": 0.0919, "loss_nan_ranks": 0, "loss_rank_avg": 0.05462094396352768, "step": 3310, "valid_targets_mean": 4063.8, "valid_targets_min": 3217 }, { "epoch": 3.7504244482173172, "grad_norm": 0.47105077925347255, "learning_rate": 2.1009348537714194e-05, "loss": 0.1009, "loss_nan_ranks": 0, "loss_rank_avg": 0.04253324121236801, "step": 3315, "valid_targets_mean": 2245.1, "valid_targets_min": 901 }, { "epoch": 3.7560837577815507, "grad_norm": 0.3781290654660693, "learning_rate": 2.0953004332540644e-05, "loss": 0.0755, "loss_nan_ranks": 0, "loss_rank_avg": 0.03992723301053047, "step": 3320, "valid_targets_mean": 3350.9, "valid_targets_min": 905 }, { "epoch": 3.7617430673457837, "grad_norm": 0.4585858979255781, "learning_rate": 2.089665254543473e-05, "loss": 0.0975, "loss_nan_ranks": 0, "loss_rank_avg": 0.06727780401706696, "step": 3325, "valid_targets_mean": 3223.2, "valid_targets_min": 1181 }, { "epoch": 3.767402376910017, "grad_norm": 0.42217539231813284, "learning_rate": 2.0840293624721234e-05, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.03888125717639923, "step": 3330, "valid_targets_mean": 3718.1, "valid_targets_min": 3184 }, { "epoch": 3.77306168647425, "grad_norm": 0.579536581426898, "learning_rate": 2.0783928018781644e-05, "loss": 0.0833, "loss_nan_ranks": 0, "loss_rank_avg": 0.07282514870166779, "step": 3335, "valid_targets_mean": 2082.6, "valid_targets_min": 650 }, { "epoch": 3.7787209960384835, "grad_norm": 0.517663613067983, "learning_rate": 2.0727556176050676e-05, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.046402908861637115, "step": 3340, "valid_targets_mean": 1639.8, "valid_targets_min": 827 }, { "epoch": 3.7843803056027165, "grad_norm": 0.534794827416597, "learning_rate": 2.0671178545012643e-05, "loss": 0.0945, "loss_nan_ranks": 0, "loss_rank_avg": 0.05245472490787506, "step": 3345, "valid_targets_mean": 1642.2, "valid_targets_min": 940 }, { "epoch": 3.7900396151669495, "grad_norm": 0.37804680274866975, "learning_rate": 2.0614795574197907e-05, "loss": 0.101, "loss_nan_ranks": 0, "loss_rank_avg": 0.03373146057128906, "step": 3350, "valid_targets_mean": 2931.0, "valid_targets_min": 958 }, { "epoch": 3.795698924731183, "grad_norm": 0.5595591873372421, "learning_rate": 2.0558407712179334e-05, "loss": 0.0925, "loss_nan_ranks": 0, "loss_rank_avg": 0.03488003835082054, "step": 3355, "valid_targets_mean": 1184.4, "valid_targets_min": 495 }, { "epoch": 3.801358234295416, "grad_norm": 0.5049597929263119, "learning_rate": 2.050201540756868e-05, "loss": 0.1026, "loss_nan_ranks": 0, "loss_rank_avg": 0.031919289380311966, "step": 3360, "valid_targets_mean": 1703.6, "valid_targets_min": 655 }, { "epoch": 3.807017543859649, "grad_norm": 0.6514065995671096, "learning_rate": 2.0445619109013054e-05, "loss": 0.1105, "loss_nan_ranks": 0, "loss_rank_avg": 0.1003175750374794, "step": 3365, "valid_targets_mean": 2292.5, "valid_targets_min": 521 }, { "epoch": 3.8126768534238824, "grad_norm": 0.43132665183117197, "learning_rate": 2.038921926519134e-05, "loss": 0.0871, "loss_nan_ranks": 0, "loss_rank_avg": 0.052312783896923065, "step": 3370, "valid_targets_mean": 3474.4, "valid_targets_min": 1909 }, { "epoch": 3.8183361629881154, "grad_norm": 0.31564328422784954, "learning_rate": 2.033281632481063e-05, "loss": 0.0755, "loss_nan_ranks": 0, "loss_rank_avg": 0.03723391890525818, "step": 3375, "valid_targets_mean": 3427.6, "valid_targets_min": 841 }, { "epoch": 3.8239954725523484, "grad_norm": 0.39519327642614127, "learning_rate": 2.027641073660265e-05, "loss": 0.0889, "loss_nan_ranks": 0, "loss_rank_avg": 0.04752538353204727, "step": 3380, "valid_targets_mean": 3007.1, "valid_targets_min": 2144 }, { "epoch": 3.829654782116582, "grad_norm": 0.456054856186123, "learning_rate": 2.0220002949320187e-05, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.05250108242034912, "step": 3385, "valid_targets_mean": 3419.9, "valid_targets_min": 2215 }, { "epoch": 3.835314091680815, "grad_norm": 0.33797200336103456, "learning_rate": 2.0163593411733533e-05, "loss": 0.0715, "loss_nan_ranks": 0, "loss_rank_avg": 0.04054778814315796, "step": 3390, "valid_targets_mean": 3754.9, "valid_targets_min": 723 }, { "epoch": 3.8409734012450483, "grad_norm": 0.3296089900649167, "learning_rate": 2.0107182572626897e-05, "loss": 0.0893, "loss_nan_ranks": 0, "loss_rank_avg": 0.04143691062927246, "step": 3395, "valid_targets_mean": 4612.4, "valid_targets_min": 1253 }, { "epoch": 3.8466327108092813, "grad_norm": 0.315842382743557, "learning_rate": 2.0050770880794843e-05, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.04056167230010033, "step": 3400, "valid_targets_mean": 3894.0, "valid_targets_min": 995 }, { "epoch": 3.8522920203735147, "grad_norm": 0.29138446818333136, "learning_rate": 1.9994358785038736e-05, "loss": 0.0707, "loss_nan_ranks": 0, "loss_rank_avg": 0.04306381940841675, "step": 3405, "valid_targets_mean": 4775.1, "valid_targets_min": 3539 }, { "epoch": 3.8579513299377477, "grad_norm": 0.4118629229039932, "learning_rate": 1.9937946734163117e-05, "loss": 0.0945, "loss_nan_ranks": 0, "loss_rank_avg": 0.05121958628296852, "step": 3410, "valid_targets_mean": 4235.9, "valid_targets_min": 2839 }, { "epoch": 3.8636106395019807, "grad_norm": 0.32989201224002446, "learning_rate": 1.98815351769722e-05, "loss": 0.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.02642885595560074, "step": 3415, "valid_targets_mean": 2090.6, "valid_targets_min": 424 }, { "epoch": 3.869269949066214, "grad_norm": 0.4092120038133833, "learning_rate": 1.982512456226628e-05, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.05555412918329239, "step": 3420, "valid_targets_mean": 2603.4, "valid_targets_min": 541 }, { "epoch": 3.874929258630447, "grad_norm": 0.38568525926824204, "learning_rate": 1.976871533883812e-05, "loss": 0.1064, "loss_nan_ranks": 0, "loss_rank_avg": 0.03278844431042671, "step": 3425, "valid_targets_mean": 3360.5, "valid_targets_min": 1938 }, { "epoch": 3.88058856819468, "grad_norm": 0.44242322902590053, "learning_rate": 1.971230795546944e-05, "loss": 0.0865, "loss_nan_ranks": 0, "loss_rank_avg": 0.11511512100696564, "step": 3430, "valid_targets_mean": 2122.4, "valid_targets_min": 722 }, { "epoch": 3.8862478777589136, "grad_norm": 0.38417822688245, "learning_rate": 1.965590286092731e-05, "loss": 0.0925, "loss_nan_ranks": 0, "loss_rank_avg": 0.045143697410821915, "step": 3435, "valid_targets_mean": 3572.6, "valid_targets_min": 2919 }, { "epoch": 3.8919071873231466, "grad_norm": 0.42311205060593304, "learning_rate": 1.9599500503960596e-05, "loss": 0.0849, "loss_nan_ranks": 0, "loss_rank_avg": 0.03667496144771576, "step": 3440, "valid_targets_mean": 1793.4, "valid_targets_min": 559 }, { "epoch": 3.8975664968873796, "grad_norm": 0.49304330387414225, "learning_rate": 1.954310133329639e-05, "loss": 0.0919, "loss_nan_ranks": 0, "loss_rank_avg": 0.06212100386619568, "step": 3445, "valid_targets_mean": 2699.0, "valid_targets_min": 811 }, { "epoch": 3.903225806451613, "grad_norm": 0.6981683111926872, "learning_rate": 1.948670579763641e-05, "loss": 0.1126, "loss_nan_ranks": 0, "loss_rank_avg": 0.07180996239185333, "step": 3450, "valid_targets_mean": 1462.5, "valid_targets_min": 685 }, { "epoch": 3.908885116015846, "grad_norm": 0.3665019195997859, "learning_rate": 1.9430314345653486e-05, "loss": 0.1174, "loss_nan_ranks": 0, "loss_rank_avg": 0.028401896357536316, "step": 3455, "valid_targets_mean": 2990.6, "valid_targets_min": 593 }, { "epoch": 3.914544425580079, "grad_norm": 0.36683102464115874, "learning_rate": 1.9373927425987928e-05, "loss": 0.0964, "loss_nan_ranks": 0, "loss_rank_avg": 0.041700564324855804, "step": 3460, "valid_targets_mean": 3558.8, "valid_targets_min": 1041 }, { "epoch": 3.9202037351443124, "grad_norm": 0.4262467475407333, "learning_rate": 1.9317545487244016e-05, "loss": 0.0949, "loss_nan_ranks": 0, "loss_rank_avg": 0.05397236347198486, "step": 3465, "valid_targets_mean": 3713.2, "valid_targets_min": 2556 }, { "epoch": 3.9258630447085454, "grad_norm": 0.45865992664307026, "learning_rate": 1.926116897798639e-05, "loss": 0.0838, "loss_nan_ranks": 0, "loss_rank_avg": 0.05742509290575981, "step": 3470, "valid_targets_mean": 3734.9, "valid_targets_min": 3385 }, { "epoch": 3.931522354272779, "grad_norm": 0.3807270985107737, "learning_rate": 1.9204798346736485e-05, "loss": 0.083, "loss_nan_ranks": 0, "loss_rank_avg": 0.0385202094912529, "step": 3475, "valid_targets_mean": 3136.2, "valid_targets_min": 541 }, { "epoch": 3.937181663837012, "grad_norm": 0.697305609254891, "learning_rate": 1.914843404196899e-05, "loss": 0.083, "loss_nan_ranks": 0, "loss_rank_avg": 0.056570932269096375, "step": 3480, "valid_targets_mean": 1219.4, "valid_targets_min": 598 }, { "epoch": 3.9428409734012453, "grad_norm": 0.4381515795574387, "learning_rate": 1.9092076512108253e-05, "loss": 0.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.04982505738735199, "step": 3485, "valid_targets_mean": 3262.6, "valid_targets_min": 1069 }, { "epoch": 3.9485002829654783, "grad_norm": 0.5458296366412162, "learning_rate": 1.903572620552471e-05, "loss": 0.0802, "loss_nan_ranks": 0, "loss_rank_avg": 0.0361316055059433, "step": 3490, "valid_targets_mean": 1540.1, "valid_targets_min": 680 }, { "epoch": 3.9541595925297113, "grad_norm": 0.40347912681769865, "learning_rate": 1.8979383570531358e-05, "loss": 0.0804, "loss_nan_ranks": 0, "loss_rank_avg": 0.04016882926225662, "step": 3495, "valid_targets_mean": 2487.0, "valid_targets_min": 774 }, { "epoch": 3.9598189020939447, "grad_norm": 0.3597195559569826, "learning_rate": 1.8923049055380128e-05, "loss": 0.0945, "loss_nan_ranks": 0, "loss_rank_avg": 0.043545953929424286, "step": 3500, "valid_targets_mean": 4372.6, "valid_targets_min": 1474 }, { "epoch": 3.9654782116581777, "grad_norm": 0.25634379370918176, "learning_rate": 1.8866723108258376e-05, "loss": 0.0747, "loss_nan_ranks": 0, "loss_rank_avg": 0.03357706218957901, "step": 3505, "valid_targets_mean": 5496.2, "valid_targets_min": 4657 }, { "epoch": 3.9711375212224107, "grad_norm": 0.3334762985004109, "learning_rate": 1.8810406177285282e-05, "loss": 0.081, "loss_nan_ranks": 0, "loss_rank_avg": 0.042172081768512726, "step": 3510, "valid_targets_mean": 3943.8, "valid_targets_min": 675 }, { "epoch": 3.976796830786644, "grad_norm": 0.35172500208172275, "learning_rate": 1.8754098710508294e-05, "loss": 0.0846, "loss_nan_ranks": 0, "loss_rank_avg": 0.046609655022621155, "step": 3515, "valid_targets_mean": 3760.4, "valid_targets_min": 2463 }, { "epoch": 3.982456140350877, "grad_norm": 0.8796896661404067, "learning_rate": 1.869780115589957e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.03977133333683014, "step": 3520, "valid_targets_mean": 2844.4, "valid_targets_min": 605 }, { "epoch": 3.98811544991511, "grad_norm": 0.35543893040609253, "learning_rate": 1.8641513961352396e-05, "loss": 0.079, "loss_nan_ranks": 0, "loss_rank_avg": 0.037588320672512054, "step": 3525, "valid_targets_mean": 3247.4, "valid_targets_min": 1014 }, { "epoch": 3.9937747594793436, "grad_norm": 0.3704753246940243, "learning_rate": 1.858523757467765e-05, "loss": 0.0912, "loss_nan_ranks": 0, "loss_rank_avg": 0.042072445154190063, "step": 3530, "valid_targets_mean": 3545.2, "valid_targets_min": 2807 }, { "epoch": 3.9994340690435766, "grad_norm": 0.5344737197927087, "learning_rate": 1.8528972443600226e-05, "loss": 0.1144, "loss_nan_ranks": 0, "loss_rank_avg": 0.11486827582120895, "step": 3535, "valid_targets_mean": 2912.9, "valid_targets_min": 1214 }, { "epoch": 4.005659309564233, "grad_norm": 0.5008124596440419, "learning_rate": 1.8472719015755452e-05, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.09267597645521164, "step": 3540, "valid_targets_mean": 7214.4, "valid_targets_min": 4847 }, { "epoch": 4.011318619128466, "grad_norm": 0.3939702908833795, "learning_rate": 1.8416477738685567e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.0846470445394516, "step": 3545, "valid_targets_mean": 6417.1, "valid_targets_min": 4480 }, { "epoch": 4.016977928692699, "grad_norm": 0.3835188973433748, "learning_rate": 1.8360249059836123e-05, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.08836297690868378, "step": 3550, "valid_targets_mean": 7605.4, "valid_targets_min": 5236 }, { "epoch": 4.022637238256933, "grad_norm": 0.40270414663569104, "learning_rate": 1.830403342655246e-05, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.07130195200443268, "step": 3555, "valid_targets_mean": 5827.9, "valid_targets_min": 4727 }, { "epoch": 4.028296547821165, "grad_norm": 0.4331187042742476, "learning_rate": 1.824783128607612e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.0947471559047699, "step": 3560, "valid_targets_mean": 6448.2, "valid_targets_min": 4211 }, { "epoch": 4.033955857385399, "grad_norm": 0.4728306033797111, "learning_rate": 1.8191643085541296e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.09749437868595123, "step": 3565, "valid_targets_mean": 6108.1, "valid_targets_min": 4279 }, { "epoch": 4.039615166949632, "grad_norm": 0.3742686771616783, "learning_rate": 1.813546927197129e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.07242477685213089, "step": 3570, "valid_targets_mean": 5962.4, "valid_targets_min": 4589 }, { "epoch": 4.045274476513866, "grad_norm": 0.47923860816844743, "learning_rate": 1.8079310292274928e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.08282826095819473, "step": 3575, "valid_targets_mean": 3503.2, "valid_targets_min": 2015 }, { "epoch": 4.050933786078098, "grad_norm": 0.35980349731828126, "learning_rate": 1.8023166593243026e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.06773898005485535, "step": 3580, "valid_targets_mean": 6102.5, "valid_targets_min": 4778 }, { "epoch": 4.056593095642332, "grad_norm": 0.3825978995401686, "learning_rate": 1.7967038621544845e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.07666116952896118, "step": 3585, "valid_targets_mean": 5868.2, "valid_targets_min": 4612 }, { "epoch": 4.062252405206565, "grad_norm": 0.40696919494833955, "learning_rate": 1.791092682372449e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.08827384561300278, "step": 3590, "valid_targets_mean": 6105.8, "valid_targets_min": 4491 }, { "epoch": 4.067911714770798, "grad_norm": 0.39421380445121584, "learning_rate": 1.7854831646197426e-05, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.08447161316871643, "step": 3595, "valid_targets_mean": 6962.0, "valid_targets_min": 4754 }, { "epoch": 4.073571024335031, "grad_norm": 0.37473359119575794, "learning_rate": 1.7798753535246856e-05, "loss": 0.1551, "loss_nan_ranks": 0, "loss_rank_avg": 0.07447396218776703, "step": 3600, "valid_targets_mean": 6035.1, "valid_targets_min": 4787 }, { "epoch": 4.079230333899265, "grad_norm": 0.4227213769477523, "learning_rate": 1.7742692937020234e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.07278391718864441, "step": 3605, "valid_targets_mean": 6028.5, "valid_targets_min": 5213 }, { "epoch": 4.084889643463497, "grad_norm": 0.38524214879156815, "learning_rate": 1.768665029752567e-05, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.06999488174915314, "step": 3610, "valid_targets_mean": 6814.1, "valid_targets_min": 4664 }, { "epoch": 4.090548953027731, "grad_norm": 0.3972869029235263, "learning_rate": 1.763062606262839e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.07294754683971405, "step": 3615, "valid_targets_mean": 6281.5, "valid_targets_min": 4996 }, { "epoch": 4.096208262591964, "grad_norm": 0.3931822579344668, "learning_rate": 1.7574620678047215e-05, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.07363331317901611, "step": 3620, "valid_targets_mean": 6628.9, "valid_targets_min": 4582 }, { "epoch": 4.101867572156197, "grad_norm": 0.3601228835997598, "learning_rate": 1.751863458935099e-05, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.06443273276090622, "step": 3625, "valid_targets_mean": 6536.6, "valid_targets_min": 5205 }, { "epoch": 4.10752688172043, "grad_norm": 0.37681366926978777, "learning_rate": 1.746266824195504e-05, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.07399990409612656, "step": 3630, "valid_targets_mean": 7031.0, "valid_targets_min": 5098 }, { "epoch": 4.1131861912846635, "grad_norm": 0.4129281253908889, "learning_rate": 1.7406722081117632e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.09378090500831604, "step": 3635, "valid_targets_mean": 6514.2, "valid_targets_min": 5016 }, { "epoch": 4.118845500848896, "grad_norm": 0.40046677747273324, "learning_rate": 1.7350796551936432e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.11042913794517517, "step": 3640, "valid_targets_mean": 6330.0, "valid_targets_min": 965 }, { "epoch": 4.124504810413129, "grad_norm": 0.38272577252010453, "learning_rate": 1.7294892099344975e-05, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.07567565888166428, "step": 3645, "valid_targets_mean": 6293.1, "valid_targets_min": 5218 }, { "epoch": 4.130164119977363, "grad_norm": 0.4075941121248639, "learning_rate": 1.7239009168109108e-05, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.07180091738700867, "step": 3650, "valid_targets_mean": 6957.4, "valid_targets_min": 4213 }, { "epoch": 4.135823429541596, "grad_norm": 0.4459180719896231, "learning_rate": 1.7183148202823445e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.09024065732955933, "step": 3655, "valid_targets_mean": 5888.5, "valid_targets_min": 4923 }, { "epoch": 4.141482739105829, "grad_norm": 0.417345833444335, "learning_rate": 1.7127309647907867e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.11535342037677765, "step": 3660, "valid_targets_mean": 7822.9, "valid_targets_min": 4993 }, { "epoch": 4.147142048670062, "grad_norm": 0.4092836996069491, "learning_rate": 1.7071493947603942e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.08515796065330505, "step": 3665, "valid_targets_mean": 6098.6, "valid_targets_min": 4872 }, { "epoch": 4.152801358234296, "grad_norm": 0.3829832784465982, "learning_rate": 1.7015701545971417e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.08360423147678375, "step": 3670, "valid_targets_mean": 6892.2, "valid_targets_min": 4706 }, { "epoch": 4.158460667798528, "grad_norm": 0.45523292925046316, "learning_rate": 1.695993288688469e-05, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.07692007720470428, "step": 3675, "valid_targets_mean": 6352.0, "valid_targets_min": 4889 }, { "epoch": 4.164119977362762, "grad_norm": 0.4255022530499619, "learning_rate": 1.6904188414029248e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.07571934908628464, "step": 3680, "valid_targets_mean": 5948.9, "valid_targets_min": 3888 }, { "epoch": 4.169779286926995, "grad_norm": 0.4095787920769221, "learning_rate": 1.6848468570898172e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.07443135976791382, "step": 3685, "valid_targets_mean": 5846.2, "valid_targets_min": 4051 }, { "epoch": 4.175438596491228, "grad_norm": 0.3788095484158347, "learning_rate": 1.6792773800788583e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.08252878487110138, "step": 3690, "valid_targets_mean": 7319.2, "valid_targets_min": 5230 }, { "epoch": 4.181097906055461, "grad_norm": 0.38497942903312243, "learning_rate": 1.673710454679813e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.08583734184503555, "step": 3695, "valid_targets_mean": 8235.1, "valid_targets_min": 4997 }, { "epoch": 4.186757215619695, "grad_norm": 0.4446341909959979, "learning_rate": 1.668146125182147e-05, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.08628219366073608, "step": 3700, "valid_targets_mean": 6402.5, "valid_targets_min": 5364 }, { "epoch": 4.192416525183927, "grad_norm": 0.40330962971590845, "learning_rate": 1.6625844358546715e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.09064686298370361, "step": 3705, "valid_targets_mean": 7117.4, "valid_targets_min": 3391 }, { "epoch": 4.198075834748161, "grad_norm": 0.36576009736166315, "learning_rate": 1.657025430945195e-05, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.07560627907514572, "step": 3710, "valid_targets_mean": 7542.8, "valid_targets_min": 4829 }, { "epoch": 4.203735144312394, "grad_norm": 0.5393492990188449, "learning_rate": 1.651469154680167e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.0772615298628807, "step": 3715, "valid_targets_mean": 6284.4, "valid_targets_min": 5180 }, { "epoch": 4.2093944538766275, "grad_norm": 0.4471781144605719, "learning_rate": 1.6459156512643303e-05, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.08217886090278625, "step": 3720, "valid_targets_mean": 5806.2, "valid_targets_min": 5101 }, { "epoch": 4.21505376344086, "grad_norm": 0.4336240077848953, "learning_rate": 1.640364964880367e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.07309036701917648, "step": 3725, "valid_targets_mean": 6697.9, "valid_targets_min": 4527 }, { "epoch": 4.2207130730050935, "grad_norm": 0.40323628644582493, "learning_rate": 1.6348171396885468e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.08748327940702438, "step": 3730, "valid_targets_mean": 6410.4, "valid_targets_min": 3082 }, { "epoch": 4.226372382569327, "grad_norm": 0.4095929036243839, "learning_rate": 1.6292722198263766e-05, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.07573725283145905, "step": 3735, "valid_targets_mean": 6847.1, "valid_targets_min": 4685 }, { "epoch": 4.2320316921335595, "grad_norm": 0.43963984326487965, "learning_rate": 1.623730249408249e-05, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.08435098826885223, "step": 3740, "valid_targets_mean": 6194.0, "valid_targets_min": 4644 }, { "epoch": 4.237691001697793, "grad_norm": 0.3929935896020955, "learning_rate": 1.618191272525092e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.06960330903530121, "step": 3745, "valid_targets_mean": 6283.8, "valid_targets_min": 4433 }, { "epoch": 4.243350311262026, "grad_norm": 0.5154631432189906, "learning_rate": 1.612655333244016e-05, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.07508840411901474, "step": 3750, "valid_targets_mean": 5917.2, "valid_targets_min": 4857 }, { "epoch": 4.249009620826259, "grad_norm": 0.4376479061623972, "learning_rate": 1.6071224756079666e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.0977800190448761, "step": 3755, "valid_targets_mean": 6986.4, "valid_targets_min": 5101 }, { "epoch": 4.254668930390492, "grad_norm": 0.445663905724086, "learning_rate": 1.6015927436353713e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.06677838414907455, "step": 3760, "valid_targets_mean": 5299.5, "valid_targets_min": 4442 }, { "epoch": 4.260328239954726, "grad_norm": 0.37709369412424565, "learning_rate": 1.59606618131979e-05, "loss": 0.1346, "loss_nan_ranks": 0, "loss_rank_avg": 0.05814947187900543, "step": 3765, "valid_targets_mean": 6133.9, "valid_targets_min": 5130 }, { "epoch": 4.265987549518958, "grad_norm": 0.42340455157424106, "learning_rate": 1.5905428326295663e-05, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.08240945637226105, "step": 3770, "valid_targets_mean": 6477.4, "valid_targets_min": 4162 }, { "epoch": 4.271646859083192, "grad_norm": 0.3764871118641996, "learning_rate": 1.585022741507477e-05, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.06925308704376221, "step": 3775, "valid_targets_mean": 6350.4, "valid_targets_min": 3940 }, { "epoch": 4.277306168647425, "grad_norm": 0.4362310563771639, "learning_rate": 1.579505951870381e-05, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.08733298629522324, "step": 3780, "valid_targets_mean": 6625.1, "valid_targets_min": 4642 }, { "epoch": 4.282965478211658, "grad_norm": 0.4268228683981418, "learning_rate": 1.573992507608872e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.08933217823505402, "step": 3785, "valid_targets_mean": 4907.0, "valid_targets_min": 4431 }, { "epoch": 4.288624787775891, "grad_norm": 0.42302991710871685, "learning_rate": 1.568482452586929e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.08254139870405197, "step": 3790, "valid_targets_mean": 6465.0, "valid_targets_min": 5333 }, { "epoch": 4.294284097340125, "grad_norm": 0.4151763737853865, "learning_rate": 1.5629758306415652e-05, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.0802953690290451, "step": 3795, "valid_targets_mean": 5650.5, "valid_targets_min": 4769 }, { "epoch": 4.299943406904358, "grad_norm": 0.4311186422126902, "learning_rate": 1.5574726855824827e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.07794877886772156, "step": 3800, "valid_targets_mean": 5540.0, "valid_targets_min": 4281 }, { "epoch": 4.305602716468591, "grad_norm": 0.4543300622427506, "learning_rate": 1.5519730611917206e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.11111429333686829, "step": 3805, "valid_targets_mean": 6499.0, "valid_targets_min": 4844 }, { "epoch": 4.311262026032824, "grad_norm": 0.39997302398510315, "learning_rate": 1.546477001223309e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.07029193639755249, "step": 3810, "valid_targets_mean": 5736.5, "valid_targets_min": 5227 }, { "epoch": 4.3169213355970575, "grad_norm": 0.3686385730004549, "learning_rate": 1.5409845494029208e-05, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.06129857152700424, "step": 3815, "valid_targets_mean": 5857.2, "valid_targets_min": 2461 }, { "epoch": 4.32258064516129, "grad_norm": 0.4060862356848946, "learning_rate": 1.5354957494275207e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.07067536562681198, "step": 3820, "valid_targets_mean": 5793.4, "valid_targets_min": 2815 }, { "epoch": 4.3282399547255235, "grad_norm": 0.4038576482109372, "learning_rate": 1.5300106449650234e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.06821887195110321, "step": 3825, "valid_targets_mean": 6588.8, "valid_targets_min": 4875 }, { "epoch": 4.333899264289757, "grad_norm": 0.41338552584688865, "learning_rate": 1.524529279653939e-05, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.07139618694782257, "step": 3830, "valid_targets_mean": 5984.8, "valid_targets_min": 4901 }, { "epoch": 4.3395585738539895, "grad_norm": 0.3626865453067956, "learning_rate": 1.5190516971030324e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.06856446713209152, "step": 3835, "valid_targets_mean": 6067.4, "valid_targets_min": 3786 }, { "epoch": 4.345217883418223, "grad_norm": 0.40474411941293037, "learning_rate": 1.5135779408909732e-05, "loss": 0.2007, "loss_nan_ranks": 0, "loss_rank_avg": 0.07661972939968109, "step": 3840, "valid_targets_mean": 5852.5, "valid_targets_min": 5057 }, { "epoch": 4.350877192982456, "grad_norm": 0.4529750374758651, "learning_rate": 1.5081080545659874e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.0812104269862175, "step": 3845, "valid_targets_mean": 6362.2, "valid_targets_min": 3952 }, { "epoch": 4.356536502546689, "grad_norm": 0.47063382640866086, "learning_rate": 1.5026420816455156e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.07746419310569763, "step": 3850, "valid_targets_mean": 5360.2, "valid_targets_min": 4267 }, { "epoch": 4.362195812110922, "grad_norm": 0.42248565285269357, "learning_rate": 1.4971800656158624e-05, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.09461343288421631, "step": 3855, "valid_targets_mean": 6842.1, "valid_targets_min": 4785 }, { "epoch": 4.367855121675156, "grad_norm": 0.38764246155158855, "learning_rate": 1.4917220499318506e-05, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.06870239973068237, "step": 3860, "valid_targets_mean": 6188.5, "valid_targets_min": 5438 }, { "epoch": 4.373514431239389, "grad_norm": 0.43502410000194525, "learning_rate": 1.4862680780164805e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.08560039103031158, "step": 3865, "valid_targets_mean": 5848.6, "valid_targets_min": 4734 }, { "epoch": 4.379173740803622, "grad_norm": 0.35644987083560775, "learning_rate": 1.4808181932605787e-05, "loss": 0.1392, "loss_nan_ranks": 0, "loss_rank_avg": 0.06139899417757988, "step": 3870, "valid_targets_mean": 6278.2, "valid_targets_min": 5636 }, { "epoch": 4.384833050367855, "grad_norm": 0.3918664932129097, "learning_rate": 1.4753724390224551e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.0662948489189148, "step": 3875, "valid_targets_mean": 6168.9, "valid_targets_min": 4206 }, { "epoch": 4.390492359932089, "grad_norm": 0.40240258367128745, "learning_rate": 1.4699308586275591e-05, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.06691467016935349, "step": 3880, "valid_targets_mean": 6226.5, "valid_targets_min": 4535 }, { "epoch": 4.396151669496321, "grad_norm": 0.35360407851709585, "learning_rate": 1.464493495368132e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.07321492582559586, "step": 3885, "valid_targets_mean": 7821.6, "valid_targets_min": 5471 }, { "epoch": 4.401810979060555, "grad_norm": 0.4168799254478002, "learning_rate": 1.459060392502866e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.06479287147521973, "step": 3890, "valid_targets_mean": 6843.0, "valid_targets_min": 5243 }, { "epoch": 4.407470288624788, "grad_norm": 0.45280990702426094, "learning_rate": 1.4536315932565575e-05, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.08667883276939392, "step": 3895, "valid_targets_mean": 6658.6, "valid_targets_min": 4906 }, { "epoch": 4.413129598189021, "grad_norm": 0.5170654478744513, "learning_rate": 1.448207140819764e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.07833343744277954, "step": 3900, "valid_targets_mean": 6799.5, "valid_targets_min": 5168 }, { "epoch": 4.418788907753254, "grad_norm": 0.4585375937990011, "learning_rate": 1.4427870783484613e-05, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.08121506869792938, "step": 3905, "valid_targets_mean": 5376.2, "valid_targets_min": 3130 }, { "epoch": 4.4244482173174875, "grad_norm": 0.443331932431525, "learning_rate": 1.4373714489636985e-05, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.04741574078798294, "step": 3910, "valid_targets_mean": 2843.1, "valid_targets_min": 1990 }, { "epoch": 4.43010752688172, "grad_norm": 0.48401226868031233, "learning_rate": 1.4319602957512564e-05, "loss": 0.106, "loss_nan_ranks": 0, "loss_rank_avg": 0.04668089747428894, "step": 3915, "valid_targets_mean": 2532.2, "valid_targets_min": 324 }, { "epoch": 4.4357668364459535, "grad_norm": 0.3954237444400868, "learning_rate": 1.4265536617613043e-05, "loss": 0.0807, "loss_nan_ranks": 0, "loss_rank_avg": 0.04219325631856918, "step": 3920, "valid_targets_mean": 2359.2, "valid_targets_min": 982 }, { "epoch": 4.441426146010187, "grad_norm": 0.5155838952571494, "learning_rate": 1.4211515900080568e-05, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.04493227228522301, "step": 3925, "valid_targets_mean": 3640.0, "valid_targets_min": 2479 }, { "epoch": 4.44708545557442, "grad_norm": 0.3246724348372543, "learning_rate": 1.4157541234694324e-05, "loss": 0.0906, "loss_nan_ranks": 0, "loss_rank_avg": 0.028960149735212326, "step": 3930, "valid_targets_mean": 3079.5, "valid_targets_min": 811 }, { "epoch": 4.452744765138653, "grad_norm": 0.4095150256981928, "learning_rate": 1.4103613050867117e-05, "loss": 0.0837, "loss_nan_ranks": 0, "loss_rank_avg": 0.047411803156137466, "step": 3935, "valid_targets_mean": 3113.4, "valid_targets_min": 1431 }, { "epoch": 4.458404074702886, "grad_norm": 0.6391321063571365, "learning_rate": 1.4049731777641948e-05, "loss": 0.1193, "loss_nan_ranks": 0, "loss_rank_avg": 0.086330845952034, "step": 3940, "valid_targets_mean": 1990.9, "valid_targets_min": 702 }, { "epoch": 4.46406338426712, "grad_norm": 0.38922644742240664, "learning_rate": 1.3995897843688615e-05, "loss": 0.1011, "loss_nan_ranks": 0, "loss_rank_avg": 0.047160811722278595, "step": 3945, "valid_targets_mean": 3221.6, "valid_targets_min": 621 }, { "epoch": 4.469722693831352, "grad_norm": 0.6462094372397308, "learning_rate": 1.3942111677300276e-05, "loss": 0.0907, "loss_nan_ranks": 0, "loss_rank_avg": 0.05346031114459038, "step": 3950, "valid_targets_mean": 2591.4, "valid_targets_min": 846 }, { "epoch": 4.475382003395586, "grad_norm": 0.4061055434466861, "learning_rate": 1.388837370639008e-05, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.06589578837156296, "step": 3955, "valid_targets_mean": 3738.9, "valid_targets_min": 1369 }, { "epoch": 4.481041312959819, "grad_norm": 0.3849733546616827, "learning_rate": 1.3834684358487731e-05, "loss": 0.0646, "loss_nan_ranks": 0, "loss_rank_avg": 0.039215341210365295, "step": 3960, "valid_targets_mean": 2715.4, "valid_targets_min": 754 }, { "epoch": 4.486700622524052, "grad_norm": 0.4253804496012952, "learning_rate": 1.3781044060736089e-05, "loss": 0.0812, "loss_nan_ranks": 0, "loss_rank_avg": 0.04853950813412666, "step": 3965, "valid_targets_mean": 2725.9, "valid_targets_min": 776 }, { "epoch": 4.492359932088285, "grad_norm": 0.3578152154235922, "learning_rate": 1.3727453239887796e-05, "loss": 0.0802, "loss_nan_ranks": 0, "loss_rank_avg": 0.052317701280117035, "step": 3970, "valid_targets_mean": 3194.4, "valid_targets_min": 754 }, { "epoch": 4.498019241652519, "grad_norm": 0.6391115960853455, "learning_rate": 1.367391232230185e-05, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.17157770693302155, "step": 3975, "valid_targets_mean": 2053.8, "valid_targets_min": 664 }, { "epoch": 4.503678551216751, "grad_norm": 0.40231212097613134, "learning_rate": 1.3620421733940234e-05, "loss": 0.0756, "loss_nan_ranks": 0, "loss_rank_avg": 0.04370037838816643, "step": 3980, "valid_targets_mean": 3771.4, "valid_targets_min": 2542 }, { "epoch": 4.509337860780985, "grad_norm": 0.4723821784200535, "learning_rate": 1.356698190036453e-05, "loss": 0.0813, "loss_nan_ranks": 0, "loss_rank_avg": 0.051801249384880066, "step": 3985, "valid_targets_mean": 3486.2, "valid_targets_min": 2988 }, { "epoch": 4.514997170345218, "grad_norm": 0.4080233853264302, "learning_rate": 1.3513593246732506e-05, "loss": 0.0751, "loss_nan_ranks": 0, "loss_rank_avg": 0.046337466686964035, "step": 3990, "valid_targets_mean": 3779.4, "valid_targets_min": 3281 }, { "epoch": 4.5206564799094515, "grad_norm": 0.44644169226312036, "learning_rate": 1.3460256197794768e-05, "loss": 0.0822, "loss_nan_ranks": 0, "loss_rank_avg": 0.04264343902468681, "step": 3995, "valid_targets_mean": 3471.1, "valid_targets_min": 2189 }, { "epoch": 4.526315789473684, "grad_norm": 0.4063499834323027, "learning_rate": 1.3406971177891343e-05, "loss": 0.0849, "loss_nan_ranks": 0, "loss_rank_avg": 0.03730551153421402, "step": 4000, "valid_targets_mean": 3483.6, "valid_targets_min": 1788 }, { "epoch": 4.5319750990379175, "grad_norm": 0.5680761401310686, "learning_rate": 1.3353738610948347e-05, "loss": 0.0964, "loss_nan_ranks": 0, "loss_rank_avg": 0.05603942275047302, "step": 4005, "valid_targets_mean": 2562.1, "valid_targets_min": 597 }, { "epoch": 4.53763440860215, "grad_norm": 0.4615652741114608, "learning_rate": 1.3300558920474586e-05, "loss": 0.0904, "loss_nan_ranks": 0, "loss_rank_avg": 0.04337063431739807, "step": 4010, "valid_targets_mean": 2272.8, "valid_targets_min": 701 }, { "epoch": 4.5432937181663835, "grad_norm": 0.475199804932793, "learning_rate": 1.3247432529558175e-05, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.07559002190828323, "step": 4015, "valid_targets_mean": 2971.0, "valid_targets_min": 1652 }, { "epoch": 4.548953027730617, "grad_norm": 0.3985376653121622, "learning_rate": 1.3194359860863201e-05, "loss": 0.0938, "loss_nan_ranks": 0, "loss_rank_avg": 0.03962837532162666, "step": 4020, "valid_targets_mean": 3747.4, "valid_targets_min": 1908 }, { "epoch": 4.55461233729485, "grad_norm": 0.4095101597017151, "learning_rate": 1.3141341336626336e-05, "loss": 0.0767, "loss_nan_ranks": 0, "loss_rank_avg": 0.03326389938592911, "step": 4025, "valid_targets_mean": 3247.8, "valid_targets_min": 971 }, { "epoch": 4.560271646859083, "grad_norm": 0.44270290029488385, "learning_rate": 1.3088377378653503e-05, "loss": 0.1158, "loss_nan_ranks": 0, "loss_rank_avg": 0.04294685274362564, "step": 4030, "valid_targets_mean": 3422.2, "valid_targets_min": 2552 }, { "epoch": 4.565930956423316, "grad_norm": 0.39806191121450035, "learning_rate": 1.3035468408316501e-05, "loss": 0.0944, "loss_nan_ranks": 0, "loss_rank_avg": 0.03280611336231232, "step": 4035, "valid_targets_mean": 2948.9, "valid_targets_min": 753 }, { "epoch": 4.57159026598755, "grad_norm": 0.5454580231471242, "learning_rate": 1.2982614846549639e-05, "loss": 0.0899, "loss_nan_ranks": 0, "loss_rank_avg": 0.036681562662124634, "step": 4040, "valid_targets_mean": 1090.5, "valid_targets_min": 568 }, { "epoch": 4.577249575551782, "grad_norm": 0.5272571498175689, "learning_rate": 1.2929817113846428e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.11161740869283676, "step": 4045, "valid_targets_mean": 2921.1, "valid_targets_min": 1070 }, { "epoch": 4.582908885116016, "grad_norm": 0.5114999200280982, "learning_rate": 1.287707563025621e-05, "loss": 0.0928, "loss_nan_ranks": 0, "loss_rank_avg": 0.04125947877764702, "step": 4050, "valid_targets_mean": 2052.1, "valid_targets_min": 329 }, { "epoch": 4.588568194680249, "grad_norm": 0.6794177641022152, "learning_rate": 1.2824390815380805e-05, "loss": 0.0947, "loss_nan_ranks": 0, "loss_rank_avg": 0.05280480161309242, "step": 4055, "valid_targets_mean": 998.2, "valid_targets_min": 608 }, { "epoch": 4.594227504244482, "grad_norm": 0.43483819154934944, "learning_rate": 1.2771763088371202e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.050098396837711334, "step": 4060, "valid_targets_mean": 4405.9, "valid_targets_min": 2772 }, { "epoch": 4.599886813808715, "grad_norm": 0.3413473904426111, "learning_rate": 1.2719192867924197e-05, "loss": 0.077, "loss_nan_ranks": 0, "loss_rank_avg": 0.021962987259030342, "step": 4065, "valid_targets_mean": 5138.2, "valid_targets_min": 3778 }, { "epoch": 4.605546123372949, "grad_norm": 0.37623027963803085, "learning_rate": 1.2666680572279083e-05, "loss": 0.0903, "loss_nan_ranks": 0, "loss_rank_avg": 0.04053713008761406, "step": 4070, "valid_targets_mean": 4641.0, "valid_targets_min": 2336 }, { "epoch": 4.611205432937181, "grad_norm": 0.4165917942784783, "learning_rate": 1.2614226619214317e-05, "loss": 0.0874, "loss_nan_ranks": 0, "loss_rank_avg": 0.05364896357059479, "step": 4075, "valid_targets_mean": 3962.1, "valid_targets_min": 2161 }, { "epoch": 4.616864742501415, "grad_norm": 0.4068046168922619, "learning_rate": 1.2561831426044173e-05, "loss": 0.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.04479540139436722, "step": 4080, "valid_targets_mean": 3271.8, "valid_targets_min": 798 }, { "epoch": 4.622524052065648, "grad_norm": 0.48384948537626565, "learning_rate": 1.250949540961547e-05, "loss": 0.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.03350779414176941, "step": 4085, "valid_targets_mean": 1915.8, "valid_targets_min": 533 }, { "epoch": 4.6281833616298815, "grad_norm": 0.46288391779242044, "learning_rate": 1.2457218986304196e-05, "loss": 0.077, "loss_nan_ranks": 0, "loss_rank_avg": 0.038839347660541534, "step": 4090, "valid_targets_mean": 2589.2, "valid_targets_min": 833 }, { "epoch": 4.633842671194114, "grad_norm": 0.35155068112360527, "learning_rate": 1.2405002572012252e-05, "loss": 0.0741, "loss_nan_ranks": 0, "loss_rank_avg": 0.036818526685237885, "step": 4095, "valid_targets_mean": 3888.0, "valid_targets_min": 3391 }, { "epoch": 4.6395019807583475, "grad_norm": 0.5592411123462357, "learning_rate": 1.2352846582164117e-05, "loss": 0.0832, "loss_nan_ranks": 0, "loss_rank_avg": 0.06276963651180267, "step": 4100, "valid_targets_mean": 1517.1, "valid_targets_min": 732 }, { "epoch": 4.645161290322581, "grad_norm": 0.6587717790794467, "learning_rate": 1.2300751431703523e-05, "loss": 0.1068, "loss_nan_ranks": 0, "loss_rank_avg": 0.05123891681432724, "step": 4105, "valid_targets_mean": 1623.9, "valid_targets_min": 538 }, { "epoch": 4.6508205998868135, "grad_norm": 0.5410366205486246, "learning_rate": 1.2248717535090196e-05, "loss": 0.065, "loss_nan_ranks": 0, "loss_rank_avg": 0.04050035774707794, "step": 4110, "valid_targets_mean": 1158.1, "valid_targets_min": 720 }, { "epoch": 4.656479909451047, "grad_norm": 0.46500986147482537, "learning_rate": 1.2196745306296522e-05, "loss": 0.0731, "loss_nan_ranks": 0, "loss_rank_avg": 0.0410282164812088, "step": 4115, "valid_targets_mean": 2982.2, "valid_targets_min": 2328 }, { "epoch": 4.66213921901528, "grad_norm": 0.46392092870275686, "learning_rate": 1.2144835158804282e-05, "loss": 0.0685, "loss_nan_ranks": 0, "loss_rank_avg": 0.03278231620788574, "step": 4120, "valid_targets_mean": 2637.0, "valid_targets_min": 684 }, { "epoch": 4.667798528579513, "grad_norm": 0.41902047710660106, "learning_rate": 1.2092987505601346e-05, "loss": 0.1186, "loss_nan_ranks": 0, "loss_rank_avg": 0.043621864169836044, "step": 4125, "valid_targets_mean": 3441.4, "valid_targets_min": 2795 }, { "epoch": 4.673457838143746, "grad_norm": 0.4456436609381996, "learning_rate": 1.2041202759178381e-05, "loss": 0.0871, "loss_nan_ranks": 0, "loss_rank_avg": 0.0421648807823658, "step": 4130, "valid_targets_mean": 3286.4, "valid_targets_min": 744 }, { "epoch": 4.67911714770798, "grad_norm": 0.3824039606101949, "learning_rate": 1.198948133152559e-05, "loss": 0.094, "loss_nan_ranks": 0, "loss_rank_avg": 0.03015786036849022, "step": 4135, "valid_targets_mean": 3976.5, "valid_targets_min": 3279 }, { "epoch": 4.684776457272212, "grad_norm": 0.6000628647624624, "learning_rate": 1.1937823634129416e-05, "loss": 0.0867, "loss_nan_ranks": 0, "loss_rank_avg": 0.0420723631978035, "step": 4140, "valid_targets_mean": 1140.4, "valid_targets_min": 536 }, { "epoch": 4.690435766836446, "grad_norm": 0.5812001606124553, "learning_rate": 1.1886230077969278e-05, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.04249496012926102, "step": 4145, "valid_targets_mean": 2468.8, "valid_targets_min": 853 }, { "epoch": 4.696095076400679, "grad_norm": 0.46335769498418267, "learning_rate": 1.1834701073514306e-05, "loss": 0.0843, "loss_nan_ranks": 0, "loss_rank_avg": 0.0430687814950943, "step": 4150, "valid_targets_mean": 3205.8, "valid_targets_min": 2621 }, { "epoch": 4.701754385964913, "grad_norm": 0.6333180992883152, "learning_rate": 1.1783237030720049e-05, "loss": 0.1106, "loss_nan_ranks": 0, "loss_rank_avg": 0.04079118371009827, "step": 4155, "valid_targets_mean": 1332.4, "valid_targets_min": 728 }, { "epoch": 4.707413695529145, "grad_norm": 0.5690407519442315, "learning_rate": 1.1731838359025261e-05, "loss": 0.0772, "loss_nan_ranks": 0, "loss_rank_avg": 0.04055098071694374, "step": 4160, "valid_targets_mean": 1538.9, "valid_targets_min": 618 }, { "epoch": 4.713073005093379, "grad_norm": 0.35164824124775307, "learning_rate": 1.1680505467348584e-05, "loss": 0.0827, "loss_nan_ranks": 0, "loss_rank_avg": 0.045088913291692734, "step": 4165, "valid_targets_mean": 4142.9, "valid_targets_min": 907 }, { "epoch": 4.718732314657612, "grad_norm": 0.6006000307194947, "learning_rate": 1.162923876408535e-05, "loss": 0.0884, "loss_nan_ranks": 0, "loss_rank_avg": 0.059268467128276825, "step": 4170, "valid_targets_mean": 3060.4, "valid_targets_min": 577 }, { "epoch": 4.724391624221845, "grad_norm": 0.3963810037110701, "learning_rate": 1.1578038657104295e-05, "loss": 0.0701, "loss_nan_ranks": 0, "loss_rank_avg": 0.032515622675418854, "step": 4175, "valid_targets_mean": 3732.2, "valid_targets_min": 726 }, { "epoch": 4.730050933786078, "grad_norm": 0.4059488375077736, "learning_rate": 1.1526905553744337e-05, "loss": 0.0672, "loss_nan_ranks": 0, "loss_rank_avg": 0.03996988385915756, "step": 4180, "valid_targets_mean": 4288.9, "valid_targets_min": 2252 }, { "epoch": 4.7357102433503115, "grad_norm": 0.4600670199394049, "learning_rate": 1.1475839860811301e-05, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.04087667912244797, "step": 4185, "valid_targets_mean": 2427.5, "valid_targets_min": 531 }, { "epoch": 4.741369552914544, "grad_norm": 0.46001203112270483, "learning_rate": 1.142484198457475e-05, "loss": 0.0955, "loss_nan_ranks": 0, "loss_rank_avg": 0.03880181163549423, "step": 4190, "valid_targets_mean": 2126.6, "valid_targets_min": 744 }, { "epoch": 4.7470288624787775, "grad_norm": 0.4411981906244772, "learning_rate": 1.1373912330764671e-05, "loss": 0.0894, "loss_nan_ranks": 0, "loss_rank_avg": 0.03835024684667587, "step": 4195, "valid_targets_mean": 3755.5, "valid_targets_min": 3024 }, { "epoch": 4.752688172043011, "grad_norm": 0.3773991905548678, "learning_rate": 1.1323051304568292e-05, "loss": 0.0805, "loss_nan_ranks": 0, "loss_rank_avg": 0.04429854452610016, "step": 4200, "valid_targets_mean": 3352.0, "valid_targets_min": 2366 }, { "epoch": 4.7583474816072435, "grad_norm": 0.5035610691167854, "learning_rate": 1.1272259310626872e-05, "loss": 0.0782, "loss_nan_ranks": 0, "loss_rank_avg": 0.04907100647687912, "step": 4205, "valid_targets_mean": 956.8, "valid_targets_min": 509 }, { "epoch": 4.764006791171477, "grad_norm": 0.45983183893965734, "learning_rate": 1.122153675303244e-05, "loss": 0.0881, "loss_nan_ranks": 0, "loss_rank_avg": 0.03519134968519211, "step": 4210, "valid_targets_mean": 3013.6, "valid_targets_min": 1158 }, { "epoch": 4.76966610073571, "grad_norm": 0.33209367748663793, "learning_rate": 1.1170884035324607e-05, "loss": 0.0661, "loss_nan_ranks": 0, "loss_rank_avg": 0.034753963351249695, "step": 4215, "valid_targets_mean": 3860.5, "valid_targets_min": 3044 }, { "epoch": 4.775325410299944, "grad_norm": 0.3847170268802759, "learning_rate": 1.1120301560487365e-05, "loss": 0.0819, "loss_nan_ranks": 0, "loss_rank_avg": 0.02686852589249611, "step": 4220, "valid_targets_mean": 2286.4, "valid_targets_min": 539 }, { "epoch": 4.780984719864176, "grad_norm": 0.6034937690417163, "learning_rate": 1.1069789730945849e-05, "loss": 0.083, "loss_nan_ranks": 0, "loss_rank_avg": 0.03560284525156021, "step": 4225, "valid_targets_mean": 2865.5, "valid_targets_min": 912 }, { "epoch": 4.78664402942841, "grad_norm": 0.6053259730967792, "learning_rate": 1.1019348948563154e-05, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.04834606498479843, "step": 4230, "valid_targets_mean": 2087.4, "valid_targets_min": 872 }, { "epoch": 4.792303338992643, "grad_norm": 0.40623321419478176, "learning_rate": 1.096897961463714e-05, "loss": 0.0838, "loss_nan_ranks": 0, "loss_rank_avg": 0.026839591562747955, "step": 4235, "valid_targets_mean": 3380.1, "valid_targets_min": 2254 }, { "epoch": 4.797962648556876, "grad_norm": 0.7531250762705376, "learning_rate": 1.0918682129897244e-05, "loss": 0.0856, "loss_nan_ranks": 0, "loss_rank_avg": 0.05346660315990448, "step": 4240, "valid_targets_mean": 1274.0, "valid_targets_min": 605 }, { "epoch": 4.803621958121109, "grad_norm": 0.4541710056333317, "learning_rate": 1.0868456894501276e-05, "loss": 0.0772, "loss_nan_ranks": 0, "loss_rank_avg": 0.044228989630937576, "step": 4245, "valid_targets_mean": 2289.0, "valid_targets_min": 1117 }, { "epoch": 4.809281267685343, "grad_norm": 0.48951262028685094, "learning_rate": 1.0818304308032232e-05, "loss": 0.1018, "loss_nan_ranks": 0, "loss_rank_avg": 0.03746718168258667, "step": 4250, "valid_targets_mean": 3169.9, "valid_targets_min": 1132 }, { "epoch": 4.814940577249575, "grad_norm": 0.4192328688567942, "learning_rate": 1.0768224769495155e-05, "loss": 0.0783, "loss_nan_ranks": 0, "loss_rank_avg": 0.028717348352074623, "step": 4255, "valid_targets_mean": 2107.4, "valid_targets_min": 524 }, { "epoch": 4.820599886813809, "grad_norm": 0.4462875440845788, "learning_rate": 1.0718218677313904e-05, "loss": 0.0726, "loss_nan_ranks": 0, "loss_rank_avg": 0.032722052186727524, "step": 4260, "valid_targets_mean": 1705.8, "valid_targets_min": 516 }, { "epoch": 4.826259196378042, "grad_norm": 0.5227401635445773, "learning_rate": 1.0668286429328015e-05, "loss": 0.0913, "loss_nan_ranks": 0, "loss_rank_avg": 0.04021327197551727, "step": 4265, "valid_targets_mean": 2088.2, "valid_targets_min": 342 }, { "epoch": 4.831918505942275, "grad_norm": 0.37467202581633297, "learning_rate": 1.0618428422789555e-05, "loss": 0.0858, "loss_nan_ranks": 0, "loss_rank_avg": 0.035980671644210815, "step": 4270, "valid_targets_mean": 3528.1, "valid_targets_min": 1935 }, { "epoch": 4.837577815506508, "grad_norm": 0.5620575705357205, "learning_rate": 1.0568645054359919e-05, "loss": 0.0677, "loss_nan_ranks": 0, "loss_rank_avg": 0.029610414057970047, "step": 4275, "valid_targets_mean": 1818.2, "valid_targets_min": 564 }, { "epoch": 4.8432371250707416, "grad_norm": 0.35221795133693484, "learning_rate": 1.051893672010669e-05, "loss": 0.0779, "loss_nan_ranks": 0, "loss_rank_avg": 0.036343298852443695, "step": 4280, "valid_targets_mean": 5238.9, "valid_targets_min": 3653 }, { "epoch": 4.848896434634975, "grad_norm": 0.34385645132118725, "learning_rate": 1.0469303815500518e-05, "loss": 0.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.0252225324511528, "step": 4285, "valid_targets_mean": 2983.4, "valid_targets_min": 684 }, { "epoch": 4.8545557441992075, "grad_norm": 0.4035843769574735, "learning_rate": 1.0419746735411922e-05, "loss": 0.0633, "loss_nan_ranks": 0, "loss_rank_avg": 0.03745335340499878, "step": 4290, "valid_targets_mean": 3324.8, "valid_targets_min": 726 }, { "epoch": 4.860215053763441, "grad_norm": 0.3379316891220196, "learning_rate": 1.037026587410819e-05, "loss": 0.0873, "loss_nan_ranks": 0, "loss_rank_avg": 0.04062708839774132, "step": 4295, "valid_targets_mean": 4154.5, "valid_targets_min": 3469 }, { "epoch": 4.8658743633276735, "grad_norm": 0.5869714625833198, "learning_rate": 1.032086162525021e-05, "loss": 0.0974, "loss_nan_ranks": 0, "loss_rank_avg": 0.1502927839756012, "step": 4300, "valid_targets_mean": 2561.6, "valid_targets_min": 1536 }, { "epoch": 4.871533672891907, "grad_norm": 0.3806887067815329, "learning_rate": 1.0271534381889385e-05, "loss": 0.078, "loss_nan_ranks": 0, "loss_rank_avg": 0.041151951998472214, "step": 4305, "valid_targets_mean": 2912.4, "valid_targets_min": 582 }, { "epoch": 4.87719298245614, "grad_norm": 0.3310535788490826, "learning_rate": 1.0222284536464451e-05, "loss": 0.0892, "loss_nan_ranks": 0, "loss_rank_avg": 0.026854077354073524, "step": 4310, "valid_targets_mean": 3388.5, "valid_targets_min": 633 }, { "epoch": 4.882852292020374, "grad_norm": 0.40632377202265596, "learning_rate": 1.0173112480798376e-05, "loss": 0.0988, "loss_nan_ranks": 0, "loss_rank_avg": 0.03150768578052521, "step": 4315, "valid_targets_mean": 3263.6, "valid_targets_min": 1130 }, { "epoch": 4.888511601584606, "grad_norm": 0.42612380843339315, "learning_rate": 1.0124018606095278e-05, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.03779520094394684, "step": 4320, "valid_targets_mean": 2866.5, "valid_targets_min": 492 }, { "epoch": 4.89417091114884, "grad_norm": 0.6847680115960296, "learning_rate": 1.0075003302937247e-05, "loss": 0.0841, "loss_nan_ranks": 0, "loss_rank_avg": 0.05836600810289383, "step": 4325, "valid_targets_mean": 2353.8, "valid_targets_min": 1045 }, { "epoch": 4.899830220713073, "grad_norm": 0.3809740597349084, "learning_rate": 1.0026066961281282e-05, "loss": 0.0712, "loss_nan_ranks": 0, "loss_rank_avg": 0.025576546788215637, "step": 4330, "valid_targets_mean": 3043.9, "valid_targets_min": 647 }, { "epoch": 4.905489530277306, "grad_norm": 0.625831634310936, "learning_rate": 9.977209970456194e-06, "loss": 0.1175, "loss_nan_ranks": 0, "loss_rank_avg": 0.0737590566277504, "step": 4335, "valid_targets_mean": 2093.0, "valid_targets_min": 806 }, { "epoch": 4.911148839841539, "grad_norm": 0.6263000587819555, "learning_rate": 9.928432719159475e-06, "loss": 0.107, "loss_nan_ranks": 0, "loss_rank_avg": 0.041312504559755325, "step": 4340, "valid_targets_mean": 1208.8, "valid_targets_min": 575 }, { "epoch": 4.916808149405773, "grad_norm": 0.44496719578733984, "learning_rate": 9.879735595454232e-06, "loss": 0.077, "loss_nan_ranks": 0, "loss_rank_avg": 0.03539961576461792, "step": 4345, "valid_targets_mean": 3447.5, "valid_targets_min": 2784 }, { "epoch": 4.922467458970006, "grad_norm": 0.37638760798797666, "learning_rate": 9.831118986766084e-06, "loss": 0.0768, "loss_nan_ranks": 0, "loss_rank_avg": 0.030857397243380547, "step": 4350, "valid_targets_mean": 3721.6, "valid_targets_min": 2525 }, { "epoch": 4.928126768534239, "grad_norm": 0.4266897421917311, "learning_rate": 9.782583279880096e-06, "loss": 0.0769, "loss_nan_ranks": 0, "loss_rank_avg": 0.030803639441728592, "step": 4355, "valid_targets_mean": 2665.2, "valid_targets_min": 767 }, { "epoch": 4.933786078098472, "grad_norm": 0.46673207366963637, "learning_rate": 9.734128860937675e-06, "loss": 0.0688, "loss_nan_ranks": 0, "loss_rank_avg": 0.031016550958156586, "step": 4360, "valid_targets_mean": 2277.6, "valid_targets_min": 870 }, { "epoch": 4.939445387662705, "grad_norm": 0.7649765411181526, "learning_rate": 9.68575611543355e-06, "loss": 0.0954, "loss_nan_ranks": 0, "loss_rank_avg": 0.05628187209367752, "step": 4365, "valid_targets_mean": 1535.8, "valid_targets_min": 758 }, { "epoch": 4.945104697226938, "grad_norm": 0.452703192648749, "learning_rate": 9.637465428212636e-06, "loss": 0.068, "loss_nan_ranks": 0, "loss_rank_avg": 0.037448108196258545, "step": 4370, "valid_targets_mean": 2024.1, "valid_targets_min": 797 }, { "epoch": 4.950764006791172, "grad_norm": 0.4250155772613219, "learning_rate": 9.589257183467025e-06, "loss": 0.0724, "loss_nan_ranks": 0, "loss_rank_avg": 0.034758277237415314, "step": 4375, "valid_targets_mean": 3299.5, "valid_targets_min": 1606 }, { "epoch": 4.956423316355405, "grad_norm": 0.5030761530701435, "learning_rate": 9.541131764732896e-06, "loss": 0.0743, "loss_nan_ranks": 0, "loss_rank_avg": 0.04057200998067856, "step": 4380, "valid_targets_mean": 3055.0, "valid_targets_min": 678 }, { "epoch": 4.962082625919638, "grad_norm": 0.3454890398598417, "learning_rate": 9.493089554887508e-06, "loss": 0.0792, "loss_nan_ranks": 0, "loss_rank_avg": 0.037702687084674835, "step": 4385, "valid_targets_mean": 4980.6, "valid_targets_min": 1078 }, { "epoch": 4.967741935483871, "grad_norm": 0.3417198049280031, "learning_rate": 9.445130936146098e-06, "loss": 0.0696, "loss_nan_ranks": 0, "loss_rank_avg": 0.02648003399372101, "step": 4390, "valid_targets_mean": 2680.8, "valid_targets_min": 706 }, { "epoch": 4.973401245048104, "grad_norm": 0.5884179767956441, "learning_rate": 9.397256290058869e-06, "loss": 0.0767, "loss_nan_ranks": 0, "loss_rank_avg": 0.048919759690761566, "step": 4395, "valid_targets_mean": 1580.4, "valid_targets_min": 580 }, { "epoch": 4.979060554612337, "grad_norm": 0.5496614675946481, "learning_rate": 9.349465997507974e-06, "loss": 0.0971, "loss_nan_ranks": 0, "loss_rank_avg": 0.07147332280874252, "step": 4400, "valid_targets_mean": 2592.1, "valid_targets_min": 780 }, { "epoch": 4.98471986417657, "grad_norm": 0.3756997485189556, "learning_rate": 9.301760438704442e-06, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.03079824708402157, "step": 4405, "valid_targets_mean": 3478.2, "valid_targets_min": 2861 }, { "epoch": 4.990379173740804, "grad_norm": 0.4112393944489124, "learning_rate": 9.254139993185176e-06, "loss": 0.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.0403585322201252, "step": 4410, "valid_targets_mean": 3846.5, "valid_targets_min": 2453 }, { "epoch": 4.996038483305036, "grad_norm": 0.42208698207818324, "learning_rate": 9.206605039809955e-06, "loss": 0.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.04255661368370056, "step": 4415, "valid_targets_mean": 3881.8, "valid_targets_min": 3389 }, { "epoch": 5.001131861912847, "grad_norm": 0.7669520907027851, "learning_rate": 9.159155956758375e-06, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.09069793671369553, "step": 4420, "valid_targets_mean": 6935.0, "valid_targets_min": 5295 }, { "epoch": 5.006791171477079, "grad_norm": 0.558900053602927, "learning_rate": 9.111793121526862e-06, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.0958920270204544, "step": 4425, "valid_targets_mean": 7672.9, "valid_targets_min": 5066 }, { "epoch": 5.012450481041313, "grad_norm": 0.42971110414210983, "learning_rate": 9.064516910925698e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.0791202113032341, "step": 4430, "valid_targets_mean": 7347.6, "valid_targets_min": 4923 }, { "epoch": 5.018109790605546, "grad_norm": 0.424026939483264, "learning_rate": 9.017327701075965e-06, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.07265719771385193, "step": 4435, "valid_targets_mean": 5446.8, "valid_targets_min": 3922 }, { "epoch": 5.023769100169779, "grad_norm": 0.3966328657232047, "learning_rate": 8.970225867406593e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.0743541494011879, "step": 4440, "valid_targets_mean": 6924.9, "valid_targets_min": 4797 }, { "epoch": 5.029428409734012, "grad_norm": 0.40249258933443416, "learning_rate": 8.923211784651356e-06, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.08096291124820709, "step": 4445, "valid_targets_mean": 6443.5, "valid_targets_min": 3853 }, { "epoch": 5.035087719298246, "grad_norm": 0.5019839927447249, "learning_rate": 8.876285826845918e-06, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.0774025097489357, "step": 4450, "valid_targets_mean": 5446.5, "valid_targets_min": 4487 }, { "epoch": 5.040747028862479, "grad_norm": 0.41328338470674536, "learning_rate": 8.82944836732482e-06, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.07444000989198685, "step": 4455, "valid_targets_mean": 6210.2, "valid_targets_min": 4137 }, { "epoch": 5.046406338426712, "grad_norm": 0.5368670084410287, "learning_rate": 8.782699778718516e-06, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.1226726844906807, "step": 4460, "valid_targets_mean": 5404.4, "valid_targets_min": 698 }, { "epoch": 5.052065647990945, "grad_norm": 0.4194795096973056, "learning_rate": 8.736040432950447e-06, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.08990229666233063, "step": 4465, "valid_targets_mean": 7197.6, "valid_targets_min": 4499 }, { "epoch": 5.057724957555179, "grad_norm": 0.45155172518626197, "learning_rate": 8.689470701234037e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.10899793356657028, "step": 4470, "valid_targets_mean": 5538.4, "valid_targets_min": 4291 }, { "epoch": 5.063384267119411, "grad_norm": 0.3856721196725891, "learning_rate": 8.642990954069747e-06, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.06013498827815056, "step": 4475, "valid_targets_mean": 5531.4, "valid_targets_min": 4050 }, { "epoch": 5.069043576683645, "grad_norm": 0.43003600987131757, "learning_rate": 8.596601561242167e-06, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.08636723458766937, "step": 4480, "valid_targets_mean": 7526.6, "valid_targets_min": 5196 }, { "epoch": 5.074702886247878, "grad_norm": 0.37505619278492647, "learning_rate": 8.550302891817015e-06, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.0698092132806778, "step": 4485, "valid_targets_mean": 6248.9, "valid_targets_min": 4749 }, { "epoch": 5.080362195812111, "grad_norm": 0.4318746906316014, "learning_rate": 8.50409531413824e-06, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.039330024272203445, "step": 4490, "valid_targets_mean": 3248.5, "valid_targets_min": 1908 }, { "epoch": 5.086021505376344, "grad_norm": 0.41762584637699307, "learning_rate": 8.457979195825076e-06, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.070592001080513, "step": 4495, "valid_targets_mean": 6225.6, "valid_targets_min": 4808 }, { "epoch": 5.0916808149405774, "grad_norm": 0.4025616969393729, "learning_rate": 8.411954903769145e-06, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.0751720666885376, "step": 4500, "valid_targets_mean": 5383.0, "valid_targets_min": 3774 }, { "epoch": 5.09734012450481, "grad_norm": 0.4221341874106493, "learning_rate": 8.366022804131487e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.07378105074167252, "step": 4505, "valid_targets_mean": 6291.4, "valid_targets_min": 5335 }, { "epoch": 5.102999434069043, "grad_norm": 0.3829917137612727, "learning_rate": 8.320183262339686e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.07340899109840393, "step": 4510, "valid_targets_mean": 7749.1, "valid_targets_min": 6205 }, { "epoch": 5.108658743633277, "grad_norm": 0.3805013608286788, "learning_rate": 8.274436643084962e-06, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.0707998052239418, "step": 4515, "valid_targets_mean": 6882.1, "valid_targets_min": 4428 }, { "epoch": 5.11431805319751, "grad_norm": 0.48028126526368026, "learning_rate": 8.228783310319248e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.07884474098682404, "step": 4520, "valid_targets_mean": 5751.8, "valid_targets_min": 4458 }, { "epoch": 5.119977362761743, "grad_norm": 0.3926095512807884, "learning_rate": 8.183223627252305e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.06521456688642502, "step": 4525, "valid_targets_mean": 6003.9, "valid_targets_min": 4458 }, { "epoch": 5.125636672325976, "grad_norm": 0.4181977204631873, "learning_rate": 8.137757956348854e-06, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.06609899550676346, "step": 4530, "valid_targets_mean": 6033.8, "valid_targets_min": 4066 }, { "epoch": 5.13129598189021, "grad_norm": 0.46323510844564697, "learning_rate": 8.092386659325644e-06, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.08222903311252594, "step": 4535, "valid_targets_mean": 6601.0, "valid_targets_min": 4708 }, { "epoch": 5.136955291454442, "grad_norm": 0.4315489667874819, "learning_rate": 8.047110097148618e-06, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.08429074287414551, "step": 4540, "valid_targets_mean": 6092.1, "valid_targets_min": 4789 }, { "epoch": 5.142614601018676, "grad_norm": 0.42567220761721475, "learning_rate": 8.001928630030017e-06, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.08571913838386536, "step": 4545, "valid_targets_mean": 6474.6, "valid_targets_min": 4224 }, { "epoch": 5.148273910582909, "grad_norm": 0.41413321611049403, "learning_rate": 7.95684261742554e-06, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.08004915714263916, "step": 4550, "valid_targets_mean": 6312.4, "valid_targets_min": 4617 }, { "epoch": 5.153933220147142, "grad_norm": 0.4071549037169186, "learning_rate": 7.911852418031449e-06, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.0771443247795105, "step": 4555, "valid_targets_mean": 6333.8, "valid_targets_min": 4783 }, { "epoch": 5.159592529711375, "grad_norm": 0.40644763519175936, "learning_rate": 7.866958389781736e-06, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.07742355763912201, "step": 4560, "valid_targets_mean": 7380.1, "valid_targets_min": 6020 }, { "epoch": 5.165251839275609, "grad_norm": 0.4306799765061804, "learning_rate": 7.822160889845286e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.08144442737102509, "step": 4565, "valid_targets_mean": 6009.0, "valid_targets_min": 3049 }, { "epoch": 5.170911148839841, "grad_norm": 0.41741532189159075, "learning_rate": 7.777460274623005e-06, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.07007598876953125, "step": 4570, "valid_targets_mean": 5973.1, "valid_targets_min": 4822 }, { "epoch": 5.176570458404075, "grad_norm": 0.4294904406202204, "learning_rate": 7.732856899745003e-06, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.07263119518756866, "step": 4575, "valid_targets_mean": 5754.9, "valid_targets_min": 2910 }, { "epoch": 5.182229767968308, "grad_norm": 0.44380956966564805, "learning_rate": 7.688351120067781e-06, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.08814549446105957, "step": 4580, "valid_targets_mean": 6414.6, "valid_targets_min": 4791 }, { "epoch": 5.187889077532541, "grad_norm": 0.4526826853647187, "learning_rate": 7.643943289671374e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.07937498390674591, "step": 4585, "valid_targets_mean": 5675.9, "valid_targets_min": 3983 }, { "epoch": 5.193548387096774, "grad_norm": 0.3578771225498125, "learning_rate": 7.599633761856542e-06, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.06336264312267303, "step": 4590, "valid_targets_mean": 6975.5, "valid_targets_min": 4383 }, { "epoch": 5.1992076966610075, "grad_norm": 0.3907734003361043, "learning_rate": 7.555422889141997e-06, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.073424331843853, "step": 4595, "valid_targets_mean": 6417.1, "valid_targets_min": 3182 }, { "epoch": 5.204867006225241, "grad_norm": 0.4311567298480243, "learning_rate": 7.51131102326154e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.0849514901638031, "step": 4600, "valid_targets_mean": 6218.6, "valid_targets_min": 5077 }, { "epoch": 5.2105263157894735, "grad_norm": 0.4696685522510483, "learning_rate": 7.467298515161305e-06, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.0753907635807991, "step": 4605, "valid_targets_mean": 4774.9, "valid_targets_min": 3663 }, { "epoch": 5.216185625353707, "grad_norm": 0.41679582330020365, "learning_rate": 7.423385714996942e-06, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.07688593864440918, "step": 4610, "valid_targets_mean": 6316.8, "valid_targets_min": 4105 }, { "epoch": 5.22184493491794, "grad_norm": 0.4005301809886344, "learning_rate": 7.379572972130864e-06, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.06853274255990982, "step": 4615, "valid_targets_mean": 6528.9, "valid_targets_min": 4537 }, { "epoch": 5.227504244482173, "grad_norm": 0.4028892173858166, "learning_rate": 7.335860635129426e-06, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.06940186023712158, "step": 4620, "valid_targets_mean": 6416.8, "valid_targets_min": 2494 }, { "epoch": 5.233163554046406, "grad_norm": 0.40156406656775434, "learning_rate": 7.292249051760169e-06, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.0779690071940422, "step": 4625, "valid_targets_mean": 6070.9, "valid_targets_min": 4921 }, { "epoch": 5.23882286361064, "grad_norm": 0.4027854588002, "learning_rate": 7.2487385689890845e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.0822412520647049, "step": 4630, "valid_targets_mean": 6701.4, "valid_targets_min": 5285 }, { "epoch": 5.244482173174872, "grad_norm": 0.42468145589722883, "learning_rate": 7.205329532977794e-06, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.0705537348985672, "step": 4635, "valid_targets_mean": 6273.9, "valid_targets_min": 4464 }, { "epoch": 5.250141482739106, "grad_norm": 0.45132048278659165, "learning_rate": 7.162022289080837e-06, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.06876321882009506, "step": 4640, "valid_targets_mean": 5554.8, "valid_targets_min": 4439 }, { "epoch": 5.255800792303339, "grad_norm": 0.41803966931151526, "learning_rate": 7.1188171818429256e-06, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.06165836751461029, "step": 4645, "valid_targets_mean": 6043.0, "valid_targets_min": 4686 }, { "epoch": 5.261460101867572, "grad_norm": 0.440878055574104, "learning_rate": 7.075714554996176e-06, "loss": 0.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.06370429694652557, "step": 4650, "valid_targets_mean": 5912.5, "valid_targets_min": 3381 }, { "epoch": 5.267119411431805, "grad_norm": 0.612073574059755, "learning_rate": 7.032714751457395e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.06927108019590378, "step": 4655, "valid_targets_mean": 6495.5, "valid_targets_min": 5309 }, { "epoch": 5.272778720996039, "grad_norm": 0.4251949566082133, "learning_rate": 6.989818113325333e-06, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.07870665192604065, "step": 4660, "valid_targets_mean": 6483.9, "valid_targets_min": 5161 }, { "epoch": 5.278438030560272, "grad_norm": 0.4438435905888869, "learning_rate": 6.947024981878001e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.07518930733203888, "step": 4665, "valid_targets_mean": 5958.9, "valid_targets_min": 4666 }, { "epoch": 5.284097340124505, "grad_norm": 0.5827403553757994, "learning_rate": 6.904335697569909e-06, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.09826524555683136, "step": 4670, "valid_targets_mean": 1691.5, "valid_targets_min": 1440 }, { "epoch": 5.289756649688738, "grad_norm": 0.4333512080117021, "learning_rate": 6.861750600029373e-06, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.06576051563024521, "step": 4675, "valid_targets_mean": 5299.1, "valid_targets_min": 4547 }, { "epoch": 5.2954159592529715, "grad_norm": 0.4298304067134876, "learning_rate": 6.819270028055844e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.07609501481056213, "step": 4680, "valid_targets_mean": 6003.5, "valid_targets_min": 5031 }, { "epoch": 5.301075268817204, "grad_norm": 0.434080083592628, "learning_rate": 6.776894319617162e-06, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.06977563351392746, "step": 4685, "valid_targets_mean": 8169.6, "valid_targets_min": 5487 }, { "epoch": 5.3067345783814375, "grad_norm": 0.4234596055091472, "learning_rate": 6.73462381184689e-06, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.0698070153594017, "step": 4690, "valid_targets_mean": 6474.9, "valid_targets_min": 4253 }, { "epoch": 5.312393887945671, "grad_norm": 0.4227309069414161, "learning_rate": 6.6924588410416604e-06, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.08599575608968735, "step": 4695, "valid_targets_mean": 7021.0, "valid_targets_min": 4990 }, { "epoch": 5.3180531975099035, "grad_norm": 0.4433300308692838, "learning_rate": 6.650399742658442e-06, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.08826185762882233, "step": 4700, "valid_targets_mean": 6356.0, "valid_targets_min": 4385 }, { "epoch": 5.323712507074137, "grad_norm": 0.38772347681595304, "learning_rate": 6.608446851311918e-06, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.08048726618289948, "step": 4705, "valid_targets_mean": 6815.1, "valid_targets_min": 5164 }, { "epoch": 5.32937181663837, "grad_norm": 0.40251172074444747, "learning_rate": 6.566600500771796e-06, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.05604606121778488, "step": 4710, "valid_targets_mean": 5588.5, "valid_targets_min": 4098 }, { "epoch": 5.335031126202603, "grad_norm": 0.41678126626964224, "learning_rate": 6.524861023960185e-06, "loss": 0.1386, "loss_nan_ranks": 0, "loss_rank_avg": 0.07454540580511093, "step": 4715, "valid_targets_mean": 6167.6, "valid_targets_min": 4801 }, { "epoch": 5.340690435766836, "grad_norm": 0.45099069972017347, "learning_rate": 6.483228752948902e-06, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.18380106985569, "step": 4720, "valid_targets_mean": 6224.9, "valid_targets_min": 4772 }, { "epoch": 5.34634974533107, "grad_norm": 0.44008724009186123, "learning_rate": 6.441704018956858e-06, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.08497292548418045, "step": 4725, "valid_targets_mean": 6549.2, "valid_targets_min": 5025 }, { "epoch": 5.352009054895303, "grad_norm": 0.5276958180485326, "learning_rate": 6.400287152347442e-06, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.0843924731016159, "step": 4730, "valid_targets_mean": 6680.8, "valid_targets_min": 4818 }, { "epoch": 5.357668364459536, "grad_norm": 0.46757375166774123, "learning_rate": 6.35897848262584e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.0748303085565567, "step": 4735, "valid_targets_mean": 5835.1, "valid_targets_min": 4111 }, { "epoch": 5.363327674023769, "grad_norm": 0.42048683370736745, "learning_rate": 6.317778338436449e-06, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.07209735363721848, "step": 4740, "valid_targets_mean": 7029.9, "valid_targets_min": 2275 }, { "epoch": 5.368986983588003, "grad_norm": 0.41548903650378316, "learning_rate": 6.276687047560275e-06, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.06418467313051224, "step": 4745, "valid_targets_mean": 5621.2, "valid_targets_min": 4826 }, { "epoch": 5.374646293152235, "grad_norm": 0.4009641412548776, "learning_rate": 6.235704936912288e-06, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.06733281910419464, "step": 4750, "valid_targets_mean": 6858.8, "valid_targets_min": 4710 }, { "epoch": 5.380305602716469, "grad_norm": 0.4058686462438823, "learning_rate": 6.194832332538838e-06, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.10353972017765045, "step": 4755, "valid_targets_mean": 7012.5, "valid_targets_min": 5421 }, { "epoch": 5.385964912280702, "grad_norm": 0.4080275617258039, "learning_rate": 6.154069559615081e-06, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.06577767431735992, "step": 4760, "valid_targets_mean": 6967.6, "valid_targets_min": 4949 }, { "epoch": 5.391624221844935, "grad_norm": 0.38798007962489367, "learning_rate": 6.113416942442358e-06, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.07223743200302124, "step": 4765, "valid_targets_mean": 6348.5, "valid_targets_min": 4831 }, { "epoch": 5.397283531409168, "grad_norm": 0.4311691528295395, "learning_rate": 6.072874804445632e-06, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.09179031848907471, "step": 4770, "valid_targets_mean": 6597.2, "valid_targets_min": 4018 }, { "epoch": 5.4029428409734015, "grad_norm": 0.3467602354311775, "learning_rate": 6.032443468170912e-06, "loss": 0.1386, "loss_nan_ranks": 0, "loss_rank_avg": 0.051479682326316833, "step": 4775, "valid_targets_mean": 6420.9, "valid_targets_min": 5034 }, { "epoch": 5.408602150537634, "grad_norm": 0.41667026215499137, "learning_rate": 5.992123255282702e-06, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.08383023738861084, "step": 4780, "valid_targets_mean": 6962.4, "valid_targets_min": 5442 }, { "epoch": 5.4142614601018675, "grad_norm": 0.4802376377588568, "learning_rate": 5.951914486561417e-06, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.07770697772502899, "step": 4785, "valid_targets_mean": 5610.9, "valid_targets_min": 4609 }, { "epoch": 5.419920769666101, "grad_norm": 0.4589664164147789, "learning_rate": 5.911817481900832e-06, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.07419160008430481, "step": 4790, "valid_targets_mean": 5038.4, "valid_targets_min": 2301 }, { "epoch": 5.425580079230334, "grad_norm": 0.5730477242441706, "learning_rate": 5.871832560305573e-06, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.0763842836022377, "step": 4795, "valid_targets_mean": 1449.8, "valid_targets_min": 363 }, { "epoch": 5.431239388794567, "grad_norm": 0.38431554670090246, "learning_rate": 5.831960039888533e-06, "loss": 0.0822, "loss_nan_ranks": 0, "loss_rank_avg": 0.04814344644546509, "step": 4800, "valid_targets_mean": 3729.8, "valid_targets_min": 3074 }, { "epoch": 5.4368986983588, "grad_norm": 0.42804624601009617, "learning_rate": 5.792200237868361e-06, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.04012545943260193, "step": 4805, "valid_targets_mean": 2272.8, "valid_targets_min": 700 }, { "epoch": 5.442558007923034, "grad_norm": 0.47429604453716917, "learning_rate": 5.752553470566957e-06, "loss": 0.0804, "loss_nan_ranks": 0, "loss_rank_avg": 0.03822815418243408, "step": 4810, "valid_targets_mean": 2997.5, "valid_targets_min": 803 }, { "epoch": 5.448217317487266, "grad_norm": 0.47494590604900366, "learning_rate": 5.713020053406917e-06, "loss": 0.0738, "loss_nan_ranks": 0, "loss_rank_avg": 0.04123368859291077, "step": 4815, "valid_targets_mean": 2655.5, "valid_targets_min": 920 }, { "epoch": 5.4538766270515, "grad_norm": 0.432653492711929, "learning_rate": 5.673600300909053e-06, "loss": 0.0787, "loss_nan_ranks": 0, "loss_rank_avg": 0.04253911226987839, "step": 4820, "valid_targets_mean": 3263.8, "valid_targets_min": 806 }, { "epoch": 5.459535936615733, "grad_norm": 0.7187022007851978, "learning_rate": 5.634294526689872e-06, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.06496002525091171, "step": 4825, "valid_targets_mean": 1644.4, "valid_targets_min": 718 }, { "epoch": 5.465195246179966, "grad_norm": 0.4211215979416941, "learning_rate": 5.595103043459109e-06, "loss": 0.0868, "loss_nan_ranks": 0, "loss_rank_avg": 0.043419234454631805, "step": 4830, "valid_targets_mean": 3399.4, "valid_targets_min": 1133 }, { "epoch": 5.470854555744199, "grad_norm": 0.4693753835767023, "learning_rate": 5.556026163017205e-06, "loss": 0.0849, "loss_nan_ranks": 0, "loss_rank_avg": 0.035194315016269684, "step": 4835, "valid_targets_mean": 1808.9, "valid_targets_min": 859 }, { "epoch": 5.476513865308433, "grad_norm": 0.27086846723671243, "learning_rate": 5.517064196252837e-06, "loss": 0.1077, "loss_nan_ranks": 0, "loss_rank_avg": 0.023684551939368248, "step": 4840, "valid_targets_mean": 5541.4, "valid_targets_min": 5150 }, { "epoch": 5.482173174872665, "grad_norm": 0.48126645790976275, "learning_rate": 5.478217453140471e-06, "loss": 0.0683, "loss_nan_ranks": 0, "loss_rank_avg": 0.04665878415107727, "step": 4845, "valid_targets_mean": 4000.1, "valid_targets_min": 502 }, { "epoch": 5.487832484436899, "grad_norm": 0.3917605803512901, "learning_rate": 5.439486242737855e-06, "loss": 0.0734, "loss_nan_ranks": 0, "loss_rank_avg": 0.043694302439689636, "step": 4850, "valid_targets_mean": 3906.9, "valid_targets_min": 600 }, { "epoch": 5.493491794001132, "grad_norm": 0.39241086936632663, "learning_rate": 5.400870873183583e-06, "loss": 0.071, "loss_nan_ranks": 0, "loss_rank_avg": 0.03243585675954819, "step": 4855, "valid_targets_mean": 2979.5, "valid_targets_min": 518 }, { "epoch": 5.499151103565365, "grad_norm": 0.43406960946047696, "learning_rate": 5.362371651694647e-06, "loss": 0.1167, "loss_nan_ranks": 0, "loss_rank_avg": 0.04233259707689285, "step": 4860, "valid_targets_mean": 3522.5, "valid_targets_min": 549 }, { "epoch": 5.504810413129598, "grad_norm": 0.3572759598808805, "learning_rate": 5.323988884563975e-06, "loss": 0.0659, "loss_nan_ranks": 0, "loss_rank_avg": 0.02906729094684124, "step": 4865, "valid_targets_mean": 3878.5, "valid_targets_min": 3170 }, { "epoch": 5.5104697226938315, "grad_norm": 0.5208358787040975, "learning_rate": 5.2857228771580105e-06, "loss": 0.0794, "loss_nan_ranks": 0, "loss_rank_avg": 0.04582788050174713, "step": 4870, "valid_targets_mean": 1656.0, "valid_targets_min": 644 }, { "epoch": 5.516129032258064, "grad_norm": 0.3326607206725967, "learning_rate": 5.247573933914285e-06, "loss": 0.0604, "loss_nan_ranks": 0, "loss_rank_avg": 0.020800217986106873, "step": 4875, "valid_targets_mean": 2891.8, "valid_targets_min": 720 }, { "epoch": 5.5217883418222975, "grad_norm": 0.4923417370395899, "learning_rate": 5.20954235833898e-06, "loss": 0.08, "loss_nan_ranks": 0, "loss_rank_avg": 0.030622247606515884, "step": 4880, "valid_targets_mean": 1775.6, "valid_targets_min": 516 }, { "epoch": 5.527447651386531, "grad_norm": 0.5285695399568121, "learning_rate": 5.171628453004512e-06, "loss": 0.0823, "loss_nan_ranks": 0, "loss_rank_avg": 0.05061523616313934, "step": 4885, "valid_targets_mean": 2018.6, "valid_targets_min": 557 }, { "epoch": 5.533106960950764, "grad_norm": 0.5460414179629879, "learning_rate": 5.133832519547155e-06, "loss": 0.0849, "loss_nan_ranks": 0, "loss_rank_avg": 0.04757304489612579, "step": 4890, "valid_targets_mean": 3398.1, "valid_targets_min": 1086 }, { "epoch": 5.538766270514997, "grad_norm": 0.4886522424962672, "learning_rate": 5.096154858664608e-06, "loss": 0.0832, "loss_nan_ranks": 0, "loss_rank_avg": 0.04523239657282829, "step": 4895, "valid_targets_mean": 2532.9, "valid_targets_min": 1008 }, { "epoch": 5.54442558007923, "grad_norm": 0.498231032412165, "learning_rate": 5.058595770113606e-06, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.03225970268249512, "step": 4900, "valid_targets_mean": 3481.1, "valid_targets_min": 2756 }, { "epoch": 5.550084889643464, "grad_norm": 0.34825050975154626, "learning_rate": 5.0211555527075664e-06, "loss": 0.07, "loss_nan_ranks": 0, "loss_rank_avg": 0.03134623169898987, "step": 4905, "valid_targets_mean": 4113.5, "valid_targets_min": 3798 }, { "epoch": 5.555744199207696, "grad_norm": 0.8345018317724164, "learning_rate": 4.9838345043141665e-06, "loss": 0.0851, "loss_nan_ranks": 0, "loss_rank_avg": 0.07340296357870102, "step": 4910, "valid_targets_mean": 1058.6, "valid_targets_min": 598 }, { "epoch": 5.56140350877193, "grad_norm": 0.4594410538877418, "learning_rate": 4.946632921853009e-06, "loss": 0.0935, "loss_nan_ranks": 0, "loss_rank_avg": 0.030109558254480362, "step": 4915, "valid_targets_mean": 2403.5, "valid_targets_min": 754 }, { "epoch": 5.567062818336163, "grad_norm": 0.4270637822659359, "learning_rate": 4.909551101293238e-06, "loss": 0.0862, "loss_nan_ranks": 0, "loss_rank_avg": 0.03934195637702942, "step": 4920, "valid_targets_mean": 4045.8, "valid_targets_min": 3390 }, { "epoch": 5.572722127900396, "grad_norm": 0.6800143738685122, "learning_rate": 4.872589337651208e-06, "loss": 0.1131, "loss_nan_ranks": 0, "loss_rank_avg": 0.13332173228263855, "step": 4925, "valid_targets_mean": 2255.9, "valid_targets_min": 1052 }, { "epoch": 5.578381437464629, "grad_norm": 0.5031406060454691, "learning_rate": 4.835747924988105e-06, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.0451483353972435, "step": 4930, "valid_targets_mean": 3214.0, "valid_targets_min": 2176 }, { "epoch": 5.584040747028863, "grad_norm": 0.4795250100183131, "learning_rate": 4.799027156407632e-06, "loss": 0.0831, "loss_nan_ranks": 0, "loss_rank_avg": 0.038113273680210114, "step": 4935, "valid_targets_mean": 2396.0, "valid_targets_min": 1074 }, { "epoch": 5.589700056593095, "grad_norm": 0.4549673328264594, "learning_rate": 4.7624273240536756e-06, "loss": 0.0857, "loss_nan_ranks": 0, "loss_rank_avg": 0.04130017012357712, "step": 4940, "valid_targets_mean": 3271.8, "valid_targets_min": 1212 }, { "epoch": 5.595359366157329, "grad_norm": 0.48797530904109687, "learning_rate": 4.725948719107965e-06, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.049380846321582794, "step": 4945, "valid_targets_mean": 3990.8, "valid_targets_min": 2258 }, { "epoch": 5.601018675721562, "grad_norm": 0.34295461979365804, "learning_rate": 4.6895916317877624e-06, "loss": 0.0666, "loss_nan_ranks": 0, "loss_rank_avg": 0.047332584857940674, "step": 4950, "valid_targets_mean": 3730.2, "valid_targets_min": 1466 }, { "epoch": 5.6066779852857955, "grad_norm": 0.3693165572830921, "learning_rate": 4.653356351343577e-06, "loss": 0.0804, "loss_nan_ranks": 0, "loss_rank_avg": 0.03545898199081421, "step": 4955, "valid_targets_mean": 3557.1, "valid_targets_min": 560 }, { "epoch": 5.612337294850028, "grad_norm": 0.45760123311509754, "learning_rate": 4.617243166056826e-06, "loss": 0.0831, "loss_nan_ranks": 0, "loss_rank_avg": 0.04132983461022377, "step": 4960, "valid_targets_mean": 3222.9, "valid_targets_min": 1189 }, { "epoch": 5.6179966044142615, "grad_norm": 0.38183081000487035, "learning_rate": 4.581252363237567e-06, "loss": 0.069, "loss_nan_ranks": 0, "loss_rank_avg": 0.03381497412919998, "step": 4965, "valid_targets_mean": 3665.2, "valid_targets_min": 2257 }, { "epoch": 5.623655913978495, "grad_norm": 0.385036821503619, "learning_rate": 4.545384229222196e-06, "loss": 0.0679, "loss_nan_ranks": 0, "loss_rank_avg": 0.028356987982988358, "step": 4970, "valid_targets_mean": 3314.4, "valid_targets_min": 886 }, { "epoch": 5.6293152235427275, "grad_norm": 0.4014468518014719, "learning_rate": 4.509639049371193e-06, "loss": 0.0722, "loss_nan_ranks": 0, "loss_rank_avg": 0.03628263995051384, "step": 4975, "valid_targets_mean": 3377.5, "valid_targets_min": 2409 }, { "epoch": 5.634974533106961, "grad_norm": 0.401897256250637, "learning_rate": 4.474017108066828e-06, "loss": 0.0668, "loss_nan_ranks": 0, "loss_rank_avg": 0.03104272112250328, "step": 4980, "valid_targets_mean": 3241.8, "valid_targets_min": 820 }, { "epoch": 5.640633842671194, "grad_norm": 0.6805433850912309, "learning_rate": 4.438518688710898e-06, "loss": 0.1108, "loss_nan_ranks": 0, "loss_rank_avg": 0.08667178452014923, "step": 4985, "valid_targets_mean": 2264.2, "valid_targets_min": 813 }, { "epoch": 5.646293152235427, "grad_norm": 0.366707828447475, "learning_rate": 4.403144073722501e-06, "loss": 0.0626, "loss_nan_ranks": 0, "loss_rank_avg": 0.02789473347365856, "step": 4990, "valid_targets_mean": 3651.9, "valid_targets_min": 2877 }, { "epoch": 5.65195246179966, "grad_norm": 0.5065193268802206, "learning_rate": 4.367893544535757e-06, "loss": 0.0625, "loss_nan_ranks": 0, "loss_rank_avg": 0.039443302899599075, "step": 4995, "valid_targets_mean": 2384.0, "valid_targets_min": 667 }, { "epoch": 5.657611771363894, "grad_norm": 0.38590017909105073, "learning_rate": 4.332767381597575e-06, "loss": 0.0615, "loss_nan_ranks": 0, "loss_rank_avg": 0.029201095923781395, "step": 5000, "valid_targets_mean": 3488.6, "valid_targets_min": 2353 }, { "epoch": 5.663271080928126, "grad_norm": 0.40972454629192384, "learning_rate": 4.297765864365453e-06, "loss": 0.0647, "loss_nan_ranks": 0, "loss_rank_avg": 0.039309754967689514, "step": 5005, "valid_targets_mean": 3189.9, "valid_targets_min": 549 }, { "epoch": 5.66893039049236, "grad_norm": 0.42666806283297, "learning_rate": 4.262889271305204e-06, "loss": 0.1096, "loss_nan_ranks": 0, "loss_rank_avg": 0.0314299650490284, "step": 5010, "valid_targets_mean": 3826.5, "valid_targets_min": 3340 }, { "epoch": 5.674589700056593, "grad_norm": 0.5179962988049834, "learning_rate": 4.228137879888774e-06, "loss": 0.0926, "loss_nan_ranks": 0, "loss_rank_avg": 0.05188950523734093, "step": 5015, "valid_targets_mean": 2178.2, "valid_targets_min": 647 }, { "epoch": 5.680249009620827, "grad_norm": 0.4970353043681172, "learning_rate": 4.193511966592041e-06, "loss": 0.0755, "loss_nan_ranks": 0, "loss_rank_avg": 0.04057688266038895, "step": 5020, "valid_targets_mean": 1558.9, "valid_targets_min": 804 }, { "epoch": 5.685908319185059, "grad_norm": 0.7646762922675957, "learning_rate": 4.1590118068925815e-06, "loss": 0.0911, "loss_nan_ranks": 0, "loss_rank_avg": 0.08557213842868805, "step": 5025, "valid_targets_mean": 1855.1, "valid_targets_min": 702 }, { "epoch": 5.691567628749293, "grad_norm": 0.5384667166461213, "learning_rate": 4.124637675267511e-06, "loss": 0.1086, "loss_nan_ranks": 0, "loss_rank_avg": 0.05332893133163452, "step": 5030, "valid_targets_mean": 2858.1, "valid_targets_min": 945 }, { "epoch": 5.697226938313526, "grad_norm": 0.5288805198191306, "learning_rate": 4.090389845191278e-06, "loss": 0.0774, "loss_nan_ranks": 0, "loss_rank_avg": 0.049206458032131195, "step": 5035, "valid_targets_mean": 2879.5, "valid_targets_min": 703 }, { "epoch": 5.702886247877759, "grad_norm": 0.5414207861579454, "learning_rate": 4.056268589133516e-06, "loss": 0.095, "loss_nan_ranks": 0, "loss_rank_avg": 0.038104280829429626, "step": 5040, "valid_targets_mean": 3950.5, "valid_targets_min": 3051 }, { "epoch": 5.708545557441992, "grad_norm": 0.5739872667001847, "learning_rate": 4.022274178556844e-06, "loss": 0.0772, "loss_nan_ranks": 0, "loss_rank_avg": 0.05831873416900635, "step": 5045, "valid_targets_mean": 1759.8, "valid_targets_min": 523 }, { "epoch": 5.7142048670062255, "grad_norm": 0.3871279428177479, "learning_rate": 3.988406883914717e-06, "loss": 0.0696, "loss_nan_ranks": 0, "loss_rank_avg": 0.03543112799525261, "step": 5050, "valid_targets_mean": 2138.2, "valid_targets_min": 468 }, { "epoch": 5.719864176570458, "grad_norm": 0.29274510999762493, "learning_rate": 3.954666974649295e-06, "loss": 0.076, "loss_nan_ranks": 0, "loss_rank_avg": 0.021055569872260094, "step": 5055, "valid_targets_mean": 4428.1, "valid_targets_min": 885 }, { "epoch": 5.7255234861346915, "grad_norm": 0.3924485471902587, "learning_rate": 3.921054719189272e-06, "loss": 0.0679, "loss_nan_ranks": 0, "loss_rank_avg": 0.025709647685289383, "step": 5060, "valid_targets_mean": 2478.5, "valid_targets_min": 546 }, { "epoch": 5.731182795698925, "grad_norm": 0.3937628507775362, "learning_rate": 3.887570384947745e-06, "loss": 0.0657, "loss_nan_ranks": 0, "loss_rank_avg": 0.03667730838060379, "step": 5065, "valid_targets_mean": 3910.5, "valid_targets_min": 981 }, { "epoch": 5.7368421052631575, "grad_norm": 0.5433030872476484, "learning_rate": 3.854214238320109e-06, "loss": 0.0783, "loss_nan_ranks": 0, "loss_rank_avg": 0.04392950236797333, "step": 5070, "valid_targets_mean": 1519.9, "valid_targets_min": 697 }, { "epoch": 5.742501414827391, "grad_norm": 0.43220977807356675, "learning_rate": 3.8209865446819105e-06, "loss": 0.0818, "loss_nan_ranks": 0, "loss_rank_avg": 0.03852108120918274, "step": 5075, "valid_targets_mean": 3473.4, "valid_targets_min": 2777 }, { "epoch": 5.748160724391624, "grad_norm": 0.44530962837687676, "learning_rate": 3.7878875683867476e-06, "loss": 0.0845, "loss_nan_ranks": 0, "loss_rank_avg": 0.042130667716264725, "step": 5080, "valid_targets_mean": 3932.4, "valid_targets_min": 3061 }, { "epoch": 5.753820033955858, "grad_norm": 0.3694916026913543, "learning_rate": 3.7549175727641606e-06, "loss": 0.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.03624318540096283, "step": 5085, "valid_targets_mean": 2882.2, "valid_targets_min": 868 }, { "epoch": 5.75947934352009, "grad_norm": 0.4227025192070278, "learning_rate": 3.7220768201175615e-06, "loss": 0.0718, "loss_nan_ranks": 0, "loss_rank_avg": 0.03077586367726326, "step": 5090, "valid_targets_mean": 2506.6, "valid_targets_min": 752 }, { "epoch": 5.765138653084324, "grad_norm": 0.41725972794779176, "learning_rate": 3.689365571722112e-06, "loss": 0.0798, "loss_nan_ranks": 0, "loss_rank_avg": 0.03431401774287224, "step": 5095, "valid_targets_mean": 3418.9, "valid_targets_min": 1141 }, { "epoch": 5.770797962648556, "grad_norm": 0.3500677147973765, "learning_rate": 3.6567840878226577e-06, "loss": 0.0592, "loss_nan_ranks": 0, "loss_rank_avg": 0.03257271274924278, "step": 5100, "valid_targets_mean": 3901.2, "valid_targets_min": 3540 }, { "epoch": 5.77645727221279, "grad_norm": 0.43941140678159996, "learning_rate": 3.624332627631679e-06, "loss": 0.0763, "loss_nan_ranks": 0, "loss_rank_avg": 0.030285216867923737, "step": 5105, "valid_targets_mean": 2808.2, "valid_targets_min": 773 }, { "epoch": 5.782116581777023, "grad_norm": 0.42014420275176356, "learning_rate": 3.5920114493271974e-06, "loss": 0.0745, "loss_nan_ranks": 0, "loss_rank_avg": 0.025668412446975708, "step": 5110, "valid_targets_mean": 3550.5, "valid_targets_min": 2587 }, { "epoch": 5.787775891341257, "grad_norm": 0.4385807667884832, "learning_rate": 3.5598208100507314e-06, "loss": 0.0847, "loss_nan_ranks": 0, "loss_rank_avg": 0.034961722791194916, "step": 5115, "valid_targets_mean": 2700.6, "valid_targets_min": 773 }, { "epoch": 5.793435200905489, "grad_norm": 0.5285363614611225, "learning_rate": 3.5277609659052712e-06, "loss": 0.0754, "loss_nan_ranks": 0, "loss_rank_avg": 0.037699900567531586, "step": 5120, "valid_targets_mean": 3615.9, "valid_targets_min": 2962 }, { "epoch": 5.799094510469723, "grad_norm": 0.6519064391093398, "learning_rate": 3.4958321719532106e-06, "loss": 0.0807, "loss_nan_ranks": 0, "loss_rank_avg": 0.04379285126924515, "step": 5125, "valid_targets_mean": 1766.6, "valid_targets_min": 649 }, { "epoch": 5.804753820033956, "grad_norm": 0.6115661117657148, "learning_rate": 3.4640346822143324e-06, "loss": 0.0763, "loss_nan_ranks": 0, "loss_rank_avg": 0.0414419025182724, "step": 5130, "valid_targets_mean": 1668.4, "valid_targets_min": 708 }, { "epoch": 5.810413129598189, "grad_norm": 0.4643873227865667, "learning_rate": 3.4323687496637837e-06, "loss": 0.0834, "loss_nan_ranks": 0, "loss_rank_avg": 0.032500360161066055, "step": 5135, "valid_targets_mean": 2129.5, "valid_targets_min": 617 }, { "epoch": 5.816072439162422, "grad_norm": 0.518654839110181, "learning_rate": 3.4008346262300852e-06, "loss": 0.0748, "loss_nan_ranks": 0, "loss_rank_avg": 0.03613649681210518, "step": 5140, "valid_targets_mean": 2495.0, "valid_targets_min": 720 }, { "epoch": 5.8217317487266556, "grad_norm": 0.6468513014194476, "learning_rate": 3.3694325627930846e-06, "loss": 0.0674, "loss_nan_ranks": 0, "loss_rank_avg": 0.04318820685148239, "step": 5145, "valid_targets_mean": 1537.8, "valid_targets_min": 628 }, { "epoch": 5.827391058290889, "grad_norm": 0.6398866548133438, "learning_rate": 3.3381628091819907e-06, "loss": 0.0877, "loss_nan_ranks": 0, "loss_rank_avg": 0.06686189025640488, "step": 5150, "valid_targets_mean": 2155.2, "valid_targets_min": 821 }, { "epoch": 5.8330503678551215, "grad_norm": 0.36439329813722365, "learning_rate": 3.3070256141733913e-06, "loss": 0.0668, "loss_nan_ranks": 0, "loss_rank_avg": 0.020443886518478394, "step": 5155, "valid_targets_mean": 3628.1, "valid_targets_min": 2863 }, { "epoch": 5.838709677419355, "grad_norm": 0.39380579851082065, "learning_rate": 3.2760212254892453e-06, "loss": 0.0663, "loss_nan_ranks": 0, "loss_rank_avg": 0.027335772290825844, "step": 5160, "valid_targets_mean": 3585.2, "valid_targets_min": 1773 }, { "epoch": 5.8443689869835875, "grad_norm": 0.514279348342231, "learning_rate": 3.245149889794932e-06, "loss": 0.0755, "loss_nan_ranks": 0, "loss_rank_avg": 0.04034529626369476, "step": 5165, "valid_targets_mean": 2356.6, "valid_targets_min": 721 }, { "epoch": 5.850028296547821, "grad_norm": 0.39588532237902196, "learning_rate": 3.2144118526972943e-06, "loss": 0.0609, "loss_nan_ranks": 0, "loss_rank_avg": 0.03888987377285957, "step": 5170, "valid_targets_mean": 5092.5, "valid_targets_min": 4222 }, { "epoch": 5.855687606112054, "grad_norm": 0.465672567676084, "learning_rate": 3.1838073587426676e-06, "loss": 0.0612, "loss_nan_ranks": 0, "loss_rank_avg": 0.03602100908756256, "step": 5175, "valid_targets_mean": 4604.0, "valid_targets_min": 2020 }, { "epoch": 5.861346915676288, "grad_norm": 0.3756373975254779, "learning_rate": 3.153336651414933e-06, "loss": 0.079, "loss_nan_ranks": 0, "loss_rank_avg": 0.027616024017333984, "step": 5180, "valid_targets_mean": 3097.9, "valid_targets_min": 739 }, { "epoch": 5.86700622524052, "grad_norm": 0.4149497449655576, "learning_rate": 3.1229999731336137e-06, "loss": 0.0941, "loss_nan_ranks": 0, "loss_rank_avg": 0.03883051872253418, "step": 5185, "valid_targets_mean": 3696.1, "valid_targets_min": 2945 }, { "epoch": 5.872665534804754, "grad_norm": 0.3979753959226805, "learning_rate": 3.0927975652518994e-06, "loss": 0.0713, "loss_nan_ranks": 0, "loss_rank_avg": 0.04112917184829712, "step": 5190, "valid_targets_mean": 3112.8, "valid_targets_min": 704 }, { "epoch": 5.878324844368987, "grad_norm": 0.4099255400951427, "learning_rate": 3.062729668054756e-06, "loss": 0.0797, "loss_nan_ranks": 0, "loss_rank_avg": 0.032986707985401154, "step": 5195, "valid_targets_mean": 2490.9, "valid_targets_min": 774 }, { "epoch": 5.88398415393322, "grad_norm": 0.3941404199714783, "learning_rate": 3.032796520757002e-06, "loss": 0.0904, "loss_nan_ranks": 0, "loss_rank_avg": 0.026263339444994926, "step": 5200, "valid_targets_mean": 2570.2, "valid_targets_min": 485 }, { "epoch": 5.889643463497453, "grad_norm": 0.4427560923548638, "learning_rate": 3.0029983615014234e-06, "loss": 0.0683, "loss_nan_ranks": 0, "loss_rank_avg": 0.03036249428987503, "step": 5205, "valid_targets_mean": 3087.4, "valid_targets_min": 1048 }, { "epoch": 5.895302773061687, "grad_norm": 0.4229599842758237, "learning_rate": 2.9733354273568514e-06, "loss": 0.0739, "loss_nan_ranks": 0, "loss_rank_avg": 0.032209280878305435, "step": 5210, "valid_targets_mean": 2753.6, "valid_targets_min": 722 }, { "epoch": 5.900962082625919, "grad_norm": 0.6532864072235072, "learning_rate": 2.9438079543162914e-06, "loss": 0.0768, "loss_nan_ranks": 0, "loss_rank_avg": 0.050366684794425964, "step": 5215, "valid_targets_mean": 1836.2, "valid_targets_min": 865 }, { "epoch": 5.906621392190153, "grad_norm": 0.5332867595834957, "learning_rate": 2.9144161772950564e-06, "loss": 0.104, "loss_nan_ranks": 0, "loss_rank_avg": 0.03690391033887863, "step": 5220, "valid_targets_mean": 2377.5, "valid_targets_min": 675 }, { "epoch": 5.912280701754386, "grad_norm": 0.4605237897191458, "learning_rate": 2.885160330128871e-06, "loss": 0.0935, "loss_nan_ranks": 0, "loss_rank_avg": 0.03459594398736954, "step": 5225, "valid_targets_mean": 3323.0, "valid_targets_min": 782 }, { "epoch": 5.917940011318619, "grad_norm": 0.4701984376959242, "learning_rate": 2.8560406455720333e-06, "loss": 0.0698, "loss_nan_ranks": 0, "loss_rank_avg": 0.03195595368742943, "step": 5230, "valid_targets_mean": 2581.8, "valid_targets_min": 795 }, { "epoch": 5.923599320882852, "grad_norm": 0.4627978786039704, "learning_rate": 2.8270573552955616e-06, "loss": 0.072, "loss_nan_ranks": 0, "loss_rank_avg": 0.03759005665779114, "step": 5235, "valid_targets_mean": 3264.6, "valid_targets_min": 2017 }, { "epoch": 5.929258630447086, "grad_norm": 0.430552103519957, "learning_rate": 2.798210689885337e-06, "loss": 0.0684, "loss_nan_ranks": 0, "loss_rank_avg": 0.029955577105283737, "step": 5240, "valid_targets_mean": 2319.6, "valid_targets_min": 798 }, { "epoch": 5.934917940011319, "grad_norm": 0.40555015629365276, "learning_rate": 2.7695008788402765e-06, "loss": 0.0606, "loss_nan_ranks": 0, "loss_rank_avg": 0.03208666294813156, "step": 5245, "valid_targets_mean": 3299.6, "valid_targets_min": 860 }, { "epoch": 5.9405772495755516, "grad_norm": 0.45207921980647, "learning_rate": 2.740928150570512e-06, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.03434694558382034, "step": 5250, "valid_targets_mean": 3302.4, "valid_targets_min": 878 }, { "epoch": 5.946236559139785, "grad_norm": 0.36093174555240776, "learning_rate": 2.712492732395575e-06, "loss": 0.062, "loss_nan_ranks": 0, "loss_rank_avg": 0.026369066908955574, "step": 5255, "valid_targets_mean": 3832.2, "valid_targets_min": 2602 }, { "epoch": 5.951895868704018, "grad_norm": 0.526083349405698, "learning_rate": 2.6841948505425765e-06, "loss": 0.0701, "loss_nan_ranks": 0, "loss_rank_avg": 0.04250894486904144, "step": 5260, "valid_targets_mean": 2736.5, "valid_targets_min": 945 }, { "epoch": 5.957555178268251, "grad_norm": 0.5557462391969753, "learning_rate": 2.6560347301444035e-06, "loss": 0.0692, "loss_nan_ranks": 0, "loss_rank_avg": 0.04651749134063721, "step": 5265, "valid_targets_mean": 3831.1, "valid_targets_min": 3128 }, { "epoch": 5.963214487832484, "grad_norm": 0.49222443878858035, "learning_rate": 2.6280125952379567e-06, "loss": 0.0727, "loss_nan_ranks": 0, "loss_rank_avg": 0.038196124136447906, "step": 5270, "valid_targets_mean": 3966.2, "valid_targets_min": 2529 }, { "epoch": 5.968873797396718, "grad_norm": 0.4384145557882011, "learning_rate": 2.6001286687623382e-06, "loss": 0.0623, "loss_nan_ranks": 0, "loss_rank_avg": 0.042362622916698456, "step": 5275, "valid_targets_mean": 4704.8, "valid_targets_min": 892 }, { "epoch": 5.97453310696095, "grad_norm": 0.33561436487922225, "learning_rate": 2.5723831725570848e-06, "loss": 0.068, "loss_nan_ranks": 0, "loss_rank_avg": 0.024302612990140915, "step": 5280, "valid_targets_mean": 4471.1, "valid_targets_min": 1657 }, { "epoch": 5.980192416525184, "grad_norm": 0.6312166327590963, "learning_rate": 2.544776327360419e-06, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.10875210165977478, "step": 5285, "valid_targets_mean": 1989.8, "valid_targets_min": 709 }, { "epoch": 5.985851726089417, "grad_norm": 0.45996404344118175, "learning_rate": 2.5173083528074683e-06, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.024792591109871864, "step": 5290, "valid_targets_mean": 3226.5, "valid_targets_min": 527 }, { "epoch": 5.99151103565365, "grad_norm": 0.4127218758642255, "learning_rate": 2.489979467428532e-06, "loss": 0.0742, "loss_nan_ranks": 0, "loss_rank_avg": 0.03901390731334686, "step": 5295, "valid_targets_mean": 3531.0, "valid_targets_min": 2318 }, { "epoch": 5.997170345217883, "grad_norm": 0.3788285488600974, "learning_rate": 2.4627898886473522e-06, "loss": 0.0656, "loss_nan_ranks": 0, "loss_rank_avg": 0.03326011449098587, "step": 5300, "valid_targets_mean": 3520.9, "valid_targets_min": 2883 }, { "epoch": 6.002263723825693, "grad_norm": 0.8276101671544355, "learning_rate": 2.435739832779358e-06, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.07999004423618317, "step": 5305, "valid_targets_mean": 5904.0, "valid_targets_min": 4967 }, { "epoch": 6.007923033389926, "grad_norm": 0.7277283379257201, "learning_rate": 2.408829515029969e-06, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.09332052618265152, "step": 5310, "valid_targets_mean": 8641.4, "valid_targets_min": 5164 }, { "epoch": 6.01358234295416, "grad_norm": 0.5823805300569702, "learning_rate": 2.3820591494928635e-06, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.07082702219486237, "step": 5315, "valid_targets_mean": 6838.2, "valid_targets_min": 5200 }, { "epoch": 6.019241652518393, "grad_norm": 0.5016261384059876, "learning_rate": 2.3554289491482996e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.060256391763687134, "step": 5320, "valid_targets_mean": 5411.6, "valid_targets_min": 3853 }, { "epoch": 6.024900962082626, "grad_norm": 0.49029420602885754, "learning_rate": 2.3289391258613938e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.08309821784496307, "step": 5325, "valid_targets_mean": 5598.0, "valid_targets_min": 4669 }, { "epoch": 6.030560271646859, "grad_norm": 0.4696599875799638, "learning_rate": 2.3025898903804467e-06, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.07830261439085007, "step": 5330, "valid_targets_mean": 5953.0, "valid_targets_min": 4216 }, { "epoch": 6.036219581211093, "grad_norm": 0.4406152488917964, "learning_rate": 2.276381452335281e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.07636751979589462, "step": 5335, "valid_targets_mean": 5914.0, "valid_targets_min": 4589 }, { "epoch": 6.041878890775325, "grad_norm": 0.43789300649461604, "learning_rate": 2.2503140202355488e-06, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.07406055927276611, "step": 5340, "valid_targets_mean": 6515.4, "valid_targets_min": 4588 }, { "epoch": 6.047538200339559, "grad_norm": 0.39488092916617257, "learning_rate": 2.2243878014690834e-06, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.06888176500797272, "step": 5345, "valid_targets_mean": 7015.2, "valid_targets_min": 4530 }, { "epoch": 6.053197509903792, "grad_norm": 0.4131437929720812, "learning_rate": 2.1986030023002568e-06, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.08051659166812897, "step": 5350, "valid_targets_mean": 6202.6, "valid_targets_min": 4837 }, { "epoch": 6.058856819468025, "grad_norm": 0.5157470699606653, "learning_rate": 2.1729598278683264e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.04698694124817848, "step": 5355, "valid_targets_mean": 1720.9, "valid_targets_min": 229 }, { "epoch": 6.064516129032258, "grad_norm": 0.41192059594925284, "learning_rate": 2.147458482185807e-06, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.07047378271818161, "step": 5360, "valid_targets_mean": 5963.8, "valid_targets_min": 4216 }, { "epoch": 6.0701754385964914, "grad_norm": 0.4097676600547405, "learning_rate": 2.122099168136862e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.06870923936367035, "step": 5365, "valid_targets_mean": 5973.9, "valid_targets_min": 4835 }, { "epoch": 6.075834748160724, "grad_norm": 0.4826017757756714, "learning_rate": 2.0968820874756625e-06, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.06461106240749359, "step": 5370, "valid_targets_mean": 6669.8, "valid_targets_min": 4995 }, { "epoch": 6.081494057724957, "grad_norm": 0.4783505134049246, "learning_rate": 2.0718074408247955e-06, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.08431711792945862, "step": 5375, "valid_targets_mean": 5705.5, "valid_targets_min": 4108 }, { "epoch": 6.087153367289191, "grad_norm": 0.4603266617125913, "learning_rate": 2.0468754276736823e-06, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.09027671068906784, "step": 5380, "valid_targets_mean": 6594.0, "valid_targets_min": 4527 }, { "epoch": 6.092812676853424, "grad_norm": 0.4668190929700467, "learning_rate": 2.0220862463769665e-06, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.08130667358636856, "step": 5385, "valid_targets_mean": 3100.9, "valid_targets_min": 2104 }, { "epoch": 6.098471986417657, "grad_norm": 0.4161670035323307, "learning_rate": 1.9974400941529493e-06, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.06128064543008804, "step": 5390, "valid_targets_mean": 5817.8, "valid_targets_min": 4757 }, { "epoch": 6.10413129598189, "grad_norm": 0.49506290970705313, "learning_rate": 1.972937167082014e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.08566483855247498, "step": 5395, "valid_targets_mean": 6333.0, "valid_targets_min": 5056 }, { "epoch": 6.109790605546124, "grad_norm": 0.40345628118169874, "learning_rate": 1.948577660105082e-06, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.06584078073501587, "step": 5400, "valid_targets_mean": 5956.0, "valid_targets_min": 2834 }, { "epoch": 6.115449915110356, "grad_norm": 0.42809149020646353, "learning_rate": 1.924361767022038e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.10012775659561157, "step": 5405, "valid_targets_mean": 6984.6, "valid_targets_min": 5744 }, { "epoch": 6.12110922467459, "grad_norm": 0.3948106402931891, "learning_rate": 1.9002896804902039e-06, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.0651889443397522, "step": 5410, "valid_targets_mean": 7290.2, "valid_targets_min": 5640 }, { "epoch": 6.126768534238823, "grad_norm": 0.423531309091551, "learning_rate": 1.8763615920228084e-06, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.0684753954410553, "step": 5415, "valid_targets_mean": 7036.0, "valid_targets_min": 5210 }, { "epoch": 6.132427843803056, "grad_norm": 0.4567806851439878, "learning_rate": 1.8525776919874472e-06, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.09491011500358582, "step": 5420, "valid_targets_mean": 7138.5, "valid_targets_min": 5292 }, { "epoch": 6.138087153367289, "grad_norm": 0.46052185078926156, "learning_rate": 1.8289381696045817e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.0801386907696724, "step": 5425, "valid_targets_mean": 6134.2, "valid_targets_min": 3531 }, { "epoch": 6.143746462931523, "grad_norm": 0.4369176855135763, "learning_rate": 1.8054432129460386e-06, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.08043287694454193, "step": 5430, "valid_targets_mean": 5968.2, "valid_targets_min": 4640 }, { "epoch": 6.149405772495755, "grad_norm": 0.41376792180743177, "learning_rate": 1.7820930089334965e-06, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.07278323173522949, "step": 5435, "valid_targets_mean": 6249.6, "valid_targets_min": 4328 }, { "epoch": 6.155065082059989, "grad_norm": 0.45569587335080425, "learning_rate": 1.7588877433370076e-06, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.08063621819019318, "step": 5440, "valid_targets_mean": 6002.4, "valid_targets_min": 3123 }, { "epoch": 6.160724391624222, "grad_norm": 0.4192478296963226, "learning_rate": 1.7358276007735276e-06, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.07261161506175995, "step": 5445, "valid_targets_mean": 6372.2, "valid_targets_min": 4256 }, { "epoch": 6.166383701188455, "grad_norm": 0.44113680036675645, "learning_rate": 1.71291276470543e-06, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.08018209040164948, "step": 5450, "valid_targets_mean": 5927.8, "valid_targets_min": 4753 }, { "epoch": 6.172043010752688, "grad_norm": 0.42289106743705024, "learning_rate": 1.6901434174390652e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.07243598997592926, "step": 5455, "valid_targets_mean": 6106.1, "valid_targets_min": 5370 }, { "epoch": 6.1777023203169215, "grad_norm": 0.46180892618572433, "learning_rate": 1.6675197401232869e-06, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.08281978964805603, "step": 5460, "valid_targets_mean": 6240.6, "valid_targets_min": 4608 }, { "epoch": 6.183361629881155, "grad_norm": 0.44905545436226685, "learning_rate": 1.6450419127480422e-06, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.06940460205078125, "step": 5465, "valid_targets_mean": 5733.2, "valid_targets_min": 3801 }, { "epoch": 6.1890209394453874, "grad_norm": 0.42405331723647666, "learning_rate": 1.6227101141429114e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.07862474769353867, "step": 5470, "valid_targets_mean": 6430.1, "valid_targets_min": 4754 }, { "epoch": 6.194680249009621, "grad_norm": 0.3636777740153316, "learning_rate": 1.6005245219756927e-06, "loss": 0.1292, "loss_nan_ranks": 0, "loss_rank_avg": 0.05749621242284775, "step": 5475, "valid_targets_mean": 7375.2, "valid_targets_min": 6417 }, { "epoch": 6.200339558573854, "grad_norm": 0.5059615557907053, "learning_rate": 1.5784853127510058e-06, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.08089186251163483, "step": 5480, "valid_targets_mean": 6281.0, "valid_targets_min": 3468 }, { "epoch": 6.205998868138087, "grad_norm": 0.41804768443087675, "learning_rate": 1.5565926618088578e-06, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.07407131791114807, "step": 5485, "valid_targets_mean": 6532.4, "valid_targets_min": 5221 }, { "epoch": 6.21165817770232, "grad_norm": 0.4444679373526541, "learning_rate": 1.5348467433232728e-06, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.06167688965797424, "step": 5490, "valid_targets_mean": 5552.6, "valid_targets_min": 4438 }, { "epoch": 6.217317487266554, "grad_norm": 0.4344700346800421, "learning_rate": 1.5132477303009018e-06, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.07731674611568451, "step": 5495, "valid_targets_mean": 5878.1, "valid_targets_min": 3915 }, { "epoch": 6.222976796830786, "grad_norm": 0.37175162900794195, "learning_rate": 1.4917957945796313e-06, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.056854572147130966, "step": 5500, "valid_targets_mean": 7082.6, "valid_targets_min": 4135 }, { "epoch": 6.22863610639502, "grad_norm": 0.4519834892138903, "learning_rate": 1.4704911068272366e-06, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.07420016825199127, "step": 5505, "valid_targets_mean": 5936.4, "valid_targets_min": 3947 }, { "epoch": 6.234295415959253, "grad_norm": 0.42474375595243313, "learning_rate": 1.4493338365400034e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.0952538400888443, "step": 5510, "valid_targets_mean": 6836.2, "valid_targets_min": 4865 }, { "epoch": 6.239954725523486, "grad_norm": 0.4019485048337539, "learning_rate": 1.428324152041407e-06, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.07246479392051697, "step": 5515, "valid_targets_mean": 6539.4, "valid_targets_min": 4643 }, { "epoch": 6.245614035087719, "grad_norm": 0.3932962802175302, "learning_rate": 1.407462220480742e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.07242302596569061, "step": 5520, "valid_targets_mean": 6613.6, "valid_targets_min": 4959 }, { "epoch": 6.251273344651953, "grad_norm": 0.6506279406434788, "learning_rate": 1.3867482078318095e-06, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.07954353094100952, "step": 5525, "valid_targets_mean": 6044.1, "valid_targets_min": 4652 }, { "epoch": 6.256932654216186, "grad_norm": 0.40380824614409955, "learning_rate": 1.3661822788916013e-06, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.06269079446792603, "step": 5530, "valid_targets_mean": 5893.9, "valid_targets_min": 4938 }, { "epoch": 6.262591963780419, "grad_norm": 0.39519519121780683, "learning_rate": 1.3457645972789778e-06, "loss": 0.1245, "loss_nan_ranks": 0, "loss_rank_avg": 0.05853109061717987, "step": 5535, "valid_targets_mean": 5849.6, "valid_targets_min": 4546 }, { "epoch": 6.268251273344652, "grad_norm": 0.39750633755202286, "learning_rate": 1.3254953254333613e-06, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.06598692387342453, "step": 5540, "valid_targets_mean": 5751.5, "valid_targets_min": 3200 }, { "epoch": 6.2739105829088855, "grad_norm": 0.44355431281874347, "learning_rate": 1.305374624613469e-06, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.07301096618175507, "step": 5545, "valid_targets_mean": 6149.6, "valid_targets_min": 5010 }, { "epoch": 6.279569892473118, "grad_norm": 0.44465882297781856, "learning_rate": 1.285402654896004e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.08430242538452148, "step": 5550, "valid_targets_mean": 6551.2, "valid_targets_min": 4904 }, { "epoch": 6.2852292020373515, "grad_norm": 0.5270225139071596, "learning_rate": 1.265579575174387e-06, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.10046619921922684, "step": 5555, "valid_targets_mean": 5728.9, "valid_targets_min": 4812 }, { "epoch": 6.290888511601585, "grad_norm": 0.4452621705044153, "learning_rate": 1.245905543157504e-06, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.059191398322582245, "step": 5560, "valid_targets_mean": 5047.9, "valid_targets_min": 3629 }, { "epoch": 6.2965478211658175, "grad_norm": 0.429665256933034, "learning_rate": 1.2263807153684448e-06, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.07235387712717056, "step": 5565, "valid_targets_mean": 6260.0, "valid_targets_min": 4324 }, { "epoch": 6.302207130730051, "grad_norm": 0.3831745381517681, "learning_rate": 1.2070052471432535e-06, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.0637582391500473, "step": 5570, "valid_targets_mean": 7853.1, "valid_targets_min": 4920 }, { "epoch": 6.307866440294284, "grad_norm": 0.4395856940321014, "learning_rate": 1.1877792926296893e-06, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.07045142352581024, "step": 5575, "valid_targets_mean": 6231.0, "valid_targets_min": 4882 }, { "epoch": 6.313525749858517, "grad_norm": 0.4357912902955703, "learning_rate": 1.1687030047860248e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.06981360912322998, "step": 5580, "valid_targets_mean": 7472.9, "valid_targets_min": 3943 }, { "epoch": 6.31918505942275, "grad_norm": 0.447350489255607, "learning_rate": 1.1497765353797963e-06, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.07825092226266861, "step": 5585, "valid_targets_mean": 6840.2, "valid_targets_min": 5034 }, { "epoch": 6.324844368986984, "grad_norm": 0.42778721008696324, "learning_rate": 1.1310000349866136e-06, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.07604715973138809, "step": 5590, "valid_targets_mean": 6458.5, "valid_targets_min": 4461 }, { "epoch": 6.330503678551217, "grad_norm": 0.3928420540685352, "learning_rate": 1.1123736529889674e-06, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.06796157360076904, "step": 5595, "valid_targets_mean": 6645.4, "valid_targets_min": 5188 }, { "epoch": 6.33616298811545, "grad_norm": 0.40726225641199704, "learning_rate": 1.093897537575026e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.07839426398277283, "step": 5600, "valid_targets_mean": 6002.9, "valid_targets_min": 5009 }, { "epoch": 6.341822297679683, "grad_norm": 0.5197824268371312, "learning_rate": 1.075571835737459e-06, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.08284924924373627, "step": 5605, "valid_targets_mean": 6025.9, "valid_targets_min": 4551 }, { "epoch": 6.347481607243917, "grad_norm": 0.37406341479037775, "learning_rate": 1.0573966932722902e-06, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.07350446283817291, "step": 5610, "valid_targets_mean": 7210.0, "valid_targets_min": 4492 }, { "epoch": 6.353140916808149, "grad_norm": 0.41816122930943833, "learning_rate": 1.039372254777702e-06, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.07028060406446457, "step": 5615, "valid_targets_mean": 7051.4, "valid_targets_min": 4718 }, { "epoch": 6.358800226372383, "grad_norm": 0.4298009833839158, "learning_rate": 1.0214986636529112e-06, "loss": 0.1463, "loss_nan_ranks": 0, "loss_rank_avg": 0.0760362297296524, "step": 5620, "valid_targets_mean": 6686.0, "valid_targets_min": 4827 }, { "epoch": 6.364459535936616, "grad_norm": 0.406689242569645, "learning_rate": 1.003776062097015e-06, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.05693672597408295, "step": 5625, "valid_targets_mean": 5311.9, "valid_targets_min": 3828 }, { "epoch": 6.370118845500849, "grad_norm": 0.38227984996431297, "learning_rate": 9.862045911078733e-07, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.061227746307849884, "step": 5630, "valid_targets_mean": 7078.9, "valid_targets_min": 4594 }, { "epoch": 6.375778155065082, "grad_norm": 0.44431979959785317, "learning_rate": 9.687843904809725e-07, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.061648838222026825, "step": 5635, "valid_targets_mean": 6393.8, "valid_targets_min": 4509 }, { "epoch": 6.3814374646293155, "grad_norm": 0.43153627059991495, "learning_rate": 9.515155988083125e-07, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.08048129826784134, "step": 5640, "valid_targets_mean": 7848.9, "valid_targets_min": 5649 }, { "epoch": 6.387096774193548, "grad_norm": 0.4032728817369529, "learning_rate": 9.343983534773238e-07, "loss": 0.1326, "loss_nan_ranks": 0, "loss_rank_avg": 0.061408888548612595, "step": 5645, "valid_targets_mean": 6623.4, "valid_targets_min": 4343 }, { "epoch": 6.3927560837577815, "grad_norm": 0.42777057592335804, "learning_rate": 9.174327906697522e-07, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.06570357084274292, "step": 5650, "valid_targets_mean": 6255.9, "valid_targets_min": 4660 }, { "epoch": 6.398415393322015, "grad_norm": 0.413587497444861, "learning_rate": 9.006190453605867e-07, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.06969091296195984, "step": 5655, "valid_targets_mean": 8243.0, "valid_targets_min": 6281 }, { "epoch": 6.4040747028862475, "grad_norm": 0.3967725258563214, "learning_rate": 8.839572513169869e-07, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.06824289262294769, "step": 5660, "valid_targets_mean": 7083.5, "valid_targets_min": 4657 }, { "epoch": 6.409734012450481, "grad_norm": 0.45270305332037425, "learning_rate": 8.674475410972083e-07, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.08294831961393356, "step": 5665, "valid_targets_mean": 6399.8, "valid_targets_min": 5098 }, { "epoch": 6.415393322014714, "grad_norm": 0.48113155918133693, "learning_rate": 8.510900460495608e-07, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.08184739202260971, "step": 5670, "valid_targets_mean": 5257.4, "valid_targets_min": 1879 }, { "epoch": 6.421052631578947, "grad_norm": 0.462237732588396, "learning_rate": 8.348848963113498e-07, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.07992422580718994, "step": 5675, "valid_targets_mean": 5260.5, "valid_targets_min": 3619 }, { "epoch": 6.42671194114318, "grad_norm": 0.4376210559352717, "learning_rate": 8.188322208078614e-07, "loss": 0.1087, "loss_nan_ranks": 0, "loss_rank_avg": 0.049073681235313416, "step": 5680, "valid_targets_mean": 3976.1, "valid_targets_min": 3545 }, { "epoch": 6.432371250707414, "grad_norm": 0.4443761443952523, "learning_rate": 8.02932147251314e-07, "loss": 0.0764, "loss_nan_ranks": 0, "loss_rank_avg": 0.03434424102306366, "step": 5685, "valid_targets_mean": 3099.4, "valid_targets_min": 1024 }, { "epoch": 6.438030560271647, "grad_norm": 0.3292086681702203, "learning_rate": 7.87184802139851e-07, "loss": 0.0687, "loss_nan_ranks": 0, "loss_rank_avg": 0.021340861916542053, "step": 5690, "valid_targets_mean": 3441.1, "valid_targets_min": 2927 }, { "epoch": 6.44368986983588, "grad_norm": 0.495630018274138, "learning_rate": 7.715903107565426e-07, "loss": 0.0866, "loss_nan_ranks": 0, "loss_rank_avg": 0.05481220781803131, "step": 5695, "valid_targets_mean": 3442.0, "valid_targets_min": 2213 }, { "epoch": 6.449349179400113, "grad_norm": 0.4498586504819099, "learning_rate": 7.56148797168379e-07, "loss": 0.0712, "loss_nan_ranks": 0, "loss_rank_avg": 0.04381895810365677, "step": 5700, "valid_targets_mean": 2907.4, "valid_targets_min": 1134 }, { "epoch": 6.455008488964347, "grad_norm": 0.47457148843186153, "learning_rate": 7.408603842252837e-07, "loss": 0.0749, "loss_nan_ranks": 0, "loss_rank_avg": 0.045509450137615204, "step": 5705, "valid_targets_mean": 2523.4, "valid_targets_min": 663 }, { "epoch": 6.460667798528579, "grad_norm": 0.6923423608886543, "learning_rate": 7.257251935591436e-07, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.055727388709783554, "step": 5710, "valid_targets_mean": 1893.8, "valid_targets_min": 535 }, { "epoch": 6.466327108092813, "grad_norm": 0.4086302890491953, "learning_rate": 7.107433455828317e-07, "loss": 0.0738, "loss_nan_ranks": 0, "loss_rank_avg": 0.030361641198396683, "step": 5715, "valid_targets_mean": 1971.8, "valid_targets_min": 811 }, { "epoch": 6.471986417657046, "grad_norm": 0.490315949097002, "learning_rate": 6.959149594892567e-07, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.0521058514714241, "step": 5720, "valid_targets_mean": 2785.5, "valid_targets_min": 2392 }, { "epoch": 6.477645727221279, "grad_norm": 0.28307075878357413, "learning_rate": 6.812401532504109e-07, "loss": 0.0933, "loss_nan_ranks": 0, "loss_rank_avg": 0.022131290286779404, "step": 5725, "valid_targets_mean": 4540.6, "valid_targets_min": 3285 }, { "epoch": 6.483305036785512, "grad_norm": 0.36605418977499043, "learning_rate": 6.667190436164351e-07, "loss": 0.0688, "loss_nan_ranks": 0, "loss_rank_avg": 0.03333090618252754, "step": 5730, "valid_targets_mean": 2926.8, "valid_targets_min": 764 }, { "epoch": 6.4889643463497455, "grad_norm": 0.3792739889735828, "learning_rate": 6.523517461146856e-07, "loss": 0.072, "loss_nan_ranks": 0, "loss_rank_avg": 0.03842036426067352, "step": 5735, "valid_targets_mean": 3378.6, "valid_targets_min": 1290 }, { "epoch": 6.494623655913978, "grad_norm": 0.5005953776912583, "learning_rate": 6.381383750488113e-07, "loss": 0.0693, "loss_nan_ranks": 0, "loss_rank_avg": 0.03875945508480072, "step": 5740, "valid_targets_mean": 2432.4, "valid_targets_min": 720 }, { "epoch": 6.5002829654782115, "grad_norm": 0.3298347107591839, "learning_rate": 6.240790434978628e-07, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.031254325062036514, "step": 5745, "valid_targets_mean": 3896.0, "valid_targets_min": 2336 }, { "epoch": 6.505942275042445, "grad_norm": 0.363089484382129, "learning_rate": 6.101738633153686e-07, "loss": 0.0653, "loss_nan_ranks": 0, "loss_rank_avg": 0.03155246376991272, "step": 5750, "valid_targets_mean": 2912.5, "valid_targets_min": 1049 }, { "epoch": 6.511601584606678, "grad_norm": 0.3590771499282617, "learning_rate": 5.964229451284586e-07, "loss": 0.073, "loss_nan_ranks": 0, "loss_rank_avg": 0.02306312322616577, "step": 5755, "valid_targets_mean": 3087.8, "valid_targets_min": 1086 }, { "epoch": 6.517260894170911, "grad_norm": 0.3892052060779421, "learning_rate": 5.828263983369864e-07, "loss": 0.0605, "loss_nan_ranks": 0, "loss_rank_avg": 0.03467557579278946, "step": 5760, "valid_targets_mean": 3296.5, "valid_targets_min": 732 }, { "epoch": 6.522920203735144, "grad_norm": 0.6316138887211705, "learning_rate": 5.693843311126523e-07, "loss": 0.0811, "loss_nan_ranks": 0, "loss_rank_avg": 0.04579807072877884, "step": 5765, "valid_targets_mean": 1688.5, "valid_targets_min": 770 }, { "epoch": 6.528579513299378, "grad_norm": 0.42657241895095116, "learning_rate": 5.560968503981378e-07, "loss": 0.0757, "loss_nan_ranks": 0, "loss_rank_avg": 0.03341136872768402, "step": 5770, "valid_targets_mean": 2574.8, "valid_targets_min": 592 }, { "epoch": 6.53423882286361, "grad_norm": 0.46142186165107835, "learning_rate": 5.429640619062726e-07, "loss": 0.0851, "loss_nan_ranks": 0, "loss_rank_avg": 0.04054953530430794, "step": 5775, "valid_targets_mean": 3089.1, "valid_targets_min": 2224 }, { "epoch": 6.539898132427844, "grad_norm": 0.4493689812933997, "learning_rate": 5.299860701191772e-07, "loss": 0.0827, "loss_nan_ranks": 0, "loss_rank_avg": 0.029141142964363098, "step": 5780, "valid_targets_mean": 2364.5, "valid_targets_min": 511 }, { "epoch": 6.545557441992077, "grad_norm": 0.43790299984161335, "learning_rate": 5.171629782874354e-07, "loss": 0.1145, "loss_nan_ranks": 0, "loss_rank_avg": 0.04518071562051773, "step": 5785, "valid_targets_mean": 3775.5, "valid_targets_min": 2328 }, { "epoch": 6.55121675155631, "grad_norm": 0.42124865037915415, "learning_rate": 5.044948884292766e-07, "loss": 0.0643, "loss_nan_ranks": 0, "loss_rank_avg": 0.02882300317287445, "step": 5790, "valid_targets_mean": 2867.1, "valid_targets_min": 669 }, { "epoch": 6.556876061120543, "grad_norm": 0.6751482529617706, "learning_rate": 4.919819013297677e-07, "loss": 0.0882, "loss_nan_ranks": 0, "loss_rank_avg": 0.0536501370370388, "step": 5795, "valid_targets_mean": 1722.5, "valid_targets_min": 802 }, { "epoch": 6.562535370684777, "grad_norm": 0.6476380988588636, "learning_rate": 4.796241165399939e-07, "loss": 0.0904, "loss_nan_ranks": 0, "loss_rank_avg": 0.051889095455408096, "step": 5800, "valid_targets_mean": 1527.9, "valid_targets_min": 357 }, { "epoch": 6.568194680249009, "grad_norm": 0.442176682737924, "learning_rate": 4.674216323762881e-07, "loss": 0.0801, "loss_nan_ranks": 0, "loss_rank_avg": 0.035727713257074356, "step": 5805, "valid_targets_mean": 3831.6, "valid_targets_min": 2808 }, { "epoch": 6.573853989813243, "grad_norm": 0.5479385584946559, "learning_rate": 4.5537454591943584e-07, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.11486173421144485, "step": 5810, "valid_targets_mean": 2953.2, "valid_targets_min": 652 }, { "epoch": 6.579513299377476, "grad_norm": 0.41350133265317146, "learning_rate": 4.434829530139095e-07, "loss": 0.2022, "loss_nan_ranks": 0, "loss_rank_avg": 0.04003699868917465, "step": 5815, "valid_targets_mean": 3963.6, "valid_targets_min": 3573 }, { "epoch": 6.5851726089417095, "grad_norm": 0.5482015029259201, "learning_rate": 4.3174694826709107e-07, "loss": 0.0839, "loss_nan_ranks": 0, "loss_rank_avg": 0.045565806329250336, "step": 5820, "valid_targets_mean": 2137.1, "valid_targets_min": 822 }, { "epoch": 6.590831918505942, "grad_norm": 0.6080484811075969, "learning_rate": 4.201666250485503e-07, "loss": 0.1027, "loss_nan_ranks": 0, "loss_rank_avg": 0.14063608646392822, "step": 5825, "valid_targets_mean": 2582.1, "valid_targets_min": 965 }, { "epoch": 6.5964912280701755, "grad_norm": 0.4073205411029621, "learning_rate": 4.087420754892635e-07, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.03254256024956703, "step": 5830, "valid_targets_mean": 4182.0, "valid_targets_min": 636 }, { "epoch": 6.602150537634409, "grad_norm": 0.4394219118655527, "learning_rate": 3.9747339048091136e-07, "loss": 0.0726, "loss_nan_ranks": 0, "loss_rank_avg": 0.05536698177456856, "step": 5835, "valid_targets_mean": 4735.0, "valid_targets_min": 2733 }, { "epoch": 6.6078098471986415, "grad_norm": 0.43545501648190743, "learning_rate": 3.863606596751379e-07, "loss": 0.0746, "loss_nan_ranks": 0, "loss_rank_avg": 0.046722978353500366, "step": 5840, "valid_targets_mean": 4307.1, "valid_targets_min": 2571 }, { "epoch": 6.613469156762875, "grad_norm": 0.32601803243775, "learning_rate": 3.7540397148284837e-07, "loss": 0.0732, "loss_nan_ranks": 0, "loss_rank_avg": 0.025708980858325958, "step": 5845, "valid_targets_mean": 3207.2, "valid_targets_min": 970 }, { "epoch": 6.619128466327108, "grad_norm": 0.3599900965727607, "learning_rate": 3.6460341307349653e-07, "loss": 0.0688, "loss_nan_ranks": 0, "loss_rank_avg": 0.027514172717928886, "step": 5850, "valid_targets_mean": 2923.8, "valid_targets_min": 748 }, { "epoch": 6.624787775891341, "grad_norm": 0.44324928927827856, "learning_rate": 3.539590703743967e-07, "loss": 0.0679, "loss_nan_ranks": 0, "loss_rank_avg": 0.041861265897750854, "step": 5855, "valid_targets_mean": 3834.1, "valid_targets_min": 3568 }, { "epoch": 6.630447085455574, "grad_norm": 0.5158990365964071, "learning_rate": 3.434710280700415e-07, "loss": 0.0713, "loss_nan_ranks": 0, "loss_rank_avg": 0.039465367794036865, "step": 5860, "valid_targets_mean": 2406.8, "valid_targets_min": 1820 }, { "epoch": 6.636106395019808, "grad_norm": 0.4050936034477056, "learning_rate": 3.331393696014207e-07, "loss": 0.0597, "loss_nan_ranks": 0, "loss_rank_avg": 0.03890451416373253, "step": 5865, "valid_targets_mean": 2587.6, "valid_targets_min": 772 }, { "epoch": 6.64176570458404, "grad_norm": 0.5110258826615129, "learning_rate": 3.22964177165368e-07, "loss": 0.1122, "loss_nan_ranks": 0, "loss_rank_avg": 0.05033072829246521, "step": 5870, "valid_targets_mean": 3260.0, "valid_targets_min": 1289 }, { "epoch": 6.647425014148274, "grad_norm": 0.40885125808704265, "learning_rate": 3.129455317138952e-07, "loss": 0.0538, "loss_nan_ranks": 0, "loss_rank_avg": 0.02987043187022209, "step": 5875, "valid_targets_mean": 3723.0, "valid_targets_min": 3122 }, { "epoch": 6.653084323712507, "grad_norm": 0.38109335536839384, "learning_rate": 3.030835129535592e-07, "loss": 0.0619, "loss_nan_ranks": 0, "loss_rank_avg": 0.03285347670316696, "step": 5880, "valid_targets_mean": 3712.5, "valid_targets_min": 1451 }, { "epoch": 6.658743633276741, "grad_norm": 0.420283639227681, "learning_rate": 2.9337819934481814e-07, "loss": 0.0609, "loss_nan_ranks": 0, "loss_rank_avg": 0.03552892059087753, "step": 5885, "valid_targets_mean": 3632.8, "valid_targets_min": 792 }, { "epoch": 6.664402942840973, "grad_norm": 0.5249883860736148, "learning_rate": 2.838296681014185e-07, "loss": 0.077, "loss_nan_ranks": 0, "loss_rank_avg": 0.03367924317717552, "step": 5890, "valid_targets_mean": 1992.4, "valid_targets_min": 795 }, { "epoch": 6.670062252405207, "grad_norm": 0.39437654832589936, "learning_rate": 2.744379951897691e-07, "loss": 0.0921, "loss_nan_ranks": 0, "loss_rank_avg": 0.034002915024757385, "step": 5895, "valid_targets_mean": 3431.4, "valid_targets_min": 1196 }, { "epoch": 6.67572156196944, "grad_norm": 0.5991953850107175, "learning_rate": 2.65203255328339e-07, "loss": 0.0919, "loss_nan_ranks": 0, "loss_rank_avg": 0.03567385673522949, "step": 5900, "valid_targets_mean": 1836.1, "valid_targets_min": 575 }, { "epoch": 6.681380871533673, "grad_norm": 0.7020941398300836, "learning_rate": 2.561255219870762e-07, "loss": 0.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.05443864315748215, "step": 5905, "valid_targets_mean": 1908.8, "valid_targets_min": 609 }, { "epoch": 6.687040181097906, "grad_norm": 0.5464404537690308, "learning_rate": 2.472048673868033e-07, "loss": 0.0861, "loss_nan_ranks": 0, "loss_rank_avg": 0.02943640947341919, "step": 5910, "valid_targets_mean": 1497.2, "valid_targets_min": 542 }, { "epoch": 6.6926994906621395, "grad_norm": 0.3661819024596803, "learning_rate": 2.3844136249865367e-07, "loss": 0.1018, "loss_nan_ranks": 0, "loss_rank_avg": 0.03263043984770775, "step": 5915, "valid_targets_mean": 3701.8, "valid_targets_min": 2440 }, { "epoch": 6.698358800226372, "grad_norm": 0.4550654896101805, "learning_rate": 2.2983507704351426e-07, "loss": 0.0753, "loss_nan_ranks": 0, "loss_rank_avg": 0.02765018306672573, "step": 5920, "valid_targets_mean": 1648.2, "valid_targets_min": 629 }, { "epoch": 6.7040181097906055, "grad_norm": 0.4137364782748426, "learning_rate": 2.213860794914524e-07, "loss": 0.093, "loss_nan_ranks": 0, "loss_rank_avg": 0.038274720311164856, "step": 5925, "valid_targets_mean": 3953.0, "valid_targets_min": 3701 }, { "epoch": 6.709677419354839, "grad_norm": 0.5146684136695984, "learning_rate": 2.1309443706118538e-07, "loss": 0.0749, "loss_nan_ranks": 0, "loss_rank_avg": 0.03469971567392349, "step": 5930, "valid_targets_mean": 1700.9, "valid_targets_min": 485 }, { "epoch": 6.7153367289190715, "grad_norm": 0.49679016274514903, "learning_rate": 2.049602157195363e-07, "loss": 0.0752, "loss_nan_ranks": 0, "loss_rank_avg": 0.0654388889670372, "step": 5935, "valid_targets_mean": 2381.9, "valid_targets_min": 605 }, { "epoch": 6.720996038483305, "grad_norm": 0.351424709328263, "learning_rate": 1.9698348018092338e-07, "loss": 0.0648, "loss_nan_ranks": 0, "loss_rank_avg": 0.025245461612939835, "step": 5940, "valid_targets_mean": 2713.5, "valid_targets_min": 848 }, { "epoch": 6.726655348047538, "grad_norm": 0.35432740168743526, "learning_rate": 1.8916429390682944e-07, "loss": 0.0647, "loss_nan_ranks": 0, "loss_rank_avg": 0.031980741769075394, "step": 5945, "valid_targets_mean": 5106.4, "valid_targets_min": 4456 }, { "epoch": 6.732314657611772, "grad_norm": 0.40381665509366593, "learning_rate": 1.8150271910530204e-07, "loss": 0.068, "loss_nan_ranks": 0, "loss_rank_avg": 0.040590934455394745, "step": 5950, "valid_targets_mean": 3905.5, "valid_targets_min": 1864 }, { "epoch": 6.737973967176004, "grad_norm": 0.5014073985393658, "learning_rate": 1.7399881673046736e-07, "loss": 0.0797, "loss_nan_ranks": 0, "loss_rank_avg": 0.03374318778514862, "step": 5955, "valid_targets_mean": 3313.8, "valid_targets_min": 1361 }, { "epoch": 6.743633276740238, "grad_norm": 0.4408577069276251, "learning_rate": 1.666526464820284e-07, "loss": 0.0781, "loss_nan_ranks": 0, "loss_rank_avg": 0.040150947868824005, "step": 5960, "valid_targets_mean": 3500.1, "valid_targets_min": 1814 }, { "epoch": 6.74929258630447, "grad_norm": 0.5379572135308958, "learning_rate": 1.594642668048052e-07, "loss": 0.0863, "loss_nan_ranks": 0, "loss_rank_avg": 0.03901442512869835, "step": 5965, "valid_targets_mean": 1559.0, "valid_targets_min": 759 }, { "epoch": 6.754951895868704, "grad_norm": 0.3506083866275488, "learning_rate": 1.5243373488826653e-07, "loss": 0.0593, "loss_nan_ranks": 0, "loss_rank_avg": 0.029368489980697632, "step": 5970, "valid_targets_mean": 3942.6, "valid_targets_min": 2719 }, { "epoch": 6.760611205432937, "grad_norm": 0.5454659716357816, "learning_rate": 1.4556110666606783e-07, "loss": 0.0741, "loss_nan_ranks": 0, "loss_rank_avg": 0.028036806732416153, "step": 5975, "valid_targets_mean": 1133.4, "valid_targets_min": 664 }, { "epoch": 6.766270514997171, "grad_norm": 0.3915993911091825, "learning_rate": 1.388464368156095e-07, "loss": 0.0725, "loss_nan_ranks": 0, "loss_rank_avg": 0.023933472111821175, "step": 5980, "valid_targets_mean": 2489.8, "valid_targets_min": 1584 }, { "epoch": 6.771929824561403, "grad_norm": 0.38581046462288265, "learning_rate": 1.322897787576105e-07, "loss": 0.0589, "loss_nan_ranks": 0, "loss_rank_avg": 0.028114689514040947, "step": 5985, "valid_targets_mean": 2685.4, "valid_targets_min": 1003 }, { "epoch": 6.777589134125637, "grad_norm": 0.38659993644399676, "learning_rate": 1.2589118465566875e-07, "loss": 0.0734, "loss_nan_ranks": 0, "loss_rank_avg": 0.029353385791182518, "step": 5990, "valid_targets_mean": 3180.8, "valid_targets_min": 560 }, { "epoch": 6.78324844368987, "grad_norm": 0.39635633472198784, "learning_rate": 1.1965070541585912e-07, "loss": 0.0728, "loss_nan_ranks": 0, "loss_rank_avg": 0.0360221303999424, "step": 5995, "valid_targets_mean": 3285.9, "valid_targets_min": 1049 }, { "epoch": 6.788907753254103, "grad_norm": 0.4768199556298617, "learning_rate": 1.1356839068632053e-07, "loss": 0.0845, "loss_nan_ranks": 0, "loss_rank_avg": 0.041404206305742264, "step": 6000, "valid_targets_mean": 2464.9, "valid_targets_min": 771 }, { "epoch": 6.794567062818336, "grad_norm": 0.4759804528663009, "learning_rate": 1.0764428885686073e-07, "loss": 0.0719, "loss_nan_ranks": 0, "loss_rank_avg": 0.03653126209974289, "step": 6005, "valid_targets_mean": 2959.5, "valid_targets_min": 825 }, { "epoch": 6.8002263723825696, "grad_norm": 0.5508016189657499, "learning_rate": 1.0187844705857875e-07, "loss": 0.0796, "loss_nan_ranks": 0, "loss_rank_avg": 0.04060523957014084, "step": 6010, "valid_targets_mean": 2602.1, "valid_targets_min": 829 }, { "epoch": 6.805885681946802, "grad_norm": 0.47780734613760967, "learning_rate": 9.627091116348076e-08, "loss": 0.0777, "loss_nan_ranks": 0, "loss_rank_avg": 0.04422842338681221, "step": 6015, "valid_targets_mean": 2106.1, "valid_targets_min": 650 }, { "epoch": 6.8115449915110355, "grad_norm": 0.47337810865412044, "learning_rate": 9.082172578412263e-08, "loss": 0.0778, "loss_nan_ranks": 0, "loss_rank_avg": 0.04251515865325928, "step": 6020, "valid_targets_mean": 2946.0, "valid_targets_min": 729 }, { "epoch": 6.817204301075269, "grad_norm": 0.31759103202396305, "learning_rate": 8.553093427325243e-08, "loss": 0.0665, "loss_nan_ranks": 0, "loss_rank_avg": 0.023808494210243225, "step": 6025, "valid_targets_mean": 3853.5, "valid_targets_min": 3152 }, { "epoch": 6.8228636106395015, "grad_norm": 0.3290538179958601, "learning_rate": 8.039857872345736e-08, "loss": 0.066, "loss_nan_ranks": 0, "loss_rank_avg": 0.0240267775952816, "step": 6030, "valid_targets_mean": 3448.2, "valid_targets_min": 2543 }, { "epoch": 6.828522920203735, "grad_norm": 0.48063721542746124, "learning_rate": 7.542469996684843e-08, "loss": 0.0915, "loss_nan_ranks": 0, "loss_rank_avg": 0.03989311307668686, "step": 6035, "valid_targets_mean": 2674.9, "valid_targets_min": 446 }, { "epoch": 6.834182229767968, "grad_norm": 0.4058482123607516, "learning_rate": 7.06093375747141e-08, "loss": 0.0608, "loss_nan_ranks": 0, "loss_rank_avg": 0.02851252630352974, "step": 6040, "valid_targets_mean": 2807.6, "valid_targets_min": 681 }, { "epoch": 6.839841539332202, "grad_norm": 0.5135647892958799, "learning_rate": 6.595252985721834e-08, "loss": 0.0706, "loss_nan_ranks": 0, "loss_rank_avg": 0.049752771854400635, "step": 6045, "valid_targets_mean": 5567.5, "valid_targets_min": 3772 }, { "epoch": 6.845500848896434, "grad_norm": 0.36184997124585655, "learning_rate": 6.145431386309186e-08, "loss": 0.0685, "loss_nan_ranks": 0, "loss_rank_avg": 0.032238394021987915, "step": 6050, "valid_targets_mean": 3662.4, "valid_targets_min": 484 }, { "epoch": 6.851160158460668, "grad_norm": 0.32341004212385127, "learning_rate": 5.711472537933693e-08, "loss": 0.0574, "loss_nan_ranks": 0, "loss_rank_avg": 0.02496453747153282, "step": 6055, "valid_targets_mean": 3900.0, "valid_targets_min": 861 }, { "epoch": 6.856819468024901, "grad_norm": 0.523808243909321, "learning_rate": 5.293379893094752e-08, "loss": 0.0704, "loss_nan_ranks": 0, "loss_rank_avg": 0.05595286563038826, "step": 6060, "valid_targets_mean": 4100.8, "valid_targets_min": 3268 }, { "epoch": 6.862478777589134, "grad_norm": 0.42563665626143066, "learning_rate": 4.891156778062734e-08, "loss": 0.071, "loss_nan_ranks": 0, "loss_rank_avg": 0.033235713839530945, "step": 6065, "valid_targets_mean": 3277.8, "valid_targets_min": 559 }, { "epoch": 6.868138087153367, "grad_norm": 0.4513013591790561, "learning_rate": 4.5048063928527785e-08, "loss": 0.0919, "loss_nan_ranks": 0, "loss_rank_avg": 0.030779201537370682, "step": 6070, "valid_targets_mean": 2986.2, "valid_targets_min": 689 }, { "epoch": 6.873797396717601, "grad_norm": 0.5888522930807201, "learning_rate": 4.134331811199932e-08, "loss": 0.0935, "loss_nan_ranks": 0, "loss_rank_avg": 0.05735611915588379, "step": 6075, "valid_targets_mean": 1831.6, "valid_targets_min": 616 }, { "epoch": 6.879456706281833, "grad_norm": 0.5316339779537674, "learning_rate": 3.7797359805333836e-08, "loss": 0.0535, "loss_nan_ranks": 0, "loss_rank_avg": 0.03486653417348862, "step": 6080, "valid_targets_mean": 2087.0, "valid_targets_min": 602 }, { "epoch": 6.885116015846067, "grad_norm": 0.39760459368891415, "learning_rate": 3.441021721954485e-08, "loss": 0.0871, "loss_nan_ranks": 0, "loss_rank_avg": 0.03535497188568115, "step": 6085, "valid_targets_mean": 3992.1, "valid_targets_min": 3551 }, { "epoch": 6.8907753254103, "grad_norm": 0.43388913745160906, "learning_rate": 3.11819173021366e-08, "loss": 0.0674, "loss_nan_ranks": 0, "loss_rank_avg": 0.02623586170375347, "step": 6090, "valid_targets_mean": 2115.1, "valid_targets_min": 596 }, { "epoch": 6.896434634974533, "grad_norm": 0.38243226683777753, "learning_rate": 2.8112485736881967e-08, "loss": 0.0697, "loss_nan_ranks": 0, "loss_rank_avg": 0.027614392340183258, "step": 6095, "valid_targets_mean": 3488.0, "valid_targets_min": 799 }, { "epoch": 6.902093944538766, "grad_norm": 0.4848799581538806, "learning_rate": 2.520194694363376e-08, "loss": 0.0821, "loss_nan_ranks": 0, "loss_rank_avg": 0.05016375333070755, "step": 6100, "valid_targets_mean": 3078.9, "valid_targets_min": 706 }, { "epoch": 6.907753254103, "grad_norm": 0.5335054810278811, "learning_rate": 2.2450324078120423e-08, "loss": 0.1072, "loss_nan_ranks": 0, "loss_rank_avg": 0.03868968039751053, "step": 6105, "valid_targets_mean": 1957.6, "valid_targets_min": 710 }, { "epoch": 6.913412563667233, "grad_norm": 0.42779014879456234, "learning_rate": 1.9857639031759522e-08, "loss": 0.0786, "loss_nan_ranks": 0, "loss_rank_avg": 0.030187007039785385, "step": 6110, "valid_targets_mean": 3112.4, "valid_targets_min": 647 }, { "epoch": 6.9190718732314656, "grad_norm": 0.5708406365969891, "learning_rate": 1.7423912431489e-08, "loss": 0.0716, "loss_nan_ranks": 0, "loss_rank_avg": 0.03383772075176239, "step": 6115, "valid_targets_mean": 1494.9, "valid_targets_min": 716 }, { "epoch": 6.924731182795699, "grad_norm": 0.4164948214390167, "learning_rate": 1.51491636396095e-08, "loss": 0.0675, "loss_nan_ranks": 0, "loss_rank_avg": 0.038247913122177124, "step": 6120, "valid_targets_mean": 3669.5, "valid_targets_min": 3122 }, { "epoch": 6.930390492359932, "grad_norm": 0.4980278280391314, "learning_rate": 1.3033410753608977e-08, "loss": 0.0678, "loss_nan_ranks": 0, "loss_rank_avg": 0.03384961932897568, "step": 6125, "valid_targets_mean": 2399.1, "valid_targets_min": 832 }, { "epoch": 6.936049801924165, "grad_norm": 0.5624363897364986, "learning_rate": 1.1076670606045004e-08, "loss": 0.0582, "loss_nan_ranks": 0, "loss_rank_avg": 0.0311758890748024, "step": 6130, "valid_targets_mean": 1216.9, "valid_targets_min": 635 }, { "epoch": 6.941709111488398, "grad_norm": 0.40337485535884043, "learning_rate": 9.278958764391554e-09, "loss": 0.0824, "loss_nan_ranks": 0, "loss_rank_avg": 0.03224567323923111, "step": 6135, "valid_targets_mean": 3078.1, "valid_targets_min": 756 }, { "epoch": 6.947368421052632, "grad_norm": 0.6199863900014508, "learning_rate": 7.64028953092133e-09, "loss": 0.0622, "loss_nan_ranks": 0, "loss_rank_avg": 0.03886682540178299, "step": 6140, "valid_targets_mean": 2387.1, "valid_targets_min": 744 }, { "epoch": 6.953027730616864, "grad_norm": 0.36540416345205473, "learning_rate": 6.16067594259695e-09, "loss": 0.0647, "loss_nan_ranks": 0, "loss_rank_avg": 0.023269277065992355, "step": 6145, "valid_targets_mean": 2088.4, "valid_targets_min": 529 }, { "epoch": 6.958687040181098, "grad_norm": 0.5059157441516826, "learning_rate": 4.840129770957713e-09, "loss": 0.0742, "loss_nan_ranks": 0, "loss_rank_avg": 0.04765991121530533, "step": 6150, "valid_targets_mean": 3932.1, "valid_targets_min": 2017 }, { "epoch": 6.964346349745331, "grad_norm": 0.32224893355652934, "learning_rate": 3.6786615220352208e-09, "loss": 0.0639, "loss_nan_ranks": 0, "loss_rank_avg": 0.02520209550857544, "step": 6155, "valid_targets_mean": 4790.0, "valid_targets_min": 516 }, { "epoch": 6.970005659309564, "grad_norm": 0.4023448099684757, "learning_rate": 2.6762804362623353e-09, "loss": 0.0625, "loss_nan_ranks": 0, "loss_rank_avg": 0.02867652103304863, "step": 6160, "valid_targets_mean": 2245.1, "valid_targets_min": 772 }, { "epoch": 6.975664968873797, "grad_norm": 0.470060085059617, "learning_rate": 1.8329944884021288e-09, "loss": 0.0663, "loss_nan_ranks": 0, "loss_rank_avg": 0.03312272951006889, "step": 6165, "valid_targets_mean": 3851.0, "valid_targets_min": 2196 }, { "epoch": 6.981324278438031, "grad_norm": 0.5501571965826606, "learning_rate": 1.1488103874923717e-09, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.11629301309585571, "step": 6170, "valid_targets_mean": 3094.1, "valid_targets_min": 2759 }, { "epoch": 6.986983588002264, "grad_norm": 0.3747210819200156, "learning_rate": 6.237335767744767e-10, "loss": 0.0781, "loss_nan_ranks": 0, "loss_rank_avg": 0.026630330830812454, "step": 6175, "valid_targets_mean": 3760.2, "valid_targets_min": 3175 }, { "epoch": 6.992642897566497, "grad_norm": 0.4336427114618938, "learning_rate": 2.577682336690757e-10, "loss": 0.0741, "loss_nan_ranks": 0, "loss_rank_avg": 0.025160185992717743, "step": 6180, "valid_targets_mean": 2446.5, "valid_targets_min": 759 }, { "epoch": 6.99830220713073, "grad_norm": 0.5105245398393162, "learning_rate": 5.091726972938915e-11, "loss": 0.0728, "loss_nan_ranks": 0, "loss_rank_avg": 0.08412353694438934, "step": 6185, "valid_targets_mean": 2332.5, "valid_targets_min": 927 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.03830413520336151, "step": 6187, "total_flos": 3.038645528557519e+18, "train_loss": 0.05716925004446894, "train_runtime": 84196.6554, "train_samples_per_second": 1.175, "train_steps_per_second": 0.073, "valid_targets_mean": 3729.2, "valid_targets_min": 1273 } ], "logging_steps": 5, "max_steps": 6188, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 3.038645528557519e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }