{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 5691, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.006150061500615006, "grad_norm": 14.34388511590367, "learning_rate": 2.8070175438596494e-07, "loss": 0.6962, "loss_nan_ranks": 0, "loss_rank_avg": 0.3923146724700928, "step": 5, "valid_targets_mean": 4422.0, "valid_targets_min": 1675 }, { "epoch": 0.012300123001230012, "grad_norm": 13.448672386958586, "learning_rate": 6.315789473684211e-07, "loss": 0.7044, "loss_nan_ranks": 0, "loss_rank_avg": 0.3457927703857422, "step": 10, "valid_targets_mean": 4058.2, "valid_targets_min": 808 }, { "epoch": 0.01845018450184502, "grad_norm": 13.80958883820625, "learning_rate": 9.824561403508773e-07, "loss": 0.6845, "loss_nan_ranks": 0, "loss_rank_avg": 0.392394483089447, "step": 15, "valid_targets_mean": 3577.9, "valid_targets_min": 746 }, { "epoch": 0.024600246002460024, "grad_norm": 10.929831076458443, "learning_rate": 1.3333333333333334e-06, "loss": 0.6333, "loss_nan_ranks": 0, "loss_rank_avg": 0.23890632390975952, "step": 20, "valid_targets_mean": 2239.2, "valid_targets_min": 514 }, { "epoch": 0.03075030750307503, "grad_norm": 8.42047367497516, "learning_rate": 1.6842105263157895e-06, "loss": 0.6591, "loss_nan_ranks": 0, "loss_rank_avg": 0.33744460344314575, "step": 25, "valid_targets_mean": 3684.1, "valid_targets_min": 1090 }, { "epoch": 0.03690036900369004, "grad_norm": 6.391556643780026, "learning_rate": 2.0350877192982456e-06, "loss": 0.6069, "loss_nan_ranks": 0, "loss_rank_avg": 0.38388872146606445, "step": 30, "valid_targets_mean": 4469.0, "valid_targets_min": 1708 }, { "epoch": 0.04305043050430504, "grad_norm": 4.973969891856266, "learning_rate": 2.385964912280702e-06, "loss": 0.5541, "loss_nan_ranks": 0, "loss_rank_avg": 0.30934831500053406, "step": 35, "valid_targets_mean": 5247.8, "valid_targets_min": 1343 }, { "epoch": 0.04920049200492005, "grad_norm": 4.127809911278667, "learning_rate": 2.7368421052631583e-06, "loss": 0.5143, "loss_nan_ranks": 0, "loss_rank_avg": 0.23439955711364746, "step": 40, "valid_targets_mean": 3866.9, "valid_targets_min": 984 }, { "epoch": 0.055350553505535055, "grad_norm": 2.2718878481854703, "learning_rate": 3.0877192982456146e-06, "loss": 0.4672, "loss_nan_ranks": 0, "loss_rank_avg": 0.26451146602630615, "step": 45, "valid_targets_mean": 3957.1, "valid_targets_min": 819 }, { "epoch": 0.06150061500615006, "grad_norm": 1.609682118490145, "learning_rate": 3.4385964912280705e-06, "loss": 0.4509, "loss_nan_ranks": 0, "loss_rank_avg": 0.19798928499221802, "step": 50, "valid_targets_mean": 2537.5, "valid_targets_min": 869 }, { "epoch": 0.06765067650676507, "grad_norm": 1.2193738230688447, "learning_rate": 3.789473684210527e-06, "loss": 0.4161, "loss_nan_ranks": 0, "loss_rank_avg": 0.20053730905056, "step": 55, "valid_targets_mean": 3389.4, "valid_targets_min": 744 }, { "epoch": 0.07380073800738007, "grad_norm": 0.9570881073406153, "learning_rate": 4.140350877192983e-06, "loss": 0.4078, "loss_nan_ranks": 0, "loss_rank_avg": 0.21180173754692078, "step": 60, "valid_targets_mean": 4312.9, "valid_targets_min": 1261 }, { "epoch": 0.07995079950799508, "grad_norm": 1.03550100295078, "learning_rate": 4.491228070175439e-06, "loss": 0.4163, "loss_nan_ranks": 0, "loss_rank_avg": 0.1993039846420288, "step": 65, "valid_targets_mean": 5299.9, "valid_targets_min": 947 }, { "epoch": 0.08610086100861009, "grad_norm": 0.7504311838601766, "learning_rate": 4.842105263157895e-06, "loss": 0.3857, "loss_nan_ranks": 0, "loss_rank_avg": 0.1999400556087494, "step": 70, "valid_targets_mean": 3929.1, "valid_targets_min": 1000 }, { "epoch": 0.09225092250922509, "grad_norm": 0.8268666766388924, "learning_rate": 5.192982456140351e-06, "loss": 0.3897, "loss_nan_ranks": 0, "loss_rank_avg": 0.22943969070911407, "step": 75, "valid_targets_mean": 4366.0, "valid_targets_min": 1211 }, { "epoch": 0.0984009840098401, "grad_norm": 0.747110484184559, "learning_rate": 5.543859649122807e-06, "loss": 0.3751, "loss_nan_ranks": 0, "loss_rank_avg": 0.19703662395477295, "step": 80, "valid_targets_mean": 4036.1, "valid_targets_min": 1185 }, { "epoch": 0.1045510455104551, "grad_norm": 0.5537844165209603, "learning_rate": 5.8947368421052634e-06, "loss": 0.3571, "loss_nan_ranks": 0, "loss_rank_avg": 0.16840311884880066, "step": 85, "valid_targets_mean": 5368.6, "valid_targets_min": 766 }, { "epoch": 0.11070110701107011, "grad_norm": 0.6864250316557902, "learning_rate": 6.245614035087721e-06, "loss": 0.3567, "loss_nan_ranks": 0, "loss_rank_avg": 0.13957206904888153, "step": 90, "valid_targets_mean": 2732.4, "valid_targets_min": 680 }, { "epoch": 0.11685116851168512, "grad_norm": 0.596229294576692, "learning_rate": 6.596491228070177e-06, "loss": 0.3513, "loss_nan_ranks": 0, "loss_rank_avg": 0.20503294467926025, "step": 95, "valid_targets_mean": 5133.0, "valid_targets_min": 1377 }, { "epoch": 0.12300123001230012, "grad_norm": 0.6047039473694451, "learning_rate": 6.947368421052632e-06, "loss": 0.3475, "loss_nan_ranks": 0, "loss_rank_avg": 0.14418484270572662, "step": 100, "valid_targets_mean": 3241.2, "valid_targets_min": 761 }, { "epoch": 0.12915129151291513, "grad_norm": 0.5872283891893437, "learning_rate": 7.298245614035089e-06, "loss": 0.3242, "loss_nan_ranks": 0, "loss_rank_avg": 0.12034086883068085, "step": 105, "valid_targets_mean": 2892.4, "valid_targets_min": 984 }, { "epoch": 0.13530135301353013, "grad_norm": 0.7415375959976724, "learning_rate": 7.649122807017545e-06, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.14090844988822937, "step": 110, "valid_targets_mean": 2352.1, "valid_targets_min": 849 }, { "epoch": 0.14145141451414514, "grad_norm": 0.5437557695218617, "learning_rate": 8.000000000000001e-06, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.17638526856899261, "step": 115, "valid_targets_mean": 6170.4, "valid_targets_min": 4370 }, { "epoch": 0.14760147601476015, "grad_norm": 0.5709639191817446, "learning_rate": 8.350877192982458e-06, "loss": 0.2977, "loss_nan_ranks": 0, "loss_rank_avg": 0.1743180900812149, "step": 120, "valid_targets_mean": 4692.6, "valid_targets_min": 817 }, { "epoch": 0.15375153751537515, "grad_norm": 0.6906789119538572, "learning_rate": 8.701754385964914e-06, "loss": 0.3067, "loss_nan_ranks": 0, "loss_rank_avg": 0.1441097855567932, "step": 125, "valid_targets_mean": 2680.5, "valid_targets_min": 765 }, { "epoch": 0.15990159901599016, "grad_norm": 0.7978504206375153, "learning_rate": 9.05263157894737e-06, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.17898012697696686, "step": 130, "valid_targets_mean": 3776.6, "valid_targets_min": 1048 }, { "epoch": 0.16605166051660517, "grad_norm": 0.5339689834834898, "learning_rate": 9.403508771929825e-06, "loss": 0.3203, "loss_nan_ranks": 0, "loss_rank_avg": 0.16535097360610962, "step": 135, "valid_targets_mean": 5200.0, "valid_targets_min": 1428 }, { "epoch": 0.17220172201722017, "grad_norm": 0.7138460856852715, "learning_rate": 9.754385964912281e-06, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.13366712629795074, "step": 140, "valid_targets_mean": 2722.0, "valid_targets_min": 814 }, { "epoch": 0.17835178351783518, "grad_norm": 0.6833985699574258, "learning_rate": 1.0105263157894738e-05, "loss": 0.2972, "loss_nan_ranks": 0, "loss_rank_avg": 0.14312300086021423, "step": 145, "valid_targets_mean": 2762.5, "valid_targets_min": 713 }, { "epoch": 0.18450184501845018, "grad_norm": 0.631945933839444, "learning_rate": 1.0456140350877194e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.12792186439037323, "step": 150, "valid_targets_mean": 2997.9, "valid_targets_min": 873 }, { "epoch": 0.1906519065190652, "grad_norm": 0.6577696206587937, "learning_rate": 1.080701754385965e-05, "loss": 0.2884, "loss_nan_ranks": 0, "loss_rank_avg": 0.09442654252052307, "step": 155, "valid_targets_mean": 2254.8, "valid_targets_min": 819 }, { "epoch": 0.1968019680196802, "grad_norm": 0.6200058152448497, "learning_rate": 1.1157894736842105e-05, "loss": 0.295, "loss_nan_ranks": 0, "loss_rank_avg": 0.09284514933824539, "step": 160, "valid_targets_mean": 3005.8, "valid_targets_min": 790 }, { "epoch": 0.2029520295202952, "grad_norm": 0.6591719878163999, "learning_rate": 1.1508771929824563e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.1334449201822281, "step": 165, "valid_targets_mean": 3188.4, "valid_targets_min": 760 }, { "epoch": 0.2091020910209102, "grad_norm": 0.5924754029967354, "learning_rate": 1.1859649122807017e-05, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.17737087607383728, "step": 170, "valid_targets_mean": 4252.5, "valid_targets_min": 1433 }, { "epoch": 0.21525215252152521, "grad_norm": 1.0184410261686934, "learning_rate": 1.2210526315789475e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.17169860005378723, "step": 175, "valid_targets_mean": 1873.9, "valid_targets_min": 756 }, { "epoch": 0.22140221402214022, "grad_norm": 0.578241174609644, "learning_rate": 1.256140350877193e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.14338549971580505, "step": 180, "valid_targets_mean": 4758.5, "valid_targets_min": 791 }, { "epoch": 0.22755227552275523, "grad_norm": 0.6864828289619771, "learning_rate": 1.2912280701754386e-05, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.1455353945493698, "step": 185, "valid_targets_mean": 3026.6, "valid_targets_min": 728 }, { "epoch": 0.23370233702337023, "grad_norm": 0.5485110296810749, "learning_rate": 1.3263157894736843e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.1245964914560318, "step": 190, "valid_targets_mean": 3965.1, "valid_targets_min": 762 }, { "epoch": 0.23985239852398524, "grad_norm": 0.5813314121792098, "learning_rate": 1.3614035087719299e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.12770430743694305, "step": 195, "valid_targets_mean": 4276.4, "valid_targets_min": 1078 }, { "epoch": 0.24600246002460024, "grad_norm": 0.5283972520686584, "learning_rate": 1.3964912280701755e-05, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.13646262884140015, "step": 200, "valid_targets_mean": 5790.0, "valid_targets_min": 1717 }, { "epoch": 0.2521525215252153, "grad_norm": 0.6928374414390275, "learning_rate": 1.4315789473684212e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.11271065473556519, "step": 205, "valid_targets_mean": 2796.9, "valid_targets_min": 652 }, { "epoch": 0.25830258302583026, "grad_norm": 0.6257799469020816, "learning_rate": 1.4666666666666666e-05, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.1546066850423813, "step": 210, "valid_targets_mean": 4036.1, "valid_targets_min": 1295 }, { "epoch": 0.2644526445264453, "grad_norm": 0.8479494000722226, "learning_rate": 1.5017543859649124e-05, "loss": 0.278, "loss_nan_ranks": 0, "loss_rank_avg": 0.15057896077632904, "step": 215, "valid_targets_mean": 2860.0, "valid_targets_min": 920 }, { "epoch": 0.27060270602706027, "grad_norm": 0.7677675659776181, "learning_rate": 1.536842105263158e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.12351485341787338, "step": 220, "valid_targets_mean": 3755.5, "valid_targets_min": 930 }, { "epoch": 0.2767527675276753, "grad_norm": 0.6162237852479014, "learning_rate": 1.5719298245614037e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.09808851778507233, "step": 225, "valid_targets_mean": 2842.8, "valid_targets_min": 596 }, { "epoch": 0.2829028290282903, "grad_norm": 0.7503428527025812, "learning_rate": 1.6070175438596495e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.11257848143577576, "step": 230, "valid_targets_mean": 2738.8, "valid_targets_min": 1373 }, { "epoch": 0.2890528905289053, "grad_norm": 0.6475625123302046, "learning_rate": 1.642105263157895e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.12272156774997711, "step": 235, "valid_targets_mean": 4599.2, "valid_targets_min": 1101 }, { "epoch": 0.2952029520295203, "grad_norm": 0.7380563592229803, "learning_rate": 1.6771929824561408e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.1349666565656662, "step": 240, "valid_targets_mean": 2908.2, "valid_targets_min": 781 }, { "epoch": 0.3013530135301353, "grad_norm": 0.7378534007066728, "learning_rate": 1.7122807017543862e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.1576254665851593, "step": 245, "valid_targets_mean": 3112.8, "valid_targets_min": 1197 }, { "epoch": 0.3075030750307503, "grad_norm": 0.6607086458282392, "learning_rate": 1.7473684210526317e-05, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.09825752675533295, "step": 250, "valid_targets_mean": 2597.6, "valid_targets_min": 722 }, { "epoch": 0.31365313653136534, "grad_norm": 0.6021963200533332, "learning_rate": 1.7824561403508775e-05, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.12922337651252747, "step": 255, "valid_targets_mean": 3576.2, "valid_targets_min": 756 }, { "epoch": 0.3198031980319803, "grad_norm": 0.5498231779416419, "learning_rate": 1.817543859649123e-05, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.13279210031032562, "step": 260, "valid_targets_mean": 4544.5, "valid_targets_min": 937 }, { "epoch": 0.32595325953259535, "grad_norm": 1.7321729583092624, "learning_rate": 1.8526315789473684e-05, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.15385058522224426, "step": 265, "valid_targets_mean": 4503.1, "valid_targets_min": 1306 }, { "epoch": 0.33210332103321033, "grad_norm": 0.6306691456267176, "learning_rate": 1.8877192982456142e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.12353003025054932, "step": 270, "valid_targets_mean": 4045.9, "valid_targets_min": 1333 }, { "epoch": 0.33825338253382536, "grad_norm": 0.7323662938659886, "learning_rate": 1.9228070175438597e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.13493561744689941, "step": 275, "valid_targets_mean": 3111.6, "valid_targets_min": 863 }, { "epoch": 0.34440344403444034, "grad_norm": 0.641520115611209, "learning_rate": 1.9578947368421055e-05, "loss": 0.2585, "loss_nan_ranks": 0, "loss_rank_avg": 0.1304367035627365, "step": 280, "valid_targets_mean": 4524.1, "valid_targets_min": 1188 }, { "epoch": 0.3505535055350554, "grad_norm": 1.3045396785116659, "learning_rate": 1.992982456140351e-05, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.16399013996124268, "step": 285, "valid_targets_mean": 3966.9, "valid_targets_min": 1111 }, { "epoch": 0.35670356703567035, "grad_norm": 0.7525603531903772, "learning_rate": 2.0280701754385967e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.10396411269903183, "step": 290, "valid_targets_mean": 1999.9, "valid_targets_min": 855 }, { "epoch": 0.3628536285362854, "grad_norm": 0.5775656415843651, "learning_rate": 2.0631578947368425e-05, "loss": 0.2558, "loss_nan_ranks": 0, "loss_rank_avg": 0.11433359980583191, "step": 295, "valid_targets_mean": 4188.5, "valid_targets_min": 695 }, { "epoch": 0.36900369003690037, "grad_norm": 0.6449434275826967, "learning_rate": 2.0982456140350877e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.1475314199924469, "step": 300, "valid_targets_mean": 4157.8, "valid_targets_min": 1078 }, { "epoch": 0.3751537515375154, "grad_norm": 0.6096518949787825, "learning_rate": 2.1333333333333335e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.09974195063114166, "step": 305, "valid_targets_mean": 3326.5, "valid_targets_min": 1144 }, { "epoch": 0.3813038130381304, "grad_norm": 0.689835865195794, "learning_rate": 2.1684210526315793e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.0843476951122284, "step": 310, "valid_targets_mean": 2435.8, "valid_targets_min": 893 }, { "epoch": 0.3874538745387454, "grad_norm": 0.7325642340307881, "learning_rate": 2.203508771929825e-05, "loss": 0.2529, "loss_nan_ranks": 0, "loss_rank_avg": 0.10683587193489075, "step": 315, "valid_targets_mean": 2763.4, "valid_targets_min": 824 }, { "epoch": 0.3936039360393604, "grad_norm": 0.5127811599160287, "learning_rate": 2.2385964912280702e-05, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.16119329631328583, "step": 320, "valid_targets_mean": 6344.2, "valid_targets_min": 1054 }, { "epoch": 0.3997539975399754, "grad_norm": 0.5796006887347024, "learning_rate": 2.273684210526316e-05, "loss": 0.2547, "loss_nan_ranks": 0, "loss_rank_avg": 0.13043825328350067, "step": 325, "valid_targets_mean": 4569.6, "valid_targets_min": 1415 }, { "epoch": 0.4059040590405904, "grad_norm": 0.7654349225213335, "learning_rate": 2.3087719298245618e-05, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.16439379751682281, "step": 330, "valid_targets_mean": 3416.4, "valid_targets_min": 677 }, { "epoch": 0.41205412054120544, "grad_norm": 0.7923911693218662, "learning_rate": 2.3438596491228073e-05, "loss": 0.2572, "loss_nan_ranks": 0, "loss_rank_avg": 0.16690054535865784, "step": 335, "valid_targets_mean": 4589.4, "valid_targets_min": 1259 }, { "epoch": 0.4182041820418204, "grad_norm": 0.5497897100215323, "learning_rate": 2.3789473684210527e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.12379418313503265, "step": 340, "valid_targets_mean": 4529.6, "valid_targets_min": 545 }, { "epoch": 0.42435424354243545, "grad_norm": 0.5397909285693497, "learning_rate": 2.4140350877192985e-05, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.11294364184141159, "step": 345, "valid_targets_mean": 4670.1, "valid_targets_min": 960 }, { "epoch": 0.43050430504305043, "grad_norm": 0.6827878269740454, "learning_rate": 2.449122807017544e-05, "loss": 0.2416, "loss_nan_ranks": 0, "loss_rank_avg": 0.12532299757003784, "step": 350, "valid_targets_mean": 3995.5, "valid_targets_min": 1045 }, { "epoch": 0.43665436654366546, "grad_norm": 0.5834526984728204, "learning_rate": 2.4842105263157898e-05, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.1181444525718689, "step": 355, "valid_targets_mean": 4259.4, "valid_targets_min": 1124 }, { "epoch": 0.44280442804428044, "grad_norm": 0.8097876401661674, "learning_rate": 2.5192982456140352e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.13173595070838928, "step": 360, "valid_targets_mean": 3900.5, "valid_targets_min": 798 }, { "epoch": 0.4489544895448955, "grad_norm": 0.6402467279819687, "learning_rate": 2.5543859649122807e-05, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.12714681029319763, "step": 365, "valid_targets_mean": 4407.1, "valid_targets_min": 822 }, { "epoch": 0.45510455104551045, "grad_norm": 0.7146089386247548, "learning_rate": 2.5894736842105265e-05, "loss": 0.2571, "loss_nan_ranks": 0, "loss_rank_avg": 0.0844363421201706, "step": 370, "valid_targets_mean": 1544.2, "valid_targets_min": 888 }, { "epoch": 0.4612546125461255, "grad_norm": 0.5825739163735174, "learning_rate": 2.6245614035087723e-05, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.14574196934700012, "step": 375, "valid_targets_mean": 5416.8, "valid_targets_min": 830 }, { "epoch": 0.46740467404674046, "grad_norm": 0.5986218806616732, "learning_rate": 2.6596491228070174e-05, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.12313855439424515, "step": 380, "valid_targets_mean": 4090.0, "valid_targets_min": 505 }, { "epoch": 0.4735547355473555, "grad_norm": 0.6605150095735414, "learning_rate": 2.6947368421052632e-05, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.15636996924877167, "step": 385, "valid_targets_mean": 4446.0, "valid_targets_min": 1180 }, { "epoch": 0.4797047970479705, "grad_norm": 0.6324684396446358, "learning_rate": 2.729824561403509e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.12866069376468658, "step": 390, "valid_targets_mean": 3533.9, "valid_targets_min": 1058 }, { "epoch": 0.4858548585485855, "grad_norm": 0.6662998202285606, "learning_rate": 2.764912280701755e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.10635501146316528, "step": 395, "valid_targets_mean": 2783.5, "valid_targets_min": 650 }, { "epoch": 0.4920049200492005, "grad_norm": 0.6247271495703325, "learning_rate": 2.8e-05, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.12806738913059235, "step": 400, "valid_targets_mean": 3668.4, "valid_targets_min": 1193 }, { "epoch": 0.4981549815498155, "grad_norm": 0.6566549512264044, "learning_rate": 2.8350877192982458e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.140034019947052, "step": 405, "valid_targets_mean": 3933.4, "valid_targets_min": 1446 }, { "epoch": 0.5043050430504306, "grad_norm": 0.560957404856101, "learning_rate": 2.8701754385964916e-05, "loss": 0.2443, "loss_nan_ranks": 0, "loss_rank_avg": 0.10376521199941635, "step": 410, "valid_targets_mean": 3788.6, "valid_targets_min": 642 }, { "epoch": 0.5104551045510455, "grad_norm": 0.5918715305614818, "learning_rate": 2.9052631578947374e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.15398825705051422, "step": 415, "valid_targets_mean": 4870.4, "valid_targets_min": 906 }, { "epoch": 0.5166051660516605, "grad_norm": 0.6840002116163053, "learning_rate": 2.9403508771929825e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.09648455679416656, "step": 420, "valid_targets_mean": 2946.9, "valid_targets_min": 922 }, { "epoch": 0.5227552275522755, "grad_norm": 0.6991668740858077, "learning_rate": 2.9754385964912283e-05, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.12691104412078857, "step": 425, "valid_targets_mean": 3454.4, "valid_targets_min": 1005 }, { "epoch": 0.5289052890528906, "grad_norm": 0.6057067284077027, "learning_rate": 3.010526315789474e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.14319056272506714, "step": 430, "valid_targets_mean": 4794.1, "valid_targets_min": 708 }, { "epoch": 0.5350553505535055, "grad_norm": 0.5941894810235845, "learning_rate": 3.0456140350877195e-05, "loss": 0.2412, "loss_nan_ranks": 0, "loss_rank_avg": 0.11128835380077362, "step": 435, "valid_targets_mean": 3645.6, "valid_targets_min": 1287 }, { "epoch": 0.5412054120541205, "grad_norm": 0.61624164780544, "learning_rate": 3.080701754385965e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.11885511875152588, "step": 440, "valid_targets_mean": 3409.5, "valid_targets_min": 1004 }, { "epoch": 0.5473554735547356, "grad_norm": 0.6575804659128035, "learning_rate": 3.1157894736842105e-05, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.14894616603851318, "step": 445, "valid_targets_mean": 3475.8, "valid_targets_min": 953 }, { "epoch": 0.5535055350553506, "grad_norm": 0.6890003470083387, "learning_rate": 3.150877192982456e-05, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.0839521661400795, "step": 450, "valid_targets_mean": 2157.6, "valid_targets_min": 885 }, { "epoch": 0.5596555965559655, "grad_norm": 0.5228244349102561, "learning_rate": 3.185964912280702e-05, "loss": 0.2299, "loss_nan_ranks": 0, "loss_rank_avg": 0.11843560636043549, "step": 455, "valid_targets_mean": 5570.5, "valid_targets_min": 1278 }, { "epoch": 0.5658056580565806, "grad_norm": 0.6135745125381087, "learning_rate": 3.221052631578947e-05, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.13862308859825134, "step": 460, "valid_targets_mean": 4292.4, "valid_targets_min": 809 }, { "epoch": 0.5719557195571956, "grad_norm": 0.5856788659327695, "learning_rate": 3.256140350877193e-05, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.11673273146152496, "step": 465, "valid_targets_mean": 4726.9, "valid_targets_min": 922 }, { "epoch": 0.5781057810578106, "grad_norm": 0.7031341038651712, "learning_rate": 3.291228070175439e-05, "loss": 0.242, "loss_nan_ranks": 0, "loss_rank_avg": 0.14521513879299164, "step": 470, "valid_targets_mean": 3073.2, "valid_targets_min": 682 }, { "epoch": 0.5842558425584256, "grad_norm": 0.6119983489600114, "learning_rate": 3.3263157894736846e-05, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.11497868597507477, "step": 475, "valid_targets_mean": 3424.2, "valid_targets_min": 563 }, { "epoch": 0.5904059040590406, "grad_norm": 0.6563106237909677, "learning_rate": 3.36140350877193e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.09766963869333267, "step": 480, "valid_targets_mean": 2831.5, "valid_targets_min": 770 }, { "epoch": 0.5965559655596556, "grad_norm": 0.6234159492386329, "learning_rate": 3.3964912280701755e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.13836853206157684, "step": 485, "valid_targets_mean": 2741.6, "valid_targets_min": 1390 }, { "epoch": 0.6027060270602707, "grad_norm": 0.6908214055958825, "learning_rate": 3.431578947368421e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.09620989859104156, "step": 490, "valid_targets_mean": 2789.9, "valid_targets_min": 748 }, { "epoch": 0.6088560885608856, "grad_norm": 0.5672418144373478, "learning_rate": 3.466666666666667e-05, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.1471034586429596, "step": 495, "valid_targets_mean": 5695.5, "valid_targets_min": 1120 }, { "epoch": 0.6150061500615006, "grad_norm": 0.5892132708436436, "learning_rate": 3.501754385964912e-05, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.10246916860342026, "step": 500, "valid_targets_mean": 3984.2, "valid_targets_min": 1395 }, { "epoch": 0.6211562115621156, "grad_norm": 0.4618293405009735, "learning_rate": 3.536842105263158e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.1416078805923462, "step": 505, "valid_targets_mean": 6996.8, "valid_targets_min": 1943 }, { "epoch": 0.6273062730627307, "grad_norm": 0.5941175843723603, "learning_rate": 3.571929824561404e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.15049150586128235, "step": 510, "valid_targets_mean": 4797.2, "valid_targets_min": 1365 }, { "epoch": 0.6334563345633456, "grad_norm": 0.7205522483055742, "learning_rate": 3.6070175438596497e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.10621985793113708, "step": 515, "valid_targets_mean": 2456.4, "valid_targets_min": 777 }, { "epoch": 0.6396063960639606, "grad_norm": 0.606247855571102, "learning_rate": 3.6421052631578955e-05, "loss": 0.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.14817304909229279, "step": 520, "valid_targets_mean": 4189.4, "valid_targets_min": 888 }, { "epoch": 0.6457564575645757, "grad_norm": 0.5739045072909725, "learning_rate": 3.6771929824561406e-05, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.12606631219387054, "step": 525, "valid_targets_mean": 4690.6, "valid_targets_min": 909 }, { "epoch": 0.6519065190651907, "grad_norm": 0.6833692875672978, "learning_rate": 3.7122807017543864e-05, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.08352625370025635, "step": 530, "valid_targets_mean": 1783.1, "valid_targets_min": 696 }, { "epoch": 0.6580565805658056, "grad_norm": 0.6207727738102795, "learning_rate": 3.747368421052632e-05, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.09904326498508453, "step": 535, "valid_targets_mean": 2827.1, "valid_targets_min": 1535 }, { "epoch": 0.6642066420664207, "grad_norm": 0.6437986931296231, "learning_rate": 3.782456140350878e-05, "loss": 0.2309, "loss_nan_ranks": 0, "loss_rank_avg": 0.10277711600065231, "step": 540, "valid_targets_mean": 2709.9, "valid_targets_min": 775 }, { "epoch": 0.6703567035670357, "grad_norm": 0.5491691992502378, "learning_rate": 3.817543859649123e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.09722322225570679, "step": 545, "valid_targets_mean": 3374.2, "valid_targets_min": 1129 }, { "epoch": 0.6765067650676507, "grad_norm": 0.5224553002032761, "learning_rate": 3.852631578947369e-05, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.1046345978975296, "step": 550, "valid_targets_mean": 3934.6, "valid_targets_min": 868 }, { "epoch": 0.6826568265682657, "grad_norm": 0.6693332722010621, "learning_rate": 3.887719298245615e-05, "loss": 0.2412, "loss_nan_ranks": 0, "loss_rank_avg": 0.12382499873638153, "step": 555, "valid_targets_mean": 3000.4, "valid_targets_min": 879 }, { "epoch": 0.6888068880688807, "grad_norm": 0.553481707783701, "learning_rate": 3.92280701754386e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.15222081542015076, "step": 560, "valid_targets_mean": 5865.9, "valid_targets_min": 4226 }, { "epoch": 0.6949569495694957, "grad_norm": 0.5730366034440327, "learning_rate": 3.9578947368421056e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.0955621600151062, "step": 565, "valid_targets_mean": 3486.2, "valid_targets_min": 1177 }, { "epoch": 0.7011070110701108, "grad_norm": 0.6652205945553179, "learning_rate": 3.9929824561403514e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.11635396629571915, "step": 570, "valid_targets_mean": 2395.6, "valid_targets_min": 741 }, { "epoch": 0.7072570725707257, "grad_norm": 0.5956099028772482, "learning_rate": 3.9999939784269625e-05, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.1362784057855606, "step": 575, "valid_targets_mean": 4311.1, "valid_targets_min": 883 }, { "epoch": 0.7134071340713407, "grad_norm": 0.6146107763137679, "learning_rate": 3.999969515848639e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.06651298701763153, "step": 580, "valid_targets_mean": 2019.5, "valid_targets_min": 726 }, { "epoch": 0.7195571955719557, "grad_norm": 0.6343543081731409, "learning_rate": 3.9999262361467005e-05, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.09140601009130478, "step": 585, "valid_targets_mean": 2581.9, "valid_targets_min": 795 }, { "epoch": 0.7257072570725708, "grad_norm": 0.6894184309108627, "learning_rate": 3.999864139728351e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.08771437406539917, "step": 590, "valid_targets_mean": 3145.0, "valid_targets_min": 1170 }, { "epoch": 0.7318573185731857, "grad_norm": 0.5482093353519395, "learning_rate": 3.999783227177839e-05, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.12046876549720764, "step": 595, "valid_targets_mean": 4569.9, "valid_targets_min": 1073 }, { "epoch": 0.7380073800738007, "grad_norm": 0.5851961009573206, "learning_rate": 3.9996834992564466e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.11402551829814911, "step": 600, "valid_targets_mean": 3774.1, "valid_targets_min": 714 }, { "epoch": 0.7441574415744158, "grad_norm": 0.7296287458386673, "learning_rate": 3.999564956902483e-05, "loss": 0.2238, "loss_nan_ranks": 0, "loss_rank_avg": 0.11000651121139526, "step": 605, "valid_targets_mean": 2601.1, "valid_targets_min": 954 }, { "epoch": 0.7503075030750308, "grad_norm": 0.5760597451958402, "learning_rate": 3.99942760123128e-05, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.10833773016929626, "step": 610, "valid_targets_mean": 3435.2, "valid_targets_min": 928 }, { "epoch": 0.7564575645756457, "grad_norm": 0.6943640448961329, "learning_rate": 3.999271433535176e-05, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.17129077017307281, "step": 615, "valid_targets_mean": 4504.4, "valid_targets_min": 1482 }, { "epoch": 0.7626076260762608, "grad_norm": 0.5992686377470863, "learning_rate": 3.999096455283507e-05, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.12008202821016312, "step": 620, "valid_targets_mean": 3744.4, "valid_targets_min": 636 }, { "epoch": 0.7687576875768758, "grad_norm": 0.560354350495624, "learning_rate": 3.998902668122591e-05, "loss": 0.2206, "loss_nan_ranks": 0, "loss_rank_avg": 0.09997505694627762, "step": 625, "valid_targets_mean": 3714.2, "valid_targets_min": 1246 }, { "epoch": 0.7749077490774908, "grad_norm": 0.663824524099195, "learning_rate": 3.9986900738757154e-05, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.08692231774330139, "step": 630, "valid_targets_mean": 1984.8, "valid_targets_min": 835 }, { "epoch": 0.7810578105781057, "grad_norm": 0.5697800913867379, "learning_rate": 3.998458674543116e-05, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.10943552851676941, "step": 635, "valid_targets_mean": 4525.5, "valid_targets_min": 1488 }, { "epoch": 0.7872078720787208, "grad_norm": 0.6098594731220626, "learning_rate": 3.998208472301962e-05, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.12786969542503357, "step": 640, "valid_targets_mean": 4307.6, "valid_targets_min": 677 }, { "epoch": 0.7933579335793358, "grad_norm": 0.5680955054141075, "learning_rate": 3.9979394695063306e-05, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.10294528305530548, "step": 645, "valid_targets_mean": 3989.6, "valid_targets_min": 842 }, { "epoch": 0.7995079950799509, "grad_norm": 0.4531766121560527, "learning_rate": 3.9976516686871915e-05, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.13426783680915833, "step": 650, "valid_targets_mean": 6125.5, "valid_targets_min": 1385 }, { "epoch": 0.8056580565805658, "grad_norm": 0.7081288279396023, "learning_rate": 3.997345072552377e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.10611796379089355, "step": 655, "valid_targets_mean": 2718.1, "valid_targets_min": 826 }, { "epoch": 0.8118081180811808, "grad_norm": 0.5095252606710687, "learning_rate": 3.99701968398656e-05, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.0888926312327385, "step": 660, "valid_targets_mean": 3124.4, "valid_targets_min": 815 }, { "epoch": 0.8179581795817958, "grad_norm": 0.5038212489700703, "learning_rate": 3.996675506051225e-05, "loss": 0.2209, "loss_nan_ranks": 0, "loss_rank_avg": 0.1266401708126068, "step": 665, "valid_targets_mean": 4402.2, "valid_targets_min": 1074 }, { "epoch": 0.8241082410824109, "grad_norm": 0.5890742175314511, "learning_rate": 3.996312541984642e-05, "loss": 0.2249, "loss_nan_ranks": 0, "loss_rank_avg": 0.1030929833650589, "step": 670, "valid_targets_mean": 2584.6, "valid_targets_min": 761 }, { "epoch": 0.8302583025830258, "grad_norm": 0.6356350712622403, "learning_rate": 3.995930795201831e-05, "loss": 0.2252, "loss_nan_ranks": 0, "loss_rank_avg": 0.10172396153211594, "step": 675, "valid_targets_mean": 2809.1, "valid_targets_min": 985 }, { "epoch": 0.8364083640836408, "grad_norm": 0.5274083076797975, "learning_rate": 3.9955302692945374e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.09649267047643661, "step": 680, "valid_targets_mean": 3972.9, "valid_targets_min": 1176 }, { "epoch": 0.8425584255842559, "grad_norm": 0.5376020521602856, "learning_rate": 3.9951109680311895e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.13508303463459015, "step": 685, "valid_targets_mean": 5890.8, "valid_targets_min": 1350 }, { "epoch": 0.8487084870848709, "grad_norm": 0.6004054189462937, "learning_rate": 3.9946728953568704e-05, "loss": 0.2238, "loss_nan_ranks": 0, "loss_rank_avg": 0.1343661993741989, "step": 690, "valid_targets_mean": 3911.5, "valid_targets_min": 788 }, { "epoch": 0.8548585485854858, "grad_norm": 0.7328780243982768, "learning_rate": 3.994216055393276e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.10920784622430801, "step": 695, "valid_targets_mean": 3000.6, "valid_targets_min": 1065 }, { "epoch": 0.8610086100861009, "grad_norm": 0.5752830131830805, "learning_rate": 3.993740452438679e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.10322065651416779, "step": 700, "valid_targets_mean": 3641.1, "valid_targets_min": 682 }, { "epoch": 0.8671586715867159, "grad_norm": 0.5724944605467019, "learning_rate": 3.993246090967887e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.09728273749351501, "step": 705, "valid_targets_mean": 3621.1, "valid_targets_min": 1021 }, { "epoch": 0.8733087330873309, "grad_norm": 0.5148833129384647, "learning_rate": 3.992732975632202e-05, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.09972958266735077, "step": 710, "valid_targets_mean": 4536.9, "valid_targets_min": 1185 }, { "epoch": 0.8794587945879458, "grad_norm": 0.6231510005592564, "learning_rate": 3.992201111259375e-05, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.10495687276124954, "step": 715, "valid_targets_mean": 2813.1, "valid_targets_min": 746 }, { "epoch": 0.8856088560885609, "grad_norm": 0.5357245589958889, "learning_rate": 3.991650502853561e-05, "loss": 0.2283, "loss_nan_ranks": 0, "loss_rank_avg": 0.11093232035636902, "step": 720, "valid_targets_mean": 4334.6, "valid_targets_min": 896 }, { "epoch": 0.8917589175891759, "grad_norm": 0.5698573784802536, "learning_rate": 3.991081155595272e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.14591939747333527, "step": 725, "valid_targets_mean": 5415.6, "valid_targets_min": 812 }, { "epoch": 0.897908979089791, "grad_norm": 0.5580461627711715, "learning_rate": 3.990493074841329e-05, "loss": 0.2316, "loss_nan_ranks": 0, "loss_rank_avg": 0.1268429160118103, "step": 730, "valid_targets_mean": 3923.8, "valid_targets_min": 1082 }, { "epoch": 0.9040590405904059, "grad_norm": 0.5484280424908219, "learning_rate": 3.989886266124809e-05, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.07535350322723389, "step": 735, "valid_targets_mean": 3045.1, "valid_targets_min": 693 }, { "epoch": 0.9102091020910209, "grad_norm": 0.5882246917841814, "learning_rate": 3.9892607351549984e-05, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.1213439330458641, "step": 740, "valid_targets_mean": 3782.9, "valid_targets_min": 1303 }, { "epoch": 0.9163591635916359, "grad_norm": 0.5431561417113111, "learning_rate": 3.988616487817332e-05, "loss": 0.2265, "loss_nan_ranks": 0, "loss_rank_avg": 0.08019325137138367, "step": 745, "valid_targets_mean": 2830.4, "valid_targets_min": 607 }, { "epoch": 0.922509225092251, "grad_norm": 0.6136354957743274, "learning_rate": 3.9879535301733436e-05, "loss": 0.2248, "loss_nan_ranks": 0, "loss_rank_avg": 0.10432184487581253, "step": 750, "valid_targets_mean": 3336.4, "valid_targets_min": 821 }, { "epoch": 0.9286592865928659, "grad_norm": 0.5690547356684668, "learning_rate": 3.987271868460607e-05, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.09149742126464844, "step": 755, "valid_targets_mean": 3187.6, "valid_targets_min": 851 }, { "epoch": 0.9348093480934809, "grad_norm": 0.5485525214734037, "learning_rate": 3.986571509092676e-05, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.11811724305152893, "step": 760, "valid_targets_mean": 4903.9, "valid_targets_min": 1324 }, { "epoch": 0.940959409594096, "grad_norm": 0.5140959758446015, "learning_rate": 3.9858524586590235e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.09690752625465393, "step": 765, "valid_targets_mean": 4038.5, "valid_targets_min": 1524 }, { "epoch": 0.947109471094711, "grad_norm": 0.624772386001772, "learning_rate": 3.985114723924986e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.10119441151618958, "step": 770, "valid_targets_mean": 2797.9, "valid_targets_min": 684 }, { "epoch": 0.9532595325953259, "grad_norm": 0.6328308571681359, "learning_rate": 3.984358311831691e-05, "loss": 0.2235, "loss_nan_ranks": 0, "loss_rank_avg": 0.08481530845165253, "step": 775, "valid_targets_mean": 2336.0, "valid_targets_min": 730 }, { "epoch": 0.959409594095941, "grad_norm": 0.5882442521314974, "learning_rate": 3.983583229495996e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.15235298871994019, "step": 780, "valid_targets_mean": 5127.1, "valid_targets_min": 1568 }, { "epoch": 0.965559655596556, "grad_norm": 0.6800908309936957, "learning_rate": 3.9827894842104234e-05, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.13019883632659912, "step": 785, "valid_targets_mean": 3817.9, "valid_targets_min": 1288 }, { "epoch": 0.971709717097171, "grad_norm": 0.5368647330195034, "learning_rate": 3.981977083443088e-05, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.1295686960220337, "step": 790, "valid_targets_mean": 4428.8, "valid_targets_min": 1419 }, { "epoch": 0.977859778597786, "grad_norm": 0.5050231596516701, "learning_rate": 3.9811460348376297e-05, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.1423277109861374, "step": 795, "valid_targets_mean": 5464.0, "valid_targets_min": 1130 }, { "epoch": 0.984009840098401, "grad_norm": 0.6048207125459876, "learning_rate": 3.980296346213139e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.1799425482749939, "step": 800, "valid_targets_mean": 4189.5, "valid_targets_min": 901 }, { "epoch": 0.990159901599016, "grad_norm": 0.5572527201040101, "learning_rate": 3.9794280255640864e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.1222771406173706, "step": 805, "valid_targets_mean": 4308.4, "valid_targets_min": 893 }, { "epoch": 0.996309963099631, "grad_norm": 0.6101121600903643, "learning_rate": 3.978541081060245e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.10646595060825348, "step": 810, "valid_targets_mean": 3194.2, "valid_targets_min": 593 }, { "epoch": 1.002460024600246, "grad_norm": 0.512453158452269, "learning_rate": 3.977635521046613e-05, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.1067245677113533, "step": 815, "valid_targets_mean": 5039.1, "valid_targets_min": 1266 }, { "epoch": 1.0086100861008611, "grad_norm": 0.5697282740006272, "learning_rate": 3.976711354043339e-05, "loss": 0.2068, "loss_nan_ranks": 0, "loss_rank_avg": 0.09792441129684448, "step": 820, "valid_targets_mean": 4302.0, "valid_targets_min": 891 }, { "epoch": 1.014760147601476, "grad_norm": 0.5477501061399453, "learning_rate": 3.9757685887456374e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.07114817202091217, "step": 825, "valid_targets_mean": 2860.6, "valid_targets_min": 748 }, { "epoch": 1.020910209102091, "grad_norm": 0.5454078089966694, "learning_rate": 3.974807234023709e-05, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.10332266986370087, "step": 830, "valid_targets_mean": 4091.5, "valid_targets_min": 1647 }, { "epoch": 1.027060270602706, "grad_norm": 0.6619144608369546, "learning_rate": 3.9738272989226566e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.09315122663974762, "step": 835, "valid_targets_mean": 2405.8, "valid_targets_min": 724 }, { "epoch": 1.033210332103321, "grad_norm": 0.5656128567180967, "learning_rate": 3.9728287926624013e-05, "loss": 0.1987, "loss_nan_ranks": 0, "loss_rank_avg": 0.08677469938993454, "step": 840, "valid_targets_mean": 4562.6, "valid_targets_min": 713 }, { "epoch": 1.039360393603936, "grad_norm": 0.6577914529799598, "learning_rate": 3.9718117246375946e-05, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.08870288729667664, "step": 845, "valid_targets_mean": 2273.0, "valid_targets_min": 684 }, { "epoch": 1.045510455104551, "grad_norm": 0.6163431926341251, "learning_rate": 3.970776104417528e-05, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.09998206794261932, "step": 850, "valid_targets_mean": 3411.0, "valid_targets_min": 774 }, { "epoch": 1.051660516605166, "grad_norm": 0.5426764248783481, "learning_rate": 3.969721941746048e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.11000164598226547, "step": 855, "valid_targets_mean": 4086.0, "valid_targets_min": 1050 }, { "epoch": 1.0578105781057812, "grad_norm": 0.5624023109088332, "learning_rate": 3.9686492465414604e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.12527331709861755, "step": 860, "valid_targets_mean": 4599.8, "valid_targets_min": 1430 }, { "epoch": 1.063960639606396, "grad_norm": 0.522478876660166, "learning_rate": 3.967558028896439e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.09331618994474411, "step": 865, "valid_targets_mean": 4297.6, "valid_targets_min": 874 }, { "epoch": 1.070110701107011, "grad_norm": 0.6061702948387535, "learning_rate": 3.966448299077927e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.06690007448196411, "step": 870, "valid_targets_mean": 2106.2, "valid_targets_min": 826 }, { "epoch": 1.0762607626076262, "grad_norm": 0.5455281617805586, "learning_rate": 3.965320067527047e-05, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.10937830805778503, "step": 875, "valid_targets_mean": 5750.5, "valid_targets_min": 1507 }, { "epoch": 1.082410824108241, "grad_norm": 0.4720396465603722, "learning_rate": 3.964173344858995e-05, "loss": 0.2113, "loss_nan_ranks": 0, "loss_rank_avg": 0.1531623750925064, "step": 880, "valid_targets_mean": 6774.9, "valid_targets_min": 1644 }, { "epoch": 1.088560885608856, "grad_norm": 0.632410114573719, "learning_rate": 3.9630081418629486e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.11100660264492035, "step": 885, "valid_targets_mean": 2789.1, "valid_targets_min": 687 }, { "epoch": 1.0947109471094711, "grad_norm": 0.569124224978277, "learning_rate": 3.961824469501958e-05, "loss": 0.2131, "loss_nan_ranks": 0, "loss_rank_avg": 0.14877255260944366, "step": 890, "valid_targets_mean": 3959.4, "valid_targets_min": 1437 }, { "epoch": 1.100861008610086, "grad_norm": 0.5475289579116467, "learning_rate": 3.960622338912849e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.10590916872024536, "step": 895, "valid_targets_mean": 3396.9, "valid_targets_min": 714 }, { "epoch": 1.1070110701107012, "grad_norm": 0.5951604986651677, "learning_rate": 3.959401761406112e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.09570469707250595, "step": 900, "valid_targets_mean": 2590.4, "valid_targets_min": 1157 }, { "epoch": 1.1131611316113161, "grad_norm": 0.5735630872456072, "learning_rate": 3.958162748465803e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.09289798885583878, "step": 905, "valid_targets_mean": 4598.4, "valid_targets_min": 820 }, { "epoch": 1.119311193111931, "grad_norm": 0.6567622145178927, "learning_rate": 3.9569053117494276e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.07980631291866302, "step": 910, "valid_targets_mean": 1776.5, "valid_targets_min": 626 }, { "epoch": 1.1254612546125462, "grad_norm": 0.5459210228262543, "learning_rate": 3.955629463087838e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.11270461976528168, "step": 915, "valid_targets_mean": 4065.0, "valid_targets_min": 1291 }, { "epoch": 1.1316113161131611, "grad_norm": 0.6169196601178953, "learning_rate": 3.9543352144851186e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.09531322121620178, "step": 920, "valid_targets_mean": 2537.8, "valid_targets_min": 752 }, { "epoch": 1.137761377613776, "grad_norm": 0.5475073102730614, "learning_rate": 3.9530225781184726e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.08803798258304596, "step": 925, "valid_targets_mean": 3299.6, "valid_targets_min": 694 }, { "epoch": 1.1439114391143912, "grad_norm": 0.7392470655361305, "learning_rate": 3.951691566338108e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.13760310411453247, "step": 930, "valid_targets_mean": 3740.5, "valid_targets_min": 1124 }, { "epoch": 1.1500615006150061, "grad_norm": 0.6915428677199909, "learning_rate": 3.9503421916671235e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.10935693979263306, "step": 935, "valid_targets_mean": 3935.5, "valid_targets_min": 985 }, { "epoch": 1.156211562115621, "grad_norm": 0.7136268383963796, "learning_rate": 3.948974466801387e-05, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.11539360880851746, "step": 940, "valid_targets_mean": 2160.4, "valid_targets_min": 732 }, { "epoch": 1.1623616236162362, "grad_norm": 0.5096395383377019, "learning_rate": 3.947588404609418e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.13573335111141205, "step": 945, "valid_targets_mean": 5011.8, "valid_targets_min": 1168 }, { "epoch": 1.168511685116851, "grad_norm": 0.6181503537374962, "learning_rate": 3.946184018132268e-05, "loss": 0.1983, "loss_nan_ranks": 0, "loss_rank_avg": 0.08616000413894653, "step": 950, "valid_targets_mean": 2225.5, "valid_targets_min": 937 }, { "epoch": 1.1746617466174663, "grad_norm": 0.5767897351195992, "learning_rate": 3.9447613205833947e-05, "loss": 0.2095, "loss_nan_ranks": 0, "loss_rank_avg": 0.1230311393737793, "step": 955, "valid_targets_mean": 3215.6, "valid_targets_min": 820 }, { "epoch": 1.1808118081180812, "grad_norm": 0.5292485819890297, "learning_rate": 3.9433203253485406e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.09185110032558441, "step": 960, "valid_targets_mean": 3096.8, "valid_targets_min": 646 }, { "epoch": 1.186961869618696, "grad_norm": 0.5181443964377307, "learning_rate": 3.941861045985605e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.10440077632665634, "step": 965, "valid_targets_mean": 3527.9, "valid_targets_min": 1279 }, { "epoch": 1.1931119311193112, "grad_norm": 0.5728482875406273, "learning_rate": 3.940383496224516e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.05747752636671066, "step": 970, "valid_targets_mean": 2366.6, "valid_targets_min": 911 }, { "epoch": 1.1992619926199262, "grad_norm": 0.6465990822128065, "learning_rate": 3.938887689967106e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.09574022889137268, "step": 975, "valid_targets_mean": 4110.6, "valid_targets_min": 807 }, { "epoch": 1.2054120541205413, "grad_norm": 0.701606242096391, "learning_rate": 3.937373641286973e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.09395575523376465, "step": 980, "valid_targets_mean": 2305.0, "valid_targets_min": 787 }, { "epoch": 1.2115621156211562, "grad_norm": 0.6514050475900018, "learning_rate": 3.935841364429355e-05, "loss": 0.2139, "loss_nan_ranks": 0, "loss_rank_avg": 0.14189472794532776, "step": 985, "valid_targets_mean": 3700.2, "valid_targets_min": 1365 }, { "epoch": 1.2177121771217712, "grad_norm": 0.634389277119909, "learning_rate": 3.934290873810995e-05, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.07238497585058212, "step": 990, "valid_targets_mean": 1775.8, "valid_targets_min": 718 }, { "epoch": 1.2238622386223863, "grad_norm": 0.5108627501449012, "learning_rate": 3.9327221840200016e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.06333731859922409, "step": 995, "valid_targets_mean": 2359.6, "valid_targets_min": 734 }, { "epoch": 1.2300123001230012, "grad_norm": 0.5558236206528789, "learning_rate": 3.931135309815712e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.1480255275964737, "step": 1000, "valid_targets_mean": 4993.5, "valid_targets_min": 2118 }, { "epoch": 1.2361623616236161, "grad_norm": 0.5798554403366425, "learning_rate": 3.929530266128562e-05, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.1239444687962532, "step": 1005, "valid_targets_mean": 3851.4, "valid_targets_min": 1234 }, { "epoch": 1.2423124231242313, "grad_norm": 0.520486886304569, "learning_rate": 3.927907068059931e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.08450537919998169, "step": 1010, "valid_targets_mean": 3581.9, "valid_targets_min": 1157 }, { "epoch": 1.2484624846248462, "grad_norm": 0.6768563245137302, "learning_rate": 3.926265730882013e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.1397990584373474, "step": 1015, "valid_targets_mean": 4325.9, "valid_targets_min": 896 }, { "epoch": 1.2546125461254611, "grad_norm": 0.5924431861285315, "learning_rate": 3.9246062700376646e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.1152370274066925, "step": 1020, "valid_targets_mean": 3168.4, "valid_targets_min": 843 }, { "epoch": 1.2607626076260763, "grad_norm": 0.6274533030255577, "learning_rate": 3.922928701140265e-05, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.12988096475601196, "step": 1025, "valid_targets_mean": 3169.6, "valid_targets_min": 693 }, { "epoch": 1.2669126691266912, "grad_norm": 0.53288201273405, "learning_rate": 3.9212330399735644e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.10920664668083191, "step": 1030, "valid_targets_mean": 3358.4, "valid_targets_min": 1382 }, { "epoch": 1.2730627306273063, "grad_norm": 0.5410316469429407, "learning_rate": 3.919519302491539e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.10489871352910995, "step": 1035, "valid_targets_mean": 2982.8, "valid_targets_min": 893 }, { "epoch": 1.2792127921279213, "grad_norm": 0.6184491732052296, "learning_rate": 3.91778750481824e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.10059502720832825, "step": 1040, "valid_targets_mean": 3470.5, "valid_targets_min": 890 }, { "epoch": 1.2853628536285364, "grad_norm": 0.4584675462132558, "learning_rate": 3.9160376632476405e-05, "loss": 0.2114, "loss_nan_ranks": 0, "loss_rank_avg": 0.10227296501398087, "step": 1045, "valid_targets_mean": 6008.1, "valid_targets_min": 1178 }, { "epoch": 1.2915129151291513, "grad_norm": 0.5337202948203579, "learning_rate": 3.914269794243484e-05, "loss": 0.2061, "loss_nan_ranks": 0, "loss_rank_avg": 0.0854802206158638, "step": 1050, "valid_targets_mean": 3249.8, "valid_targets_min": 928 }, { "epoch": 1.2976629766297663, "grad_norm": 0.5820247130189102, "learning_rate": 3.912483914439131e-05, "loss": 0.2046, "loss_nan_ranks": 0, "loss_rank_avg": 0.06562792509794235, "step": 1055, "valid_targets_mean": 2284.6, "valid_targets_min": 848 }, { "epoch": 1.3038130381303814, "grad_norm": 0.5132628138079065, "learning_rate": 3.910680040637395e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.09079452604055405, "step": 1060, "valid_targets_mean": 3807.0, "valid_targets_min": 1433 }, { "epoch": 1.3099630996309963, "grad_norm": 0.603789984461244, "learning_rate": 3.908858189810395e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.09293949604034424, "step": 1065, "valid_targets_mean": 2820.5, "valid_targets_min": 780 }, { "epoch": 1.3161131611316113, "grad_norm": 0.5629563540257153, "learning_rate": 3.9070183790993875e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.11707718670368195, "step": 1070, "valid_targets_mean": 3472.4, "valid_targets_min": 762 }, { "epoch": 1.3222632226322264, "grad_norm": 0.4840017321170116, "learning_rate": 3.905160625814609e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.12266204506158829, "step": 1075, "valid_targets_mean": 3921.2, "valid_targets_min": 1339 }, { "epoch": 1.3284132841328413, "grad_norm": 0.6480542454306704, "learning_rate": 3.9032849474351126e-05, "loss": 0.2111, "loss_nan_ranks": 0, "loss_rank_avg": 0.11063967645168304, "step": 1080, "valid_targets_mean": 3975.5, "valid_targets_min": 1315 }, { "epoch": 1.3345633456334562, "grad_norm": 0.8313864388016285, "learning_rate": 3.901391361608604e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.0995841771364212, "step": 1085, "valid_targets_mean": 3277.6, "valid_targets_min": 1045 }, { "epoch": 1.3407134071340714, "grad_norm": 0.5661093206697985, "learning_rate": 3.899479886151273e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.11698712408542633, "step": 1090, "valid_targets_mean": 4376.4, "valid_targets_min": 717 }, { "epoch": 1.3468634686346863, "grad_norm": 0.5318111285912578, "learning_rate": 3.89755053904763e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.09042427688837051, "step": 1095, "valid_targets_mean": 3347.5, "valid_targets_min": 1071 }, { "epoch": 1.3530135301353012, "grad_norm": 0.5190037755717483, "learning_rate": 3.8956033384503316e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.1193787157535553, "step": 1100, "valid_targets_mean": 4729.8, "valid_targets_min": 1022 }, { "epoch": 1.3591635916359164, "grad_norm": 0.5604486674251695, "learning_rate": 3.893638302680015e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.11157633364200592, "step": 1105, "valid_targets_mean": 4136.1, "valid_targets_min": 661 }, { "epoch": 1.3653136531365313, "grad_norm": 0.6003489564772163, "learning_rate": 3.891655450225122e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.10691434144973755, "step": 1110, "valid_targets_mean": 3694.1, "valid_targets_min": 729 }, { "epoch": 1.3714637146371464, "grad_norm": 0.5053316489492773, "learning_rate": 3.889654799741728e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.09286430478096008, "step": 1115, "valid_targets_mean": 4077.6, "valid_targets_min": 1772 }, { "epoch": 1.3776137761377614, "grad_norm": 0.5792133242424264, "learning_rate": 3.887636370053363e-05, "loss": 0.2105, "loss_nan_ranks": 0, "loss_rank_avg": 0.08103743195533752, "step": 1120, "valid_targets_mean": 2605.0, "valid_targets_min": 762 }, { "epoch": 1.3837638376383765, "grad_norm": 0.4818886265033423, "learning_rate": 3.885600180150837e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.09132908284664154, "step": 1125, "valid_targets_mean": 4023.1, "valid_targets_min": 982 }, { "epoch": 1.3899138991389914, "grad_norm": 0.5336478954744306, "learning_rate": 3.88354624919206e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.1306639313697815, "step": 1130, "valid_targets_mean": 4328.4, "valid_targets_min": 1666 }, { "epoch": 1.3960639606396064, "grad_norm": 0.572497497167398, "learning_rate": 3.8814745965018636e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.10151968896389008, "step": 1135, "valid_targets_mean": 3521.8, "valid_targets_min": 968 }, { "epoch": 1.4022140221402215, "grad_norm": 0.9625870373835352, "learning_rate": 3.879385241571817e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.07492039352655411, "step": 1140, "valid_targets_mean": 2917.2, "valid_targets_min": 1042 }, { "epoch": 1.4083640836408364, "grad_norm": 0.5710744015592739, "learning_rate": 3.877278204060045e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.0715465098619461, "step": 1145, "valid_targets_mean": 2445.5, "valid_targets_min": 1085 }, { "epoch": 1.4145141451414514, "grad_norm": 0.580727351557091, "learning_rate": 3.875153503791042e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.11731253564357758, "step": 1150, "valid_targets_mean": 3761.8, "valid_targets_min": 1333 }, { "epoch": 1.4206642066420665, "grad_norm": 0.7021363633316672, "learning_rate": 3.873011160755487e-05, "loss": 0.2096, "loss_nan_ranks": 0, "loss_rank_avg": 0.08568359911441803, "step": 1155, "valid_targets_mean": 3474.9, "valid_targets_min": 1050 }, { "epoch": 1.4268142681426814, "grad_norm": 0.46785177504470826, "learning_rate": 3.870851195110054e-05, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.10430695116519928, "step": 1160, "valid_targets_mean": 5682.6, "valid_targets_min": 3450 }, { "epoch": 1.4329643296432963, "grad_norm": 0.4745062875227194, "learning_rate": 3.8686736271772224e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.1187187060713768, "step": 1165, "valid_targets_mean": 5361.2, "valid_targets_min": 879 }, { "epoch": 1.4391143911439115, "grad_norm": 0.5088780895776316, "learning_rate": 3.866478477445088e-05, "loss": 0.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.1163216382265091, "step": 1170, "valid_targets_mean": 5038.2, "valid_targets_min": 996 }, { "epoch": 1.4452644526445264, "grad_norm": 0.5289990236261362, "learning_rate": 3.864265766567167e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.06807369738817215, "step": 1175, "valid_targets_mean": 2729.0, "valid_targets_min": 824 }, { "epoch": 1.4514145141451413, "grad_norm": 0.5502624184439973, "learning_rate": 3.862035515362203e-05, "loss": 0.2066, "loss_nan_ranks": 0, "loss_rank_avg": 0.10798356682062149, "step": 1180, "valid_targets_mean": 3511.1, "valid_targets_min": 1229 }, { "epoch": 1.4575645756457565, "grad_norm": 0.5546713114453061, "learning_rate": 3.8597877448139744e-05, "loss": 0.2161, "loss_nan_ranks": 0, "loss_rank_avg": 0.10588104277849197, "step": 1185, "valid_targets_mean": 3067.6, "valid_targets_min": 1073 }, { "epoch": 1.4637146371463714, "grad_norm": 0.5859881372700351, "learning_rate": 3.857522476071089e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.09349851310253143, "step": 1190, "valid_targets_mean": 3037.6, "valid_targets_min": 909 }, { "epoch": 1.4698646986469865, "grad_norm": 0.49789959170537496, "learning_rate": 3.855239730446795e-05, "loss": 0.1968, "loss_nan_ranks": 0, "loss_rank_avg": 0.1064479872584343, "step": 1195, "valid_targets_mean": 3940.4, "valid_targets_min": 878 }, { "epoch": 1.4760147601476015, "grad_norm": 0.5254927384577484, "learning_rate": 3.852939529418771e-05, "loss": 0.1975, "loss_nan_ranks": 0, "loss_rank_avg": 0.07499948143959045, "step": 1200, "valid_targets_mean": 2803.4, "valid_targets_min": 1249 }, { "epoch": 1.4821648216482166, "grad_norm": 0.4918483613906252, "learning_rate": 3.8506218946289315e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.10088559240102768, "step": 1205, "valid_targets_mean": 4231.8, "valid_targets_min": 792 }, { "epoch": 1.4883148831488315, "grad_norm": 0.4635491453214155, "learning_rate": 3.848286847883219e-05, "loss": 0.2069, "loss_nan_ranks": 0, "loss_rank_avg": 0.08798468858003616, "step": 1210, "valid_targets_mean": 4164.1, "valid_targets_min": 1159 }, { "epoch": 1.4944649446494465, "grad_norm": 0.5467963971768149, "learning_rate": 3.8459344111514e-05, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.12110284715890884, "step": 1215, "valid_targets_mean": 4131.5, "valid_targets_min": 1242 }, { "epoch": 1.5006150061500616, "grad_norm": 0.8727175521600122, "learning_rate": 3.843564606566858e-05, "loss": 0.2108, "loss_nan_ranks": 0, "loss_rank_avg": 0.1183200478553772, "step": 1220, "valid_targets_mean": 2485.9, "valid_targets_min": 913 }, { "epoch": 1.5067650676506765, "grad_norm": 0.5005573987553051, "learning_rate": 3.841177456426386e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.09200870990753174, "step": 1225, "valid_targets_mean": 3835.5, "valid_targets_min": 1320 }, { "epoch": 1.5129151291512914, "grad_norm": 0.5729217543273271, "learning_rate": 3.838772983189975e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.13913193345069885, "step": 1230, "valid_targets_mean": 4432.9, "valid_targets_min": 689 }, { "epoch": 1.5190651906519066, "grad_norm": 0.49925142673285466, "learning_rate": 3.836351209480607e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.08487389981746674, "step": 1235, "valid_targets_mean": 3952.6, "valid_targets_min": 812 }, { "epoch": 1.5252152521525215, "grad_norm": 0.5384277463948903, "learning_rate": 3.833912158084035e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.09497053176164627, "step": 1240, "valid_targets_mean": 3174.6, "valid_targets_min": 901 }, { "epoch": 1.5313653136531364, "grad_norm": 0.4833570030551031, "learning_rate": 3.831455851948576e-05, "loss": 0.1938, "loss_nan_ranks": 0, "loss_rank_avg": 0.11096090078353882, "step": 1245, "valid_targets_mean": 4853.8, "valid_targets_min": 1401 }, { "epoch": 1.5375153751537516, "grad_norm": 0.44419038921149023, "learning_rate": 3.828982314184889e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.05619562417268753, "step": 1250, "valid_targets_mean": 2399.8, "valid_targets_min": 851 }, { "epoch": 1.5436654366543665, "grad_norm": 0.6231540043540117, "learning_rate": 3.826491568065762e-05, "loss": 0.1954, "loss_nan_ranks": 0, "loss_rank_avg": 0.1023961529135704, "step": 1255, "valid_targets_mean": 2622.8, "valid_targets_min": 1085 }, { "epoch": 1.5498154981549814, "grad_norm": 0.49821236161660165, "learning_rate": 3.823983637025892e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.11277259141206741, "step": 1260, "valid_targets_mean": 4299.8, "valid_targets_min": 1190 }, { "epoch": 1.5559655596555966, "grad_norm": 0.4680653424854338, "learning_rate": 3.821458544661662e-05, "loss": 0.2036, "loss_nan_ranks": 0, "loss_rank_avg": 0.0951245054602623, "step": 1265, "valid_targets_mean": 4406.1, "valid_targets_min": 1134 }, { "epoch": 1.5621156211562117, "grad_norm": 0.426786678188967, "learning_rate": 3.818916314730922e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.08958496898412704, "step": 1270, "valid_targets_mean": 5430.9, "valid_targets_min": 1363 }, { "epoch": 1.5682656826568264, "grad_norm": 0.5493640924249626, "learning_rate": 3.816356971152763e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.10626004636287689, "step": 1275, "valid_targets_mean": 3462.8, "valid_targets_min": 655 }, { "epoch": 1.5744157441574416, "grad_norm": 0.5040666290639284, "learning_rate": 3.813780538007295e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.12168212234973907, "step": 1280, "valid_targets_mean": 4491.5, "valid_targets_min": 1484 }, { "epoch": 1.5805658056580567, "grad_norm": 0.5354436593377919, "learning_rate": 3.811187039535419e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.1084877997636795, "step": 1285, "valid_targets_mean": 3328.8, "valid_targets_min": 924 }, { "epoch": 1.5867158671586716, "grad_norm": 0.503196261690315, "learning_rate": 3.808576500138596e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.07113277167081833, "step": 1290, "valid_targets_mean": 2856.4, "valid_targets_min": 815 }, { "epoch": 1.5928659286592866, "grad_norm": 0.5396821477459569, "learning_rate": 3.805948944378622e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.09005014598369598, "step": 1295, "valid_targets_mean": 2599.0, "valid_targets_min": 809 }, { "epoch": 1.5990159901599017, "grad_norm": 0.5528728526078117, "learning_rate": 3.803304396977397e-05, "loss": 0.2049, "loss_nan_ranks": 0, "loss_rank_avg": 0.09361758083105087, "step": 1300, "valid_targets_mean": 3898.5, "valid_targets_min": 960 }, { "epoch": 1.6051660516605166, "grad_norm": 0.46891903930889195, "learning_rate": 3.800642882816684e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.10345235466957092, "step": 1305, "valid_targets_mean": 4713.8, "valid_targets_min": 1492 }, { "epoch": 1.6113161131611315, "grad_norm": 0.5518967813360433, "learning_rate": 3.797964426937888e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.10282796621322632, "step": 1310, "valid_targets_mean": 3685.5, "valid_targets_min": 1206 }, { "epoch": 1.6174661746617467, "grad_norm": 0.5060002126739849, "learning_rate": 3.795269054541809e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.14236804842948914, "step": 1315, "valid_targets_mean": 5181.6, "valid_targets_min": 1364 }, { "epoch": 1.6236162361623616, "grad_norm": 0.5547520161561545, "learning_rate": 3.7925567909884125e-05, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.11089588701725006, "step": 1320, "valid_targets_mean": 3716.6, "valid_targets_min": 1163 }, { "epoch": 1.6297662976629765, "grad_norm": 0.5975968356685399, "learning_rate": 3.789827661796586e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.0989069864153862, "step": 1325, "valid_targets_mean": 2657.9, "valid_targets_min": 1043 }, { "epoch": 1.6359163591635917, "grad_norm": 0.49298477710698163, "learning_rate": 3.787081692643902e-05, "loss": 0.2067, "loss_nan_ranks": 0, "loss_rank_avg": 0.1150115504860878, "step": 1330, "valid_targets_mean": 5553.1, "valid_targets_min": 987 }, { "epoch": 1.6420664206642066, "grad_norm": 0.4785087045601313, "learning_rate": 3.784318909366375e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.07596011459827423, "step": 1335, "valid_targets_mean": 3686.5, "valid_targets_min": 796 }, { "epoch": 1.6482164821648215, "grad_norm": 0.9735561067648053, "learning_rate": 3.781539337958219e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.11845865845680237, "step": 1340, "valid_targets_mean": 4059.6, "valid_targets_min": 716 }, { "epoch": 1.6543665436654367, "grad_norm": 0.48313444194883975, "learning_rate": 3.7787430045716e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.08939701318740845, "step": 1345, "valid_targets_mean": 4065.6, "valid_targets_min": 1380 }, { "epoch": 1.6605166051660518, "grad_norm": 0.5296674373271556, "learning_rate": 3.775929935516396e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.09042255580425262, "step": 1350, "valid_targets_mean": 3754.2, "valid_targets_min": 728 }, { "epoch": 1.6666666666666665, "grad_norm": 0.501936654372202, "learning_rate": 3.773100157259945e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.10522586107254028, "step": 1355, "valid_targets_mean": 4155.0, "valid_targets_min": 822 }, { "epoch": 1.6728167281672817, "grad_norm": 0.4968330680618515, "learning_rate": 3.7702536964267944e-05, "loss": 0.1993, "loss_nan_ranks": 0, "loss_rank_avg": 0.1146087795495987, "step": 1360, "valid_targets_mean": 4046.8, "valid_targets_min": 809 }, { "epoch": 1.6789667896678968, "grad_norm": 0.5595402782397794, "learning_rate": 3.767390579798456e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.08506064116954803, "step": 1365, "valid_targets_mean": 2417.2, "valid_targets_min": 629 }, { "epoch": 1.6851168511685117, "grad_norm": 0.48880821787298084, "learning_rate": 3.764510834313152e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.1252322793006897, "step": 1370, "valid_targets_mean": 5895.0, "valid_targets_min": 847 }, { "epoch": 1.6912669126691267, "grad_norm": 0.5050145314206561, "learning_rate": 3.761614487065556e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.09901121258735657, "step": 1375, "valid_targets_mean": 4068.0, "valid_targets_min": 933 }, { "epoch": 1.6974169741697418, "grad_norm": 0.5949004284187435, "learning_rate": 3.758701565306547e-05, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.07950301468372345, "step": 1380, "valid_targets_mean": 2436.5, "valid_targets_min": 869 }, { "epoch": 1.7035670356703567, "grad_norm": 0.5346712803424558, "learning_rate": 3.7557720964429473e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.1618548035621643, "step": 1385, "valid_targets_mean": 3668.6, "valid_targets_min": 619 }, { "epoch": 1.7097170971709716, "grad_norm": 0.47722162028924653, "learning_rate": 3.752826108037266e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.10579360276460648, "step": 1390, "valid_targets_mean": 4692.4, "valid_targets_min": 1104 }, { "epoch": 1.7158671586715868, "grad_norm": 0.6577604646961259, "learning_rate": 3.7498636278074376e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.10559843480587006, "step": 1395, "valid_targets_mean": 4804.1, "valid_targets_min": 740 }, { "epoch": 1.7220172201722017, "grad_norm": 0.6896510510145436, "learning_rate": 3.746884683626567e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.10995135456323624, "step": 1400, "valid_targets_mean": 2253.2, "valid_targets_min": 791 }, { "epoch": 1.7281672816728166, "grad_norm": 0.45844108471788086, "learning_rate": 3.7438893035226615e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.09560881555080414, "step": 1405, "valid_targets_mean": 5043.2, "valid_targets_min": 739 }, { "epoch": 1.7343173431734318, "grad_norm": 0.47496112767282045, "learning_rate": 3.7408775156783696e-05, "loss": 0.2042, "loss_nan_ranks": 0, "loss_rank_avg": 0.0626043751835823, "step": 1410, "valid_targets_mean": 2590.8, "valid_targets_min": 835 }, { "epoch": 1.7404674046740467, "grad_norm": 0.6188065748950373, "learning_rate": 3.737849348430716e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.08986514806747437, "step": 1415, "valid_targets_mean": 2038.0, "valid_targets_min": 1018 }, { "epoch": 1.7466174661746616, "grad_norm": 0.5260988430934506, "learning_rate": 3.7348048302708325e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.048175595700740814, "step": 1420, "valid_targets_mean": 1722.9, "valid_targets_min": 657 }, { "epoch": 1.7527675276752768, "grad_norm": 0.48641738114128835, "learning_rate": 3.7317439898436934e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.07783234119415283, "step": 1425, "valid_targets_mean": 3405.0, "valid_targets_min": 911 }, { "epoch": 1.758917589175892, "grad_norm": 0.6043799620806836, "learning_rate": 3.728666855947844e-05, "loss": 0.2028, "loss_nan_ranks": 0, "loss_rank_avg": 0.09733516722917557, "step": 1430, "valid_targets_mean": 2843.6, "valid_targets_min": 1302 }, { "epoch": 1.7650676506765066, "grad_norm": 0.47616042389950425, "learning_rate": 3.72557345753513e-05, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.11222381889820099, "step": 1435, "valid_targets_mean": 5592.2, "valid_targets_min": 1147 }, { "epoch": 1.7712177121771218, "grad_norm": 0.5356638323920245, "learning_rate": 3.7224638237104254e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.09824912250041962, "step": 1440, "valid_targets_mean": 3397.1, "valid_targets_min": 1031 }, { "epoch": 1.777367773677737, "grad_norm": 0.4940236303170333, "learning_rate": 3.719337983731358e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.10997024178504944, "step": 1445, "valid_targets_mean": 3770.8, "valid_targets_min": 1087 }, { "epoch": 1.7835178351783518, "grad_norm": 0.6126065018305925, "learning_rate": 3.716195967008035e-05, "loss": 0.1975, "loss_nan_ranks": 0, "loss_rank_avg": 0.0981617420911789, "step": 1450, "valid_targets_mean": 2462.4, "valid_targets_min": 1168 }, { "epoch": 1.7896678966789668, "grad_norm": 0.6751630731854735, "learning_rate": 3.713037803102764e-05, "loss": 0.2037, "loss_nan_ranks": 0, "loss_rank_avg": 0.06809885054826736, "step": 1455, "valid_targets_mean": 1932.5, "valid_targets_min": 1098 }, { "epoch": 1.795817958179582, "grad_norm": 0.5140172612774082, "learning_rate": 3.709863521729781e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.1045265644788742, "step": 1460, "valid_targets_mean": 3631.9, "valid_targets_min": 1462 }, { "epoch": 1.8019680196801968, "grad_norm": 0.5042408872022428, "learning_rate": 3.7066731527549616e-05, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.10661792755126953, "step": 1465, "valid_targets_mean": 4541.1, "valid_targets_min": 572 }, { "epoch": 1.8081180811808117, "grad_norm": 0.5595314361622906, "learning_rate": 3.703466726195547e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.12330175936222076, "step": 1470, "valid_targets_mean": 4489.2, "valid_targets_min": 1046 }, { "epoch": 1.8142681426814269, "grad_norm": 0.45685905233793006, "learning_rate": 3.7002442722198605e-05, "loss": 0.204, "loss_nan_ranks": 0, "loss_rank_avg": 0.09649819880723953, "step": 1475, "valid_targets_mean": 4542.2, "valid_targets_min": 1086 }, { "epoch": 1.8204182041820418, "grad_norm": 0.5031768523848916, "learning_rate": 3.6970058211470224e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.10478343069553375, "step": 1480, "valid_targets_mean": 4728.8, "valid_targets_min": 806 }, { "epoch": 1.8265682656826567, "grad_norm": 0.42532934954842594, "learning_rate": 3.693751403446662e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.08650326728820801, "step": 1485, "valid_targets_mean": 4036.0, "valid_targets_min": 917 }, { "epoch": 1.8327183271832719, "grad_norm": 0.5832130915144736, "learning_rate": 3.6904810497386366e-05, "loss": 0.2069, "loss_nan_ranks": 0, "loss_rank_avg": 0.10903920233249664, "step": 1490, "valid_targets_mean": 2777.5, "valid_targets_min": 930 }, { "epoch": 1.8388683886838868, "grad_norm": 0.5029643540034519, "learning_rate": 3.687194790792742e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.10596004128456116, "step": 1495, "valid_targets_mean": 3624.2, "valid_targets_min": 807 }, { "epoch": 1.8450184501845017, "grad_norm": 0.4948422791768945, "learning_rate": 3.683892657528418e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.13056054711341858, "step": 1500, "valid_targets_mean": 4737.4, "valid_targets_min": 1629 }, { "epoch": 1.8511685116851169, "grad_norm": 0.5950735101917919, "learning_rate": 3.680574681014463e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.09535035490989685, "step": 1505, "valid_targets_mean": 3788.2, "valid_targets_min": 1408 }, { "epoch": 1.857318573185732, "grad_norm": 0.5084588855367531, "learning_rate": 3.677240892468741e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.07698500156402588, "step": 1510, "valid_targets_mean": 2796.6, "valid_targets_min": 888 }, { "epoch": 1.8634686346863467, "grad_norm": 0.4726816423976889, "learning_rate": 3.673891323257886e-05, "loss": 0.1973, "loss_nan_ranks": 0, "loss_rank_avg": 0.11065435409545898, "step": 1515, "valid_targets_mean": 4451.4, "valid_targets_min": 1364 }, { "epoch": 1.8696186961869619, "grad_norm": 0.5189172903016105, "learning_rate": 3.670526004897006e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.07834093272686005, "step": 1520, "valid_targets_mean": 3034.5, "valid_targets_min": 1061 }, { "epoch": 1.875768757687577, "grad_norm": 0.5290905994514233, "learning_rate": 3.6671449690493896e-05, "loss": 0.1987, "loss_nan_ranks": 0, "loss_rank_avg": 0.07623681426048279, "step": 1525, "valid_targets_mean": 2919.0, "valid_targets_min": 790 }, { "epoch": 1.881918819188192, "grad_norm": 0.477147164336205, "learning_rate": 3.6637482475262076e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.06917934864759445, "step": 1530, "valid_targets_mean": 3360.8, "valid_targets_min": 849 }, { "epoch": 1.8880688806888068, "grad_norm": 0.4762516294245979, "learning_rate": 3.6603358722862106e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.14056900143623352, "step": 1535, "valid_targets_mean": 5183.1, "valid_targets_min": 1242 }, { "epoch": 1.894218942189422, "grad_norm": 0.524911522240793, "learning_rate": 3.656907875435432e-05, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.07982973754405975, "step": 1540, "valid_targets_mean": 2392.1, "valid_targets_min": 937 }, { "epoch": 1.900369003690037, "grad_norm": 0.4747394707858542, "learning_rate": 3.653464289226882e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.10742057114839554, "step": 1545, "valid_targets_mean": 4995.4, "valid_targets_min": 1278 }, { "epoch": 1.9065190651906518, "grad_norm": 0.5900867879081909, "learning_rate": 3.6500051460602496e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.1337573528289795, "step": 1550, "valid_targets_mean": 5394.8, "valid_targets_min": 1697 }, { "epoch": 1.912669126691267, "grad_norm": 0.5127809538868972, "learning_rate": 3.6465304784815927e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.09060677140951157, "step": 1555, "valid_targets_mean": 2900.6, "valid_targets_min": 1038 }, { "epoch": 1.918819188191882, "grad_norm": 0.5142732827884361, "learning_rate": 3.643040319183035e-05, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.11093857884407043, "step": 1560, "valid_targets_mean": 4138.8, "valid_targets_min": 1332 }, { "epoch": 1.9249692496924968, "grad_norm": 0.5023289283424182, "learning_rate": 3.639534701002455e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.10212238132953644, "step": 1565, "valid_targets_mean": 3121.2, "valid_targets_min": 1184 }, { "epoch": 1.931119311193112, "grad_norm": 0.45011497746244516, "learning_rate": 3.636013656923182e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.08078508079051971, "step": 1570, "valid_targets_mean": 3689.2, "valid_targets_min": 914 }, { "epoch": 1.937269372693727, "grad_norm": 0.5178600546338055, "learning_rate": 3.632477220073681e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.09905163198709488, "step": 1575, "valid_targets_mean": 3351.5, "valid_targets_min": 992 }, { "epoch": 1.9434194341943418, "grad_norm": 0.4628126119613772, "learning_rate": 3.6289254237272454e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.09697072952985764, "step": 1580, "valid_targets_mean": 4569.1, "valid_targets_min": 1105 }, { "epoch": 1.949569495694957, "grad_norm": 0.5093051065653287, "learning_rate": 3.625358301301678e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.07729291915893555, "step": 1585, "valid_targets_mean": 3356.6, "valid_targets_min": 548 }, { "epoch": 1.9557195571955721, "grad_norm": 0.45666457647505343, "learning_rate": 3.621775886358983e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.06966480612754822, "step": 1590, "valid_targets_mean": 2683.8, "valid_targets_min": 1240 }, { "epoch": 1.9618696186961868, "grad_norm": 0.4937970822194384, "learning_rate": 3.618178212605046e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.038976266980171204, "step": 1595, "valid_targets_mean": 1423.8, "valid_targets_min": 705 }, { "epoch": 1.968019680196802, "grad_norm": 0.4582674110900814, "learning_rate": 3.614565313889321e-05, "loss": 0.1989, "loss_nan_ranks": 0, "loss_rank_avg": 0.10724746435880661, "step": 1600, "valid_targets_mean": 4829.1, "valid_targets_min": 1116 }, { "epoch": 1.974169741697417, "grad_norm": 0.5105452760966861, "learning_rate": 3.610937224204504e-05, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.10440842807292938, "step": 1605, "valid_targets_mean": 4159.0, "valid_targets_min": 625 }, { "epoch": 1.980319803198032, "grad_norm": 0.4565982688896811, "learning_rate": 3.6072939776862236e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.13977614045143127, "step": 1610, "valid_targets_mean": 5577.5, "valid_targets_min": 1347 }, { "epoch": 1.986469864698647, "grad_norm": 0.4874558353893182, "learning_rate": 3.603635608612711e-05, "loss": 0.1912, "loss_nan_ranks": 0, "loss_rank_avg": 0.10176213085651398, "step": 1615, "valid_targets_mean": 4424.8, "valid_targets_min": 1345 }, { "epoch": 1.992619926199262, "grad_norm": 0.4757483167596365, "learning_rate": 3.5999621514044825e-05, "loss": 0.2036, "loss_nan_ranks": 0, "loss_rank_avg": 0.14148062467575073, "step": 1620, "valid_targets_mean": 5153.4, "valid_targets_min": 974 }, { "epoch": 1.998769987699877, "grad_norm": 0.6126351657242327, "learning_rate": 3.596273640624015e-05, "loss": 0.2181, "loss_nan_ranks": 0, "loss_rank_avg": 0.09883184731006622, "step": 1625, "valid_targets_mean": 2404.1, "valid_targets_min": 793 }, { "epoch": 2.004920049200492, "grad_norm": 0.5243077165247066, "learning_rate": 3.592570110975419e-05, "loss": 0.1777, "loss_nan_ranks": 0, "loss_rank_avg": 0.11883203685283661, "step": 1630, "valid_targets_mean": 3816.8, "valid_targets_min": 1002 }, { "epoch": 2.011070110701107, "grad_norm": 0.4173052631338242, "learning_rate": 3.588851597304112e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.07014939188957214, "step": 1635, "valid_targets_mean": 5814.2, "valid_targets_min": 1920 }, { "epoch": 2.0172201722017222, "grad_norm": 0.5920676478092707, "learning_rate": 3.585118134596494e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.09625989198684692, "step": 1640, "valid_targets_mean": 2566.2, "valid_targets_min": 957 }, { "epoch": 2.023370233702337, "grad_norm": 0.6024734912141144, "learning_rate": 3.5813697579796144e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.06967133283615112, "step": 1645, "valid_targets_mean": 3114.9, "valid_targets_min": 797 }, { "epoch": 2.029520295202952, "grad_norm": 0.5438114156989086, "learning_rate": 3.577606502720845e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.11378873884677887, "step": 1650, "valid_targets_mean": 4084.4, "valid_targets_min": 613 }, { "epoch": 2.035670356703567, "grad_norm": 0.5918035290139211, "learning_rate": 3.5738284042275434e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.1081269234418869, "step": 1655, "valid_targets_mean": 3336.6, "valid_targets_min": 632 }, { "epoch": 2.041820418204182, "grad_norm": 0.4444849944204281, "learning_rate": 3.570035498046727e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.1056932806968689, "step": 1660, "valid_targets_mean": 5827.1, "valid_targets_min": 887 }, { "epoch": 2.047970479704797, "grad_norm": 0.5225839419367659, "learning_rate": 3.566227819864729e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.07713170349597931, "step": 1665, "valid_targets_mean": 3526.6, "valid_targets_min": 783 }, { "epoch": 2.054120541205412, "grad_norm": 0.46616326608373404, "learning_rate": 3.562405405506874e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.0829431414604187, "step": 1670, "valid_targets_mean": 4568.4, "valid_targets_min": 893 }, { "epoch": 2.060270602706027, "grad_norm": 0.5123653624604934, "learning_rate": 3.55856829093713e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.07135461270809174, "step": 1675, "valid_targets_mean": 2873.1, "valid_targets_min": 745 }, { "epoch": 2.066420664206642, "grad_norm": 0.46854159304991505, "learning_rate": 3.5547165122577765e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.08598525077104568, "step": 1680, "valid_targets_mean": 4960.9, "valid_targets_min": 2186 }, { "epoch": 2.072570725707257, "grad_norm": 0.6258528484595688, "learning_rate": 3.5508501057090654e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.0794835016131401, "step": 1685, "valid_targets_mean": 4042.2, "valid_targets_min": 847 }, { "epoch": 2.078720787207872, "grad_norm": 0.45706630966983675, "learning_rate": 3.546969107668875e-05, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.10448753833770752, "step": 1690, "valid_targets_mean": 5523.4, "valid_targets_min": 1266 }, { "epoch": 2.084870848708487, "grad_norm": 0.534873213357355, "learning_rate": 3.543073554652372e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.1391887068748474, "step": 1695, "valid_targets_mean": 4543.2, "valid_targets_min": 615 }, { "epoch": 2.091020910209102, "grad_norm": 0.4582733490763445, "learning_rate": 3.5391634833116665e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.0811735987663269, "step": 1700, "valid_targets_mean": 4539.9, "valid_targets_min": 1198 }, { "epoch": 2.097170971709717, "grad_norm": 0.4937893118285565, "learning_rate": 3.5352389304354666e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.0982910543680191, "step": 1705, "valid_targets_mean": 5020.0, "valid_targets_min": 1932 }, { "epoch": 2.103321033210332, "grad_norm": 0.6053975754609369, "learning_rate": 3.531299932948735e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.0896589457988739, "step": 1710, "valid_targets_mean": 2514.2, "valid_targets_min": 684 }, { "epoch": 2.109471094710947, "grad_norm": 0.589391928848343, "learning_rate": 3.527346527912336e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.10648193210363388, "step": 1715, "valid_targets_mean": 3808.4, "valid_targets_min": 1278 }, { "epoch": 2.1156211562115623, "grad_norm": 0.621704460884244, "learning_rate": 3.523378752522693e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.057993847876787186, "step": 1720, "valid_targets_mean": 1930.9, "valid_targets_min": 1020 }, { "epoch": 2.121771217712177, "grad_norm": 0.5218271734942508, "learning_rate": 3.5193966441114345e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.09666042774915695, "step": 1725, "valid_targets_mean": 4095.9, "valid_targets_min": 992 }, { "epoch": 2.127921279212792, "grad_norm": 0.46328958118763347, "learning_rate": 3.515400240145046e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.08929213136434555, "step": 1730, "valid_targets_mean": 4731.5, "valid_targets_min": 853 }, { "epoch": 2.1340713407134073, "grad_norm": 0.5262376367081194, "learning_rate": 3.5113895782245134e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.09835997223854065, "step": 1735, "valid_targets_mean": 4514.0, "valid_targets_min": 930 }, { "epoch": 2.140221402214022, "grad_norm": 0.5505041291299339, "learning_rate": 3.507364696084972e-05, "loss": 0.1851, "loss_nan_ranks": 0, "loss_rank_avg": 0.06782595068216324, "step": 1740, "valid_targets_mean": 2526.9, "valid_targets_min": 936 }, { "epoch": 2.146371463714637, "grad_norm": 0.626362440819134, "learning_rate": 3.503325631595352e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.119917131960392, "step": 1745, "valid_targets_mean": 3010.5, "valid_targets_min": 564 }, { "epoch": 2.1525215252152523, "grad_norm": 0.5262475327597472, "learning_rate": 3.49927242275802e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.10288462042808533, "step": 1750, "valid_targets_mean": 3660.6, "valid_targets_min": 913 }, { "epoch": 2.158671586715867, "grad_norm": 1.5639629641041328, "learning_rate": 3.495205107708425e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.07738654315471649, "step": 1755, "valid_targets_mean": 2947.2, "valid_targets_min": 1511 }, { "epoch": 2.164821648216482, "grad_norm": 0.5191092489134466, "learning_rate": 3.491123724714733e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.10357122123241425, "step": 1760, "valid_targets_mean": 3593.0, "valid_targets_min": 1156 }, { "epoch": 2.1709717097170973, "grad_norm": 0.6215664360999175, "learning_rate": 3.4870283121774746e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.10146811604499817, "step": 1765, "valid_targets_mean": 3114.8, "valid_targets_min": 1295 }, { "epoch": 2.177121771217712, "grad_norm": 0.5196366914731959, "learning_rate": 3.4829189086291785e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.06479023396968842, "step": 1770, "valid_targets_mean": 3533.8, "valid_targets_min": 739 }, { "epoch": 2.183271832718327, "grad_norm": 0.5289026028254815, "learning_rate": 3.478795552734012e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.08850535750389099, "step": 1775, "valid_targets_mean": 3198.8, "valid_targets_min": 567 }, { "epoch": 2.1894218942189423, "grad_norm": 0.48223754387106, "learning_rate": 3.474658283287414e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.12505097687244415, "step": 1780, "valid_targets_mean": 5906.9, "valid_targets_min": 4099 }, { "epoch": 2.195571955719557, "grad_norm": 0.47498236361568363, "learning_rate": 3.470507139215735e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.07444043457508087, "step": 1785, "valid_targets_mean": 3798.5, "valid_targets_min": 993 }, { "epoch": 2.201722017220172, "grad_norm": 0.4824888535185058, "learning_rate": 3.4663421595758646e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.10236834734678268, "step": 1790, "valid_targets_mean": 4214.4, "valid_targets_min": 881 }, { "epoch": 2.2078720787207873, "grad_norm": 0.49368939832945224, "learning_rate": 3.462163383554868e-05, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.06503598392009735, "step": 1795, "valid_targets_mean": 3193.1, "valid_targets_min": 882 }, { "epoch": 2.2140221402214024, "grad_norm": 0.5289486643460859, "learning_rate": 3.457970850469619e-05, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.06786412745714188, "step": 1800, "valid_targets_mean": 2628.6, "valid_targets_min": 782 }, { "epoch": 2.220172201722017, "grad_norm": 0.4739542781466288, "learning_rate": 3.453764599766424e-05, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.09068910777568817, "step": 1805, "valid_targets_mean": 3949.4, "valid_targets_min": 1019 }, { "epoch": 2.2263222632226323, "grad_norm": 0.5142497198048981, "learning_rate": 3.449544671020655e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.07851199805736542, "step": 1810, "valid_targets_mean": 4175.1, "valid_targets_min": 641 }, { "epoch": 2.2324723247232474, "grad_norm": 0.4539031477350509, "learning_rate": 3.44531110393638e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.10548322647809982, "step": 1815, "valid_targets_mean": 5639.8, "valid_targets_min": 963 }, { "epoch": 2.238622386223862, "grad_norm": 0.5403891290572767, "learning_rate": 3.441063938345982e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.08264362812042236, "step": 1820, "valid_targets_mean": 2898.1, "valid_targets_min": 656 }, { "epoch": 2.2447724477244773, "grad_norm": 0.49720882879305345, "learning_rate": 3.43680321420979e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.08277932554483414, "step": 1825, "valid_targets_mean": 4421.4, "valid_targets_min": 739 }, { "epoch": 2.2509225092250924, "grad_norm": 0.44661121875999416, "learning_rate": 3.432528971615702e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.09439855813980103, "step": 1830, "valid_targets_mean": 5139.5, "valid_targets_min": 1585 }, { "epoch": 2.257072570725707, "grad_norm": 0.5104457694682429, "learning_rate": 3.428241250778807e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.0804177075624466, "step": 1835, "valid_targets_mean": 2974.8, "valid_targets_min": 908 }, { "epoch": 2.2632226322263223, "grad_norm": 0.5164552600869374, "learning_rate": 3.423940092041005e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.08347299695014954, "step": 1840, "valid_targets_mean": 4309.0, "valid_targets_min": 1170 }, { "epoch": 2.2693726937269374, "grad_norm": 0.5111882731172788, "learning_rate": 3.4196255358706324e-05, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.07734288275241852, "step": 1845, "valid_targets_mean": 2717.6, "valid_targets_min": 668 }, { "epoch": 2.275522755227552, "grad_norm": 0.5329146839450533, "learning_rate": 3.415297622862075e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.12941431999206543, "step": 1850, "valid_targets_mean": 5433.4, "valid_targets_min": 1278 }, { "epoch": 2.2816728167281672, "grad_norm": 0.5402654149001758, "learning_rate": 3.410956393735391e-05, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.08417652547359467, "step": 1855, "valid_targets_mean": 3604.5, "valid_targets_min": 875 }, { "epoch": 2.2878228782287824, "grad_norm": 0.50683716176892, "learning_rate": 3.406601889335926e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.12431508302688599, "step": 1860, "valid_targets_mean": 5270.0, "valid_targets_min": 1533 }, { "epoch": 2.2939729397293975, "grad_norm": 0.4956489408049929, "learning_rate": 3.4022341506339274e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.08791838586330414, "step": 1865, "valid_targets_mean": 3060.8, "valid_targets_min": 958 }, { "epoch": 2.3001230012300122, "grad_norm": 0.5017188163980323, "learning_rate": 3.3978532187241614e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.09323479235172272, "step": 1870, "valid_targets_mean": 3938.6, "valid_targets_min": 724 }, { "epoch": 2.3062730627306274, "grad_norm": 0.5066996834210351, "learning_rate": 3.3934591348255246e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.0862000435590744, "step": 1875, "valid_targets_mean": 4162.0, "valid_targets_min": 549 }, { "epoch": 2.312423124231242, "grad_norm": 0.5158665171775458, "learning_rate": 3.389051940280658e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.08762037009000778, "step": 1880, "valid_targets_mean": 3430.1, "valid_targets_min": 1529 }, { "epoch": 2.3185731857318572, "grad_norm": 0.4996497785866437, "learning_rate": 3.384631676555556e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.1017792820930481, "step": 1885, "valid_targets_mean": 4760.0, "valid_targets_min": 1181 }, { "epoch": 2.3247232472324724, "grad_norm": 0.47518671427713155, "learning_rate": 3.380198385239175e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.10088784992694855, "step": 1890, "valid_targets_mean": 4937.2, "valid_targets_min": 781 }, { "epoch": 2.3308733087330875, "grad_norm": 0.48984155868767715, "learning_rate": 3.375752108043048e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.10612259805202484, "step": 1895, "valid_targets_mean": 4649.6, "valid_targets_min": 786 }, { "epoch": 2.337023370233702, "grad_norm": 0.45775890721910284, "learning_rate": 3.371292886800886e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.0842120349407196, "step": 1900, "valid_targets_mean": 4092.5, "valid_targets_min": 776 }, { "epoch": 2.3431734317343174, "grad_norm": 0.6598274027850817, "learning_rate": 3.366820763468187e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.10250968486070633, "step": 1905, "valid_targets_mean": 2989.2, "valid_targets_min": 810 }, { "epoch": 2.3493234932349325, "grad_norm": 0.5967373414003015, "learning_rate": 3.3623357801218415e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.10870860517024994, "step": 1910, "valid_targets_mean": 2967.1, "valid_targets_min": 957 }, { "epoch": 2.355473554735547, "grad_norm": 0.5575394127561428, "learning_rate": 3.357837978959735e-05, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.09510388225317001, "step": 1915, "valid_targets_mean": 3234.8, "valid_targets_min": 955 }, { "epoch": 2.3616236162361623, "grad_norm": 0.46154437452355346, "learning_rate": 3.353327402300353e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.07429394870996475, "step": 1920, "valid_targets_mean": 3559.4, "valid_targets_min": 1075 }, { "epoch": 2.3677736777367775, "grad_norm": 0.5408034876436789, "learning_rate": 3.348804092582382e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.08712077140808105, "step": 1925, "valid_targets_mean": 3194.0, "valid_targets_min": 1197 }, { "epoch": 2.373923739237392, "grad_norm": 0.465802765546518, "learning_rate": 3.344268092364311e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.06669642776250839, "step": 1930, "valid_targets_mean": 2905.9, "valid_targets_min": 746 }, { "epoch": 2.3800738007380073, "grad_norm": 0.48733118195245584, "learning_rate": 3.3397194443240255e-05, "loss": 0.1777, "loss_nan_ranks": 0, "loss_rank_avg": 0.0931989774107933, "step": 1935, "valid_targets_mean": 4740.1, "valid_targets_min": 682 }, { "epoch": 2.3862238622386225, "grad_norm": 0.49408351184281923, "learning_rate": 3.3351581912584165e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.10559767484664917, "step": 1940, "valid_targets_mean": 4967.0, "valid_targets_min": 744 }, { "epoch": 2.392373923739237, "grad_norm": 0.46608584427402655, "learning_rate": 3.330584376082969e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.07794773578643799, "step": 1945, "valid_targets_mean": 3437.2, "valid_targets_min": 1141 }, { "epoch": 2.3985239852398523, "grad_norm": 0.5566159825639682, "learning_rate": 3.3259980418313627e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.08732946217060089, "step": 1950, "valid_targets_mean": 3032.6, "valid_targets_min": 704 }, { "epoch": 2.4046740467404675, "grad_norm": 0.6317169801431017, "learning_rate": 3.321399231655063e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.07550832629203796, "step": 1955, "valid_targets_mean": 2734.6, "valid_targets_min": 805 }, { "epoch": 2.4108241082410826, "grad_norm": 0.5578507572793279, "learning_rate": 3.3167879888229195e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.06913506984710693, "step": 1960, "valid_targets_mean": 1947.5, "valid_targets_min": 916 }, { "epoch": 2.4169741697416973, "grad_norm": 0.5776692228993966, "learning_rate": 3.312164356720757e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.09849021583795547, "step": 1965, "valid_targets_mean": 2952.2, "valid_targets_min": 615 }, { "epoch": 2.4231242312423125, "grad_norm": 0.6006794962255738, "learning_rate": 3.307528378850967e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.10083635151386261, "step": 1970, "valid_targets_mean": 3884.2, "valid_targets_min": 1306 }, { "epoch": 2.4292742927429276, "grad_norm": 0.5226470537922095, "learning_rate": 3.3028800988320995e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.07776734232902527, "step": 1975, "valid_targets_mean": 3161.1, "valid_targets_min": 1177 }, { "epoch": 2.4354243542435423, "grad_norm": 0.4782877992750988, "learning_rate": 3.298219560398449e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.06971317529678345, "step": 1980, "valid_targets_mean": 3718.8, "valid_targets_min": 870 }, { "epoch": 2.4415744157441575, "grad_norm": 0.4559598020815533, "learning_rate": 3.2935468073996496e-05, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.09818018972873688, "step": 1985, "valid_targets_mean": 4419.2, "valid_targets_min": 1652 }, { "epoch": 2.4477244772447726, "grad_norm": 0.505435822689401, "learning_rate": 3.288861883800255e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.06142653152346611, "step": 1990, "valid_targets_mean": 2591.2, "valid_targets_min": 1245 }, { "epoch": 2.4538745387453873, "grad_norm": 0.5222476550001706, "learning_rate": 3.284164833679332e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.08206497132778168, "step": 1995, "valid_targets_mean": 3462.0, "valid_targets_min": 930 }, { "epoch": 2.4600246002460024, "grad_norm": 0.4832843978844827, "learning_rate": 3.2794557012300404e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.08409826457500458, "step": 2000, "valid_targets_mean": 4188.4, "valid_targets_min": 635 }, { "epoch": 2.4661746617466176, "grad_norm": 0.5408692480553025, "learning_rate": 3.274734530759219e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.11485058069229126, "step": 2005, "valid_targets_mean": 3784.5, "valid_targets_min": 1284 }, { "epoch": 2.4723247232472323, "grad_norm": 0.43419425416737284, "learning_rate": 3.270001366686968e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.10403525084257126, "step": 2010, "valid_targets_mean": 5663.1, "valid_targets_min": 1374 }, { "epoch": 2.4784747847478474, "grad_norm": 0.5299308496182256, "learning_rate": 3.265256253546234e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.07585825026035309, "step": 2015, "valid_targets_mean": 3291.1, "valid_targets_min": 611 }, { "epoch": 2.4846248462484626, "grad_norm": 1.0792016068091295, "learning_rate": 3.260499235982388e-05, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.10445999354124069, "step": 2020, "valid_targets_mean": 3832.1, "valid_targets_min": 770 }, { "epoch": 2.4907749077490777, "grad_norm": 0.698986045921313, "learning_rate": 3.255730358752804e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.08058764040470123, "step": 2025, "valid_targets_mean": 3242.8, "valid_targets_min": 703 }, { "epoch": 2.4969249692496924, "grad_norm": 0.546362476730347, "learning_rate": 3.2509496667264455e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.06084280461072922, "step": 2030, "valid_targets_mean": 2335.9, "valid_targets_min": 849 }, { "epoch": 2.5030750307503076, "grad_norm": 0.6423068881273603, "learning_rate": 3.2461572048834313e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.0933295264840126, "step": 2035, "valid_targets_mean": 3781.5, "valid_targets_min": 795 }, { "epoch": 2.5092250922509223, "grad_norm": 0.5495734572149842, "learning_rate": 3.241353018314624e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.10316911339759827, "step": 2040, "valid_targets_mean": 3266.0, "valid_targets_min": 1061 }, { "epoch": 2.5153751537515374, "grad_norm": 0.4876568470159601, "learning_rate": 3.236537152221198e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.08447950333356857, "step": 2045, "valid_targets_mean": 4142.5, "valid_targets_min": 938 }, { "epoch": 2.5215252152521526, "grad_norm": 0.5051448004297999, "learning_rate": 3.2317096519142175e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.075490802526474, "step": 2050, "valid_targets_mean": 2780.2, "valid_targets_min": 567 }, { "epoch": 2.5276752767527677, "grad_norm": 0.45950658313208836, "learning_rate": 3.22687056281421e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.08851166814565659, "step": 2055, "valid_targets_mean": 4858.0, "valid_targets_min": 504 }, { "epoch": 2.5338253382533824, "grad_norm": 0.5400123267642455, "learning_rate": 3.222019930450739e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.06616988778114319, "step": 2060, "valid_targets_mean": 2311.4, "valid_targets_min": 1105 }, { "epoch": 2.5399753997539976, "grad_norm": 0.5837630632081082, "learning_rate": 3.217157800461975e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.09007904678583145, "step": 2065, "valid_targets_mean": 3383.2, "valid_targets_min": 716 }, { "epoch": 2.5461254612546127, "grad_norm": 0.45828178011795273, "learning_rate": 3.212284218594264e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.1027955710887909, "step": 2070, "valid_targets_mean": 4865.9, "valid_targets_min": 791 }, { "epoch": 2.5522755227552274, "grad_norm": 0.4841594574033935, "learning_rate": 3.207399230701702e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.08975324779748917, "step": 2075, "valid_targets_mean": 4866.8, "valid_targets_min": 1036 }, { "epoch": 2.5584255842558425, "grad_norm": 0.48863970800326134, "learning_rate": 3.202502882745701e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.09955969452857971, "step": 2080, "valid_targets_mean": 3850.4, "valid_targets_min": 902 }, { "epoch": 2.5645756457564577, "grad_norm": 0.5776030035793362, "learning_rate": 3.197595220794554e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.0664263665676117, "step": 2085, "valid_targets_mean": 3681.8, "valid_targets_min": 740 }, { "epoch": 2.570725707257073, "grad_norm": 0.5664997351084213, "learning_rate": 3.192676291023006e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.09068871289491653, "step": 2090, "valid_targets_mean": 3820.2, "valid_targets_min": 309 }, { "epoch": 2.5768757687576875, "grad_norm": 0.5911403025393728, "learning_rate": 3.187746139711818e-05, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.05383612588047981, "step": 2095, "valid_targets_mean": 1794.6, "valid_targets_min": 585 }, { "epoch": 2.5830258302583027, "grad_norm": 0.5749723511725446, "learning_rate": 3.1828048132473295e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.06191668286919594, "step": 2100, "valid_targets_mean": 2664.1, "valid_targets_min": 1080 }, { "epoch": 2.5891758917589174, "grad_norm": 0.5447755200027713, "learning_rate": 3.1778523581210255e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.1104673445224762, "step": 2105, "valid_targets_mean": 4234.9, "valid_targets_min": 885 }, { "epoch": 2.5953259532595325, "grad_norm": 0.6795880232450013, "learning_rate": 3.1728888209290946e-05, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.10889527201652527, "step": 2110, "valid_targets_mean": 3480.6, "valid_targets_min": 742 }, { "epoch": 2.6014760147601477, "grad_norm": 0.528559679500913, "learning_rate": 3.167914248371997e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.09621582925319672, "step": 2115, "valid_targets_mean": 3210.9, "valid_targets_min": 790 }, { "epoch": 2.607626076260763, "grad_norm": 0.5383051724411886, "learning_rate": 3.1629286872540186e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.08600321412086487, "step": 2120, "valid_targets_mean": 2903.4, "valid_targets_min": 986 }, { "epoch": 2.6137761377613775, "grad_norm": 0.4919746943557101, "learning_rate": 3.1579321844828346e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.0712924599647522, "step": 2125, "valid_targets_mean": 3461.8, "valid_targets_min": 657 }, { "epoch": 2.6199261992619927, "grad_norm": 0.5673822138054107, "learning_rate": 3.1529247870690664e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.12092947959899902, "step": 2130, "valid_targets_mean": 3591.4, "valid_targets_min": 802 }, { "epoch": 2.6260762607626074, "grad_norm": 0.5497421190043564, "learning_rate": 3.1479065421258405e-05, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.10298366099596024, "step": 2135, "valid_targets_mean": 2774.2, "valid_targets_min": 1140 }, { "epoch": 2.6322263222632225, "grad_norm": 0.5132806776892035, "learning_rate": 3.1428774968683435e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.09595505893230438, "step": 2140, "valid_targets_mean": 3863.9, "valid_targets_min": 594 }, { "epoch": 2.6383763837638377, "grad_norm": 0.49790073483671826, "learning_rate": 3.137837698613381e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.08299355208873749, "step": 2145, "valid_targets_mean": 3946.6, "valid_targets_min": 722 }, { "epoch": 2.644526445264453, "grad_norm": 0.5813883421575223, "learning_rate": 3.132787194778928e-05, "loss": 0.1728, "loss_nan_ranks": 0, "loss_rank_avg": 0.07799771428108215, "step": 2150, "valid_targets_mean": 2537.5, "valid_targets_min": 613 }, { "epoch": 2.6506765067650675, "grad_norm": 0.620296547665903, "learning_rate": 3.127726032883687e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.09733926504850388, "step": 2155, "valid_targets_mean": 2988.4, "valid_targets_min": 821 }, { "epoch": 2.6568265682656826, "grad_norm": 0.6386470061418499, "learning_rate": 3.122654260546638e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.07757748663425446, "step": 2160, "valid_targets_mean": 2905.8, "valid_targets_min": 768 }, { "epoch": 2.662976629766298, "grad_norm": 0.5225347305491789, "learning_rate": 3.1175719254865904e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.07279728353023529, "step": 2165, "valid_targets_mean": 3298.6, "valid_targets_min": 1109 }, { "epoch": 2.6691266912669125, "grad_norm": 0.6166199534571374, "learning_rate": 3.11247907552174e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.10531272739171982, "step": 2170, "valid_targets_mean": 5083.0, "valid_targets_min": 1629 }, { "epoch": 2.6752767527675276, "grad_norm": 0.6632519276400445, "learning_rate": 3.107375758569208e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.08699870109558105, "step": 2175, "valid_targets_mean": 1740.8, "valid_targets_min": 449 }, { "epoch": 2.6814268142681428, "grad_norm": 0.47260053699780497, "learning_rate": 3.1022620226446e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.08576695621013641, "step": 2180, "valid_targets_mean": 4602.2, "valid_targets_min": 1101 }, { "epoch": 2.687576875768758, "grad_norm": 0.4891614796306115, "learning_rate": 3.097137915861551e-05, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.10201077908277512, "step": 2185, "valid_targets_mean": 5774.5, "valid_targets_min": 732 }, { "epoch": 2.6937269372693726, "grad_norm": 0.5113041851467374, "learning_rate": 3.092003486431269e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.11469049006700516, "step": 2190, "valid_targets_mean": 4127.1, "valid_targets_min": 1420 }, { "epoch": 2.6998769987699878, "grad_norm": 0.4477313358512578, "learning_rate": 3.0868587826620885e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.08219954371452332, "step": 2195, "valid_targets_mean": 4049.0, "valid_targets_min": 734 }, { "epoch": 2.7060270602706025, "grad_norm": 0.5785458631080089, "learning_rate": 3.08170385295901e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.08696188032627106, "step": 2200, "valid_targets_mean": 2943.6, "valid_targets_min": 741 }, { "epoch": 2.7121771217712176, "grad_norm": 0.5154059025784247, "learning_rate": 3.076538745823249e-05, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.11488153785467148, "step": 2205, "valid_targets_mean": 4743.4, "valid_targets_min": 1242 }, { "epoch": 2.7183271832718328, "grad_norm": 0.5241984479834872, "learning_rate": 3.071363509851773e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.084464892745018, "step": 2210, "valid_targets_mean": 3118.0, "valid_targets_min": 890 }, { "epoch": 2.724477244772448, "grad_norm": 0.5150107262604267, "learning_rate": 3.066178193736855e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.11683715879917145, "step": 2215, "valid_targets_mean": 4706.2, "valid_targets_min": 1122 }, { "epoch": 2.7306273062730626, "grad_norm": 0.6162304395052073, "learning_rate": 3.060982846265604e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.07482162117958069, "step": 2220, "valid_targets_mean": 2574.2, "valid_targets_min": 684 }, { "epoch": 2.7367773677736777, "grad_norm": 0.4631512614093479, "learning_rate": 3.0557775163195126e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.07485739886760712, "step": 2225, "valid_targets_mean": 3813.6, "valid_targets_min": 1663 }, { "epoch": 2.742927429274293, "grad_norm": 0.5143649735266802, "learning_rate": 3.050562252873997e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.0832708328962326, "step": 2230, "valid_targets_mean": 3539.0, "valid_targets_min": 1167 }, { "epoch": 2.7490774907749076, "grad_norm": 0.5227130034773454, "learning_rate": 3.0453371049979324e-05, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.08692235499620438, "step": 2235, "valid_targets_mean": 3754.2, "valid_targets_min": 927 }, { "epoch": 2.7552275522755227, "grad_norm": 0.4976728290338799, "learning_rate": 3.0401021218531956e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.0895761251449585, "step": 2240, "valid_targets_mean": 3627.8, "valid_targets_min": 1099 }, { "epoch": 2.761377613776138, "grad_norm": 0.46825941507801294, "learning_rate": 3.034857352694199e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.127121239900589, "step": 2245, "valid_targets_mean": 5966.4, "valid_targets_min": 1501 }, { "epoch": 2.767527675276753, "grad_norm": 0.48184006484753195, "learning_rate": 3.0296028468674313e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.10622835159301758, "step": 2250, "valid_targets_mean": 5889.8, "valid_targets_min": 1421 }, { "epoch": 2.7736777367773677, "grad_norm": 0.4508942702524368, "learning_rate": 3.024338653810986e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.07747922837734222, "step": 2255, "valid_targets_mean": 3874.0, "valid_targets_min": 570 }, { "epoch": 2.779827798277983, "grad_norm": 0.46724717938780136, "learning_rate": 3.0190648230541067e-05, "loss": 0.1821, "loss_nan_ranks": 0, "loss_rank_avg": 0.12043651193380356, "step": 2260, "valid_targets_mean": 5011.5, "valid_targets_min": 1270 }, { "epoch": 2.7859778597785976, "grad_norm": 0.4683727924314104, "learning_rate": 3.013781404216711e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.07968182116746902, "step": 2265, "valid_targets_mean": 3799.6, "valid_targets_min": 824 }, { "epoch": 2.7921279212792127, "grad_norm": 0.5385810219664474, "learning_rate": 3.0084884470089296e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.08386295288801193, "step": 2270, "valid_targets_mean": 3734.4, "valid_targets_min": 1102 }, { "epoch": 2.798277982779828, "grad_norm": 0.45245499219642243, "learning_rate": 3.003186001230636e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.09439323842525482, "step": 2275, "valid_targets_mean": 4903.8, "valid_targets_min": 1329 }, { "epoch": 2.804428044280443, "grad_norm": 0.4940315817910554, "learning_rate": 2.9978741167709796e-05, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.13937702775001526, "step": 2280, "valid_targets_mean": 3603.1, "valid_targets_min": 1262 }, { "epoch": 2.8105781057810577, "grad_norm": 0.49746805123115423, "learning_rate": 2.992552843607916e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.1218264102935791, "step": 2285, "valid_targets_mean": 4513.8, "valid_targets_min": 1255 }, { "epoch": 2.816728167281673, "grad_norm": 0.47658623286138785, "learning_rate": 2.9872222318077353e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.13050565123558044, "step": 2290, "valid_targets_mean": 5611.1, "valid_targets_min": 1497 }, { "epoch": 2.8228782287822876, "grad_norm": 0.522661090423526, "learning_rate": 2.9818823315245933e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.09891247004270554, "step": 2295, "valid_targets_mean": 4264.4, "valid_targets_min": 1380 }, { "epoch": 2.8290282902829027, "grad_norm": 0.6529422685543568, "learning_rate": 2.9765331930000366e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.11567439138889313, "step": 2300, "valid_targets_mean": 2530.1, "valid_targets_min": 979 }, { "epoch": 2.835178351783518, "grad_norm": 0.46323069930632194, "learning_rate": 2.971174866562533e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.09001781046390533, "step": 2305, "valid_targets_mean": 4287.8, "valid_targets_min": 1393 }, { "epoch": 2.841328413284133, "grad_norm": 0.5030409922489438, "learning_rate": 2.9658074026269967e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.10567715764045715, "step": 2310, "valid_targets_mean": 4341.6, "valid_targets_min": 961 }, { "epoch": 2.8474784747847477, "grad_norm": 0.47464153475552046, "learning_rate": 2.9604308516943133e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.08723067492246628, "step": 2315, "valid_targets_mean": 4334.2, "valid_targets_min": 1360 }, { "epoch": 2.853628536285363, "grad_norm": 0.6245015392109261, "learning_rate": 2.9550452643508663e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.10392093658447266, "step": 2320, "valid_targets_mean": 2707.8, "valid_targets_min": 695 }, { "epoch": 2.859778597785978, "grad_norm": 0.422634120991052, "learning_rate": 2.9496506912680587e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.1133454442024231, "step": 2325, "valid_targets_mean": 6812.8, "valid_targets_min": 1034 }, { "epoch": 2.8659286592865927, "grad_norm": 0.5634287962300095, "learning_rate": 2.9442471832018386e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.07557663321495056, "step": 2330, "valid_targets_mean": 3040.9, "valid_targets_min": 1315 }, { "epoch": 2.872078720787208, "grad_norm": 0.4623219805830947, "learning_rate": 2.938834790992221e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.06218584626913071, "step": 2335, "valid_targets_mean": 2710.9, "valid_targets_min": 1237 }, { "epoch": 2.878228782287823, "grad_norm": 0.4891533715959747, "learning_rate": 2.9334135655628072e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.0654270350933075, "step": 2340, "valid_targets_mean": 3311.1, "valid_targets_min": 1145 }, { "epoch": 2.884378843788438, "grad_norm": 0.4755509287295262, "learning_rate": 2.9279835579203114e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.10518981516361237, "step": 2345, "valid_targets_mean": 4752.6, "valid_targets_min": 1158 }, { "epoch": 2.890528905289053, "grad_norm": 0.5594039695166282, "learning_rate": 2.922544819154073e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.11531180888414383, "step": 2350, "valid_targets_mean": 3394.2, "valid_targets_min": 1118 }, { "epoch": 2.896678966789668, "grad_norm": 0.5880699435224075, "learning_rate": 2.917097400435583e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.0978911817073822, "step": 2355, "valid_targets_mean": 3524.2, "valid_targets_min": 881 }, { "epoch": 2.9028290282902827, "grad_norm": 0.6156548379697123, "learning_rate": 2.9116413530179975e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.10010180622339249, "step": 2360, "valid_targets_mean": 2336.5, "valid_targets_min": 1286 }, { "epoch": 2.908979089790898, "grad_norm": 0.506443402249804, "learning_rate": 2.906176728235658e-05, "loss": 0.1676, "loss_nan_ranks": 0, "loss_rank_avg": 0.08779266476631165, "step": 2365, "valid_targets_mean": 3942.4, "valid_targets_min": 832 }, { "epoch": 2.915129151291513, "grad_norm": 0.7387343642776686, "learning_rate": 2.90070357750361e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.10175585746765137, "step": 2370, "valid_targets_mean": 2909.9, "valid_targets_min": 1289 }, { "epoch": 2.921279212792128, "grad_norm": 0.48459055212808255, "learning_rate": 2.8952219523171136e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.08510647714138031, "step": 2375, "valid_targets_mean": 4494.2, "valid_targets_min": 1074 }, { "epoch": 2.927429274292743, "grad_norm": 0.5581455833589545, "learning_rate": 2.8897319042511646e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.11474175751209259, "step": 2380, "valid_targets_mean": 4132.6, "valid_targets_min": 1150 }, { "epoch": 2.933579335793358, "grad_norm": 0.4442973610756425, "learning_rate": 2.8842334849600077e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.0717523843050003, "step": 2385, "valid_targets_mean": 4071.4, "valid_targets_min": 1168 }, { "epoch": 2.939729397293973, "grad_norm": 0.5985437255621016, "learning_rate": 2.878726746176648e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.07459800690412521, "step": 2390, "valid_targets_mean": 3167.8, "valid_targets_min": 725 }, { "epoch": 2.945879458794588, "grad_norm": 0.4654162885420748, "learning_rate": 2.8732117397123685e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.10197076201438904, "step": 2395, "valid_targets_mean": 4816.4, "valid_targets_min": 1179 }, { "epoch": 2.952029520295203, "grad_norm": 0.5665428182847307, "learning_rate": 2.867688517456238e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.11168975383043289, "step": 2400, "valid_targets_mean": 3892.2, "valid_targets_min": 1214 }, { "epoch": 2.958179581795818, "grad_norm": 0.4898717590110592, "learning_rate": 2.8621571313746277e-05, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.07751792669296265, "step": 2405, "valid_targets_mean": 3511.6, "valid_targets_min": 1106 }, { "epoch": 2.9643296432964332, "grad_norm": 0.5914722730384244, "learning_rate": 2.856617633510718e-05, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.1021716296672821, "step": 2410, "valid_targets_mean": 3449.5, "valid_targets_min": 1393 }, { "epoch": 2.970479704797048, "grad_norm": 0.5194239098692871, "learning_rate": 2.8510700759840122e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.09077870845794678, "step": 2415, "valid_targets_mean": 6526.2, "valid_targets_min": 1437 }, { "epoch": 2.976629766297663, "grad_norm": 0.5334216154629376, "learning_rate": 2.8455145109898433e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.072516068816185, "step": 2420, "valid_targets_mean": 2606.6, "valid_targets_min": 659 }, { "epoch": 2.9827798277982778, "grad_norm": 0.6195282094770925, "learning_rate": 2.839950990798884e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.0613383986055851, "step": 2425, "valid_targets_mean": 2602.0, "valid_targets_min": 1043 }, { "epoch": 2.988929889298893, "grad_norm": 0.475861928950688, "learning_rate": 2.8343795677566565e-05, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.0737854614853859, "step": 2430, "valid_targets_mean": 4144.8, "valid_targets_min": 898 }, { "epoch": 2.995079950799508, "grad_norm": 0.4624433782217203, "learning_rate": 2.828800294283037e-05, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.0590396523475647, "step": 2435, "valid_targets_mean": 3481.4, "valid_targets_min": 1260 }, { "epoch": 3.001230012300123, "grad_norm": 0.5824147004658514, "learning_rate": 2.823213222871766e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.06392265856266022, "step": 2440, "valid_targets_mean": 2831.8, "valid_targets_min": 816 }, { "epoch": 3.007380073800738, "grad_norm": 0.4397252109941433, "learning_rate": 2.8176184060899517e-05, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.08135375380516052, "step": 2445, "valid_targets_mean": 5627.1, "valid_targets_min": 665 }, { "epoch": 3.013530135301353, "grad_norm": 0.499673640912437, "learning_rate": 2.812015896577574e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.07968012988567352, "step": 2450, "valid_targets_mean": 3778.1, "valid_targets_min": 1264 }, { "epoch": 3.019680196801968, "grad_norm": 0.47703649249758645, "learning_rate": 2.806405747046995e-05, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.08472508192062378, "step": 2455, "valid_targets_mean": 4961.8, "valid_targets_min": 1348 }, { "epoch": 3.025830258302583, "grad_norm": 0.47368816999564745, "learning_rate": 2.8007880102824577e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.07601846754550934, "step": 2460, "valid_targets_mean": 4021.6, "valid_targets_min": 856 }, { "epoch": 3.031980319803198, "grad_norm": 0.5381997443190752, "learning_rate": 2.795162739139591e-05, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.0939515084028244, "step": 2465, "valid_targets_mean": 3821.5, "valid_targets_min": 1200 }, { "epoch": 3.038130381303813, "grad_norm": 0.5175822157844081, "learning_rate": 2.7895299865449125e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.07786659896373749, "step": 2470, "valid_targets_mean": 4191.4, "valid_targets_min": 1191 }, { "epoch": 3.044280442804428, "grad_norm": 0.4645847409203417, "learning_rate": 2.7838898054953312e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.09309229254722595, "step": 2475, "valid_targets_mean": 4879.2, "valid_targets_min": 713 }, { "epoch": 3.050430504305043, "grad_norm": 0.4919289011436946, "learning_rate": 2.7782422490576486e-05, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.08897897601127625, "step": 2480, "valid_targets_mean": 4580.9, "valid_targets_min": 648 }, { "epoch": 3.056580565805658, "grad_norm": 0.5014002250670305, "learning_rate": 2.772587370368057e-05, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.0919342190027237, "step": 2485, "valid_targets_mean": 5648.8, "valid_targets_min": 1337 }, { "epoch": 3.062730627306273, "grad_norm": 0.4822755743705165, "learning_rate": 2.766925222631645e-05, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.06121302768588066, "step": 2490, "valid_targets_mean": 3656.1, "valid_targets_min": 1546 }, { "epoch": 3.068880688806888, "grad_norm": 0.48195767022573716, "learning_rate": 2.76125585912189e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.0824492871761322, "step": 2495, "valid_targets_mean": 5027.4, "valid_targets_min": 1023 }, { "epoch": 3.075030750307503, "grad_norm": 0.5559772633012304, "learning_rate": 2.7555793331801622e-05, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.0640774518251419, "step": 2500, "valid_targets_mean": 2843.8, "valid_targets_min": 750 }, { "epoch": 3.081180811808118, "grad_norm": 0.46434570755393245, "learning_rate": 2.749895698215221e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.0955158919095993, "step": 2505, "valid_targets_mean": 5511.4, "valid_targets_min": 1181 }, { "epoch": 3.087330873308733, "grad_norm": 0.5065383332022071, "learning_rate": 2.744205007702713e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.09405210614204407, "step": 2510, "valid_targets_mean": 3855.5, "valid_targets_min": 1114 }, { "epoch": 3.093480934809348, "grad_norm": 0.5095722080534543, "learning_rate": 2.7385073151846667e-05, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.07722511142492294, "step": 2515, "valid_targets_mean": 3710.2, "valid_targets_min": 1048 }, { "epoch": 3.0996309963099633, "grad_norm": 0.5138846812255643, "learning_rate": 2.732802674268992e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.08271900564432144, "step": 2520, "valid_targets_mean": 3739.8, "valid_targets_min": 1138 }, { "epoch": 3.105781057810578, "grad_norm": 0.5886188606523651, "learning_rate": 2.7270911386289735e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.07168637216091156, "step": 2525, "valid_targets_mean": 2690.8, "valid_targets_min": 1353 }, { "epoch": 3.111931119311193, "grad_norm": 0.46882295852560096, "learning_rate": 2.7213727620027667e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.08605489134788513, "step": 2530, "valid_targets_mean": 5042.1, "valid_targets_min": 1357 }, { "epoch": 3.1180811808118083, "grad_norm": 0.5848348439523262, "learning_rate": 2.7156475981928902e-05, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.10847694426774979, "step": 2535, "valid_targets_mean": 3534.2, "valid_targets_min": 650 }, { "epoch": 3.124231242312423, "grad_norm": 0.43241446081805607, "learning_rate": 2.7099157010657245e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.08864249289035797, "step": 2540, "valid_targets_mean": 6223.6, "valid_targets_min": 1532 }, { "epoch": 3.130381303813038, "grad_norm": 0.5133012492820908, "learning_rate": 2.7041771245509996e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.08195997774600983, "step": 2545, "valid_targets_mean": 4203.6, "valid_targets_min": 892 }, { "epoch": 3.1365313653136533, "grad_norm": 0.5718819367036605, "learning_rate": 2.6984319226412886e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.06313544511795044, "step": 2550, "valid_targets_mean": 2448.9, "valid_targets_min": 646 }, { "epoch": 3.142681426814268, "grad_norm": 0.6364683218344229, "learning_rate": 2.6926801493915046e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.08119294792413712, "step": 2555, "valid_targets_mean": 2953.6, "valid_targets_min": 790 }, { "epoch": 3.148831488314883, "grad_norm": 0.5459860640784475, "learning_rate": 2.686921858918386e-05, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.06781558692455292, "step": 2560, "valid_targets_mean": 2899.2, "valid_targets_min": 1195 }, { "epoch": 3.1549815498154983, "grad_norm": 0.5293486901428869, "learning_rate": 2.6811571053999902e-05, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.0706283450126648, "step": 2565, "valid_targets_mean": 3130.5, "valid_targets_min": 766 }, { "epoch": 3.161131611316113, "grad_norm": 0.5332831053952426, "learning_rate": 2.675385943075184e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.0654885470867157, "step": 2570, "valid_targets_mean": 2729.9, "valid_targets_min": 773 }, { "epoch": 3.167281672816728, "grad_norm": 0.5189347202516605, "learning_rate": 2.6696084262431315e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.08411689102649689, "step": 2575, "valid_targets_mean": 3577.9, "valid_targets_min": 244 }, { "epoch": 3.1734317343173433, "grad_norm": 0.48494501784084065, "learning_rate": 2.6638246092627872e-05, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.07317544519901276, "step": 2580, "valid_targets_mean": 4671.8, "valid_targets_min": 1234 }, { "epoch": 3.179581795817958, "grad_norm": 0.5456109495415848, "learning_rate": 2.6580345465523785e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.08382262289524078, "step": 2585, "valid_targets_mean": 3731.5, "valid_targets_min": 1217 }, { "epoch": 3.185731857318573, "grad_norm": 0.5908616856574463, "learning_rate": 2.6522382925888997e-05, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.07151857018470764, "step": 2590, "valid_targets_mean": 2263.6, "valid_targets_min": 886 }, { "epoch": 3.1918819188191883, "grad_norm": 0.5194482617774568, "learning_rate": 2.646435901907595e-05, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.08012768626213074, "step": 2595, "valid_targets_mean": 4004.4, "valid_targets_min": 640 }, { "epoch": 3.1980319803198034, "grad_norm": 0.48147337539747703, "learning_rate": 2.6406274291014477e-05, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.04858190566301346, "step": 2600, "valid_targets_mean": 2034.8, "valid_targets_min": 841 }, { "epoch": 3.204182041820418, "grad_norm": 0.5334810071357533, "learning_rate": 2.634812928820667e-05, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.08282295614480972, "step": 2605, "valid_targets_mean": 3136.9, "valid_targets_min": 731 }, { "epoch": 3.2103321033210332, "grad_norm": 0.49249300840244425, "learning_rate": 2.6289924557721715e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.09127512574195862, "step": 2610, "valid_targets_mean": 4883.0, "valid_targets_min": 636 }, { "epoch": 3.2164821648216484, "grad_norm": 0.4900333823683637, "learning_rate": 2.623166064719077e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.08774002641439438, "step": 2615, "valid_targets_mean": 4132.8, "valid_targets_min": 1572 }, { "epoch": 3.222632226322263, "grad_norm": 0.4825138851450061, "learning_rate": 2.6173338104801784e-05, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.06398773193359375, "step": 2620, "valid_targets_mean": 3631.1, "valid_targets_min": 933 }, { "epoch": 3.2287822878228782, "grad_norm": 0.6336346315985616, "learning_rate": 2.6114957479294365e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.06542333960533142, "step": 2625, "valid_targets_mean": 1869.8, "valid_targets_min": 976 }, { "epoch": 3.2349323493234934, "grad_norm": 0.5597472254460725, "learning_rate": 2.6056519319954623e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.09998220205307007, "step": 2630, "valid_targets_mean": 3676.1, "valid_targets_min": 820 }, { "epoch": 3.241082410824108, "grad_norm": 0.4562480392066877, "learning_rate": 2.599802417660996e-05, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.07622061669826508, "step": 2635, "valid_targets_mean": 4234.2, "valid_targets_min": 1055 }, { "epoch": 3.2472324723247232, "grad_norm": 0.6121978848476852, "learning_rate": 2.5939472599623942e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.05895080789923668, "step": 2640, "valid_targets_mean": 2002.8, "valid_targets_min": 618 }, { "epoch": 3.2533825338253384, "grad_norm": 0.5370262581759196, "learning_rate": 2.588086513989109e-05, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.09554477035999298, "step": 2645, "valid_targets_mean": 4236.2, "valid_targets_min": 760 }, { "epoch": 3.259532595325953, "grad_norm": 0.4479939560465353, "learning_rate": 2.5822202348831722e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.07247894257307053, "step": 2650, "valid_targets_mean": 4365.1, "valid_targets_min": 1098 }, { "epoch": 3.265682656826568, "grad_norm": 0.522793952873124, "learning_rate": 2.576348477838675e-05, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.06713450700044632, "step": 2655, "valid_targets_mean": 3066.9, "valid_targets_min": 958 }, { "epoch": 3.2718327183271834, "grad_norm": 0.48214958463559254, "learning_rate": 2.5704712981012473e-05, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.06675916165113449, "step": 2660, "valid_targets_mean": 3855.0, "valid_targets_min": 1421 }, { "epoch": 3.2779827798277985, "grad_norm": 0.5095903211526931, "learning_rate": 2.5645887509675424e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.0593230202794075, "step": 2665, "valid_targets_mean": 2953.1, "valid_targets_min": 1168 }, { "epoch": 3.284132841328413, "grad_norm": 0.5820951219397775, "learning_rate": 2.5587008917847107e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.09749455749988556, "step": 2670, "valid_targets_mean": 3805.8, "valid_targets_min": 923 }, { "epoch": 3.2902829028290284, "grad_norm": 0.5025757953361653, "learning_rate": 2.5528077759498842e-05, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.08753708004951477, "step": 2675, "valid_targets_mean": 4346.0, "valid_targets_min": 1279 }, { "epoch": 3.296432964329643, "grad_norm": 0.5282398650712525, "learning_rate": 2.5469094589096527e-05, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.09425686299800873, "step": 2680, "valid_targets_mean": 4216.2, "valid_targets_min": 1392 }, { "epoch": 3.302583025830258, "grad_norm": 0.49910627712015104, "learning_rate": 2.5410059961595428e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.06500237435102463, "step": 2685, "valid_targets_mean": 3755.8, "valid_targets_min": 1512 }, { "epoch": 3.3087330873308733, "grad_norm": 0.605379606343561, "learning_rate": 2.5350974432434942e-05, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.0832923948764801, "step": 2690, "valid_targets_mean": 2664.9, "valid_targets_min": 797 }, { "epoch": 3.3148831488314885, "grad_norm": 0.5013142884349607, "learning_rate": 2.52918385575334e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.08029305934906006, "step": 2695, "valid_targets_mean": 4261.5, "valid_targets_min": 1492 }, { "epoch": 3.321033210332103, "grad_norm": 0.5381840379133357, "learning_rate": 2.523265289328283e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.12291625142097473, "step": 2700, "valid_targets_mean": 4962.0, "valid_targets_min": 798 }, { "epoch": 3.3271832718327183, "grad_norm": 0.46781773567889223, "learning_rate": 2.5173417996543673e-05, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.06877776235342026, "step": 2705, "valid_targets_mean": 4169.6, "valid_targets_min": 700 }, { "epoch": 3.3333333333333335, "grad_norm": 0.5653286842605626, "learning_rate": 2.511413442463964e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.084671251475811, "step": 2710, "valid_targets_mean": 3526.8, "valid_targets_min": 825 }, { "epoch": 3.339483394833948, "grad_norm": 0.4985823875382402, "learning_rate": 2.5054802735352363e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.06729922443628311, "step": 2715, "valid_targets_mean": 3257.2, "valid_targets_min": 1325 }, { "epoch": 3.3456334563345633, "grad_norm": 0.5285798353799441, "learning_rate": 2.499542348691623e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.07990030944347382, "step": 2720, "valid_targets_mean": 3634.4, "valid_targets_min": 1275 }, { "epoch": 3.3517835178351785, "grad_norm": 0.6574408260852771, "learning_rate": 2.4935997238013068e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.07905502617359161, "step": 2725, "valid_targets_mean": 1994.1, "valid_targets_min": 505 }, { "epoch": 3.357933579335793, "grad_norm": 0.43995084249134475, "learning_rate": 2.4876524547766954e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.06483259797096252, "step": 2730, "valid_targets_mean": 3831.4, "valid_targets_min": 973 }, { "epoch": 3.3640836408364083, "grad_norm": 0.5301162387802413, "learning_rate": 2.4817005975738892e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.05946962907910347, "step": 2735, "valid_targets_mean": 2651.9, "valid_targets_min": 701 }, { "epoch": 3.3702337023370235, "grad_norm": 0.4610777012343169, "learning_rate": 2.4757442081921577e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.09016251564025879, "step": 2740, "valid_targets_mean": 5271.4, "valid_targets_min": 1537 }, { "epoch": 3.376383763837638, "grad_norm": 0.5291095045155567, "learning_rate": 2.4697833426734124e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.07902340590953827, "step": 2745, "valid_targets_mean": 3405.5, "valid_targets_min": 1263 }, { "epoch": 3.3825338253382533, "grad_norm": 0.4966024203150633, "learning_rate": 2.4638180571016815e-05, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.08345846831798553, "step": 2750, "valid_targets_mean": 4344.2, "valid_targets_min": 790 }, { "epoch": 3.3886838868388685, "grad_norm": 0.5128824279128211, "learning_rate": 2.457848407602577e-05, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.0801117941737175, "step": 2755, "valid_targets_mean": 4145.4, "valid_targets_min": 1271 }, { "epoch": 3.3948339483394836, "grad_norm": 0.5643768252894239, "learning_rate": 2.4518744503427713e-05, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.09472721815109253, "step": 2760, "valid_targets_mean": 3298.6, "valid_targets_min": 920 }, { "epoch": 3.4009840098400983, "grad_norm": 0.4755483158799478, "learning_rate": 2.445896241529468e-05, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.08024337142705917, "step": 2765, "valid_targets_mean": 4097.9, "valid_targets_min": 1124 }, { "epoch": 3.4071340713407134, "grad_norm": 0.4886847154447668, "learning_rate": 2.4399138374098714e-05, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.06162010505795479, "step": 2770, "valid_targets_mean": 3024.2, "valid_targets_min": 803 }, { "epoch": 3.4132841328413286, "grad_norm": 0.4529392180445224, "learning_rate": 2.433927294270657e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.08406539261341095, "step": 2775, "valid_targets_mean": 4056.8, "valid_targets_min": 1248 }, { "epoch": 3.4194341943419433, "grad_norm": 0.6635839686854069, "learning_rate": 2.4279366684374466e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.0659230500459671, "step": 2780, "valid_targets_mean": 2098.2, "valid_targets_min": 712 }, { "epoch": 3.4255842558425584, "grad_norm": 0.5007226873985919, "learning_rate": 2.421942016274272e-05, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.07925982773303986, "step": 2785, "valid_targets_mean": 3182.2, "valid_targets_min": 1159 }, { "epoch": 3.4317343173431736, "grad_norm": 0.44770103382805143, "learning_rate": 2.4159433941830474e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.08364881575107574, "step": 2790, "valid_targets_mean": 4964.5, "valid_targets_min": 1245 }, { "epoch": 3.4378843788437883, "grad_norm": 0.48861818886915764, "learning_rate": 2.4099408586030397e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.09565254300832748, "step": 2795, "valid_targets_mean": 4456.5, "valid_targets_min": 907 }, { "epoch": 3.4440344403444034, "grad_norm": 0.548570303204303, "learning_rate": 2.403934466010338e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.07968255877494812, "step": 2800, "valid_targets_mean": 3445.1, "valid_targets_min": 1251 }, { "epoch": 3.4501845018450186, "grad_norm": 0.48355228778349324, "learning_rate": 2.3979242729173192e-05, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.09059491008520126, "step": 2805, "valid_targets_mean": 4697.8, "valid_targets_min": 827 }, { "epoch": 3.4563345633456333, "grad_norm": 0.5611975357331571, "learning_rate": 2.391910335872118e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.08527141809463501, "step": 2810, "valid_targets_mean": 3290.6, "valid_targets_min": 1214 }, { "epoch": 3.4624846248462484, "grad_norm": 0.6078436180033226, "learning_rate": 2.385892711458095e-05, "loss": 0.1691, "loss_nan_ranks": 0, "loss_rank_avg": 0.08710209280252457, "step": 2815, "valid_targets_mean": 3033.8, "valid_targets_min": 914 }, { "epoch": 3.4686346863468636, "grad_norm": 0.4853947578797779, "learning_rate": 2.3798714562933053e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.05702066794037819, "step": 2820, "valid_targets_mean": 3216.1, "valid_targets_min": 753 }, { "epoch": 3.4747847478474787, "grad_norm": 0.46984196132141787, "learning_rate": 2.373846627029963e-05, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.09708918631076813, "step": 2825, "valid_targets_mean": 5562.1, "valid_targets_min": 1456 }, { "epoch": 3.4809348093480934, "grad_norm": 0.5095130196068846, "learning_rate": 2.3678182803539117e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.038323938846588135, "step": 2830, "valid_targets_mean": 2221.0, "valid_targets_min": 797 }, { "epoch": 3.4870848708487086, "grad_norm": 0.5045561485669289, "learning_rate": 2.361786472984086e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.07799921184778214, "step": 2835, "valid_targets_mean": 3694.1, "valid_targets_min": 859 }, { "epoch": 3.4932349323493233, "grad_norm": 0.47253875127606976, "learning_rate": 2.3557512616719863e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.07349460572004318, "step": 2840, "valid_targets_mean": 3396.1, "valid_targets_min": 798 }, { "epoch": 3.4993849938499384, "grad_norm": 0.5033151212492368, "learning_rate": 2.3497127032011343e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.07581774890422821, "step": 2845, "valid_targets_mean": 3116.0, "valid_targets_min": 776 }, { "epoch": 3.5055350553505535, "grad_norm": 0.5159059389745787, "learning_rate": 2.3436708543865473e-05, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.08507826924324036, "step": 2850, "valid_targets_mean": 3664.0, "valid_targets_min": 874 }, { "epoch": 3.5116851168511687, "grad_norm": 0.5482546283483722, "learning_rate": 2.3376257720742013e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.0819462239742279, "step": 2855, "valid_targets_mean": 3106.1, "valid_targets_min": 620 }, { "epoch": 3.5178351783517834, "grad_norm": 0.4974541684782698, "learning_rate": 2.3315775131404913e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.07123839855194092, "step": 2860, "valid_targets_mean": 4601.2, "valid_targets_min": 1119 }, { "epoch": 3.5239852398523985, "grad_norm": 1.3047781429682845, "learning_rate": 2.325526134491704e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.054736874997615814, "step": 2865, "valid_targets_mean": 1818.4, "valid_targets_min": 865 }, { "epoch": 3.5301353013530137, "grad_norm": 0.6134499208603761, "learning_rate": 2.319471693063478e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.0885232463479042, "step": 2870, "valid_targets_mean": 3049.0, "valid_targets_min": 906 }, { "epoch": 3.5362853628536284, "grad_norm": 0.6759150233763972, "learning_rate": 2.3134142458202663e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.09225553274154663, "step": 2875, "valid_targets_mean": 2895.2, "valid_targets_min": 1339 }, { "epoch": 3.5424354243542435, "grad_norm": 0.4878657350173033, "learning_rate": 2.3073538497548054e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.06459975242614746, "step": 2880, "valid_targets_mean": 3118.1, "valid_targets_min": 1038 }, { "epoch": 3.5485854858548587, "grad_norm": 0.5285554655544287, "learning_rate": 2.3012905618875748e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.07657990604639053, "step": 2885, "valid_targets_mean": 3509.8, "valid_targets_min": 772 }, { "epoch": 3.554735547355474, "grad_norm": 0.5118921758886427, "learning_rate": 2.295224439266263e-05, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.07552247494459152, "step": 2890, "valid_targets_mean": 3729.6, "valid_targets_min": 1093 }, { "epoch": 3.5608856088560885, "grad_norm": 0.437246955238151, "learning_rate": 2.2891555389652296e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.06995870918035507, "step": 2895, "valid_targets_mean": 4703.5, "valid_targets_min": 725 }, { "epoch": 3.5670356703567037, "grad_norm": 0.5322019397423305, "learning_rate": 2.2830839180849688e-05, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.09949615597724915, "step": 2900, "valid_targets_mean": 4569.4, "valid_targets_min": 1512 }, { "epoch": 3.5731857318573184, "grad_norm": 0.5826176798062128, "learning_rate": 2.2770096337515707e-05, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.08007039874792099, "step": 2905, "valid_targets_mean": 3058.8, "valid_targets_min": 806 }, { "epoch": 3.5793357933579335, "grad_norm": 0.5851533034233356, "learning_rate": 2.270932743116187e-05, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.07829935848712921, "step": 2910, "valid_targets_mean": 2861.5, "valid_targets_min": 615 }, { "epoch": 3.5854858548585486, "grad_norm": 0.5514295047188729, "learning_rate": 2.26485330335449e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.08024849742650986, "step": 2915, "valid_targets_mean": 3024.2, "valid_targets_min": 730 }, { "epoch": 3.591635916359164, "grad_norm": 0.5680683619824699, "learning_rate": 2.2587713716661356e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.08459212630987167, "step": 2920, "valid_targets_mean": 4944.9, "valid_targets_min": 1697 }, { "epoch": 3.5977859778597785, "grad_norm": 0.414136055154694, "learning_rate": 2.2526870052742283e-05, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.10233662277460098, "step": 2925, "valid_targets_mean": 6669.5, "valid_targets_min": 2178 }, { "epoch": 3.6039360393603936, "grad_norm": 0.4814917168206153, "learning_rate": 2.2466002614247748e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.09646624326705933, "step": 2930, "valid_targets_mean": 4670.4, "valid_targets_min": 1535 }, { "epoch": 3.6100861008610083, "grad_norm": 0.5328321932070169, "learning_rate": 2.2405111973861562e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.09511435776948929, "step": 2935, "valid_targets_mean": 3880.5, "valid_targets_min": 1329 }, { "epoch": 3.6162361623616235, "grad_norm": 0.5082863860510842, "learning_rate": 2.23441987044858e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.03942929953336716, "step": 2940, "valid_targets_mean": 2156.8, "valid_targets_min": 670 }, { "epoch": 3.6223862238622386, "grad_norm": 0.45988004581722247, "learning_rate": 2.2283263379235457e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.09746742248535156, "step": 2945, "valid_targets_mean": 5174.5, "valid_targets_min": 1502 }, { "epoch": 3.6285362853628538, "grad_norm": 0.5036731253575619, "learning_rate": 2.222230657143305e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.08364607393741608, "step": 2950, "valid_targets_mean": 3381.1, "valid_targets_min": 812 }, { "epoch": 3.6346863468634685, "grad_norm": 0.551314316649068, "learning_rate": 2.2161328854603213e-05, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.07728952169418335, "step": 2955, "valid_targets_mean": 3063.1, "valid_targets_min": 723 }, { "epoch": 3.6408364083640836, "grad_norm": 0.51479507876296, "learning_rate": 2.210033080246731e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.08519040793180466, "step": 2960, "valid_targets_mean": 4596.8, "valid_targets_min": 748 }, { "epoch": 3.6469864698646988, "grad_norm": 0.5173643741994616, "learning_rate": 2.203931298893802e-05, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.10068618506193161, "step": 2965, "valid_targets_mean": 4853.0, "valid_targets_min": 675 }, { "epoch": 3.6531365313653135, "grad_norm": 0.5152255866096087, "learning_rate": 2.1978275988113983e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.0770726352930069, "step": 2970, "valid_targets_mean": 3557.2, "valid_targets_min": 882 }, { "epoch": 3.6592865928659286, "grad_norm": 0.46558824951501704, "learning_rate": 2.1917220374274337e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.07974518090486526, "step": 2975, "valid_targets_mean": 4598.5, "valid_targets_min": 962 }, { "epoch": 3.6654366543665438, "grad_norm": 0.5267988064286256, "learning_rate": 2.1856146721873355e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.0800408348441124, "step": 2980, "valid_targets_mean": 3688.0, "valid_targets_min": 702 }, { "epoch": 3.671586715867159, "grad_norm": 0.500833065686856, "learning_rate": 2.1795055605535026e-05, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.09218673408031464, "step": 2985, "valid_targets_mean": 3804.9, "valid_targets_min": 1076 }, { "epoch": 3.6777367773677736, "grad_norm": 0.5188781600437642, "learning_rate": 2.173394760004766e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.07670671492815018, "step": 2990, "valid_targets_mean": 3710.1, "valid_targets_min": 961 }, { "epoch": 3.6838868388683887, "grad_norm": 0.526202909842195, "learning_rate": 2.1672823280358463e-05, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.06018427014350891, "step": 2995, "valid_targets_mean": 2723.0, "valid_targets_min": 821 }, { "epoch": 3.6900369003690034, "grad_norm": 0.5583942214599857, "learning_rate": 2.1611683221568147e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.07016149908304214, "step": 3000, "valid_targets_mean": 2577.1, "valid_targets_min": 584 }, { "epoch": 3.6961869618696186, "grad_norm": 0.503187802018394, "learning_rate": 2.155052799892549e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.07081443071365356, "step": 3005, "valid_targets_mean": 2839.6, "valid_targets_min": 593 }, { "epoch": 3.7023370233702337, "grad_norm": 0.4423879077987992, "learning_rate": 2.1489358187821973e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.058198701590299606, "step": 3010, "valid_targets_mean": 4288.9, "valid_targets_min": 759 }, { "epoch": 3.708487084870849, "grad_norm": 0.523500597415475, "learning_rate": 2.1428174363786293e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.06767795234918594, "step": 3015, "valid_targets_mean": 3071.5, "valid_targets_min": 697 }, { "epoch": 3.7146371463714636, "grad_norm": 0.6630227292179588, "learning_rate": 2.136697710247903e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.06141120195388794, "step": 3020, "valid_targets_mean": 2274.9, "valid_targets_min": 749 }, { "epoch": 3.7207872078720787, "grad_norm": 0.4774911599271858, "learning_rate": 2.1305766979687183e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.08603742718696594, "step": 3025, "valid_targets_mean": 4596.4, "valid_targets_min": 1511 }, { "epoch": 3.726937269372694, "grad_norm": 0.4873655994209514, "learning_rate": 2.1244544571318736e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.09643786400556564, "step": 3030, "valid_targets_mean": 4984.9, "valid_targets_min": 725 }, { "epoch": 3.7330873308733086, "grad_norm": 0.5861604893643256, "learning_rate": 2.1183310453397287e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.06834369897842407, "step": 3035, "valid_targets_mean": 2566.1, "valid_targets_min": 817 }, { "epoch": 3.7392373923739237, "grad_norm": 0.5798281756405008, "learning_rate": 2.1122065202056602e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.06632263958454132, "step": 3040, "valid_targets_mean": 2215.2, "valid_targets_min": 1006 }, { "epoch": 3.745387453874539, "grad_norm": 0.5051835355023278, "learning_rate": 2.1060809393535198e-05, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.07687811553478241, "step": 3045, "valid_targets_mean": 3804.5, "valid_targets_min": 1147 }, { "epoch": 3.751537515375154, "grad_norm": 0.49107466628574503, "learning_rate": 2.0999543604170927e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.06628717482089996, "step": 3050, "valid_targets_mean": 3294.6, "valid_targets_min": 734 }, { "epoch": 3.7576875768757687, "grad_norm": 0.5492487915345526, "learning_rate": 2.0938268410395525e-05, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.09565361589193344, "step": 3055, "valid_targets_mean": 3335.4, "valid_targets_min": 954 }, { "epoch": 3.763837638376384, "grad_norm": 0.49989315860754857, "learning_rate": 2.0876984388729237e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.08043211698532104, "step": 3060, "valid_targets_mean": 3451.5, "valid_targets_min": 869 }, { "epoch": 3.7699876998769986, "grad_norm": 0.48854904308329133, "learning_rate": 2.081569211577536e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.10336951911449432, "step": 3065, "valid_targets_mean": 4580.4, "valid_targets_min": 1182 }, { "epoch": 3.7761377613776137, "grad_norm": 0.544658316205967, "learning_rate": 2.0754392168214818e-05, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.09734412282705307, "step": 3070, "valid_targets_mean": 4099.6, "valid_targets_min": 1163 }, { "epoch": 3.782287822878229, "grad_norm": 0.5191321368231835, "learning_rate": 2.0693085122800745e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.05870068818330765, "step": 3075, "valid_targets_mean": 2718.2, "valid_targets_min": 892 }, { "epoch": 3.788437884378844, "grad_norm": 0.47151240316870807, "learning_rate": 2.0631771556353065e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.08743983507156372, "step": 3080, "valid_targets_mean": 4449.8, "valid_targets_min": 949 }, { "epoch": 3.7945879458794587, "grad_norm": 0.46875132694942334, "learning_rate": 2.0570452045753045e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.09555913507938385, "step": 3085, "valid_targets_mean": 4944.2, "valid_targets_min": 1836 }, { "epoch": 3.800738007380074, "grad_norm": 0.4750348212888331, "learning_rate": 2.0509127167937882e-05, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.07685679942369461, "step": 3090, "valid_targets_mean": 3616.9, "valid_targets_min": 1120 }, { "epoch": 3.8068880688806885, "grad_norm": 0.46920532486186584, "learning_rate": 2.044779749989529e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.06964731961488724, "step": 3095, "valid_targets_mean": 3640.8, "valid_targets_min": 1359 }, { "epoch": 3.8130381303813037, "grad_norm": 0.46599609562129785, "learning_rate": 2.038646361865802e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.08804105967283249, "step": 3100, "valid_targets_mean": 4394.6, "valid_targets_min": 1698 }, { "epoch": 3.819188191881919, "grad_norm": 0.6250381818122364, "learning_rate": 2.0325126101298484e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.10825387388467789, "step": 3105, "valid_targets_mean": 3503.9, "valid_targets_min": 720 }, { "epoch": 3.825338253382534, "grad_norm": 0.4767332833536551, "learning_rate": 2.0263785524923295e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.07753412425518036, "step": 3110, "valid_targets_mean": 3931.4, "valid_targets_min": 1513 }, { "epoch": 3.8314883148831487, "grad_norm": 0.5695196818279987, "learning_rate": 2.0202442466667876e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.07002855837345123, "step": 3115, "valid_targets_mean": 2558.4, "valid_targets_min": 726 }, { "epoch": 3.837638376383764, "grad_norm": 0.41393160736795137, "learning_rate": 2.014109750369096e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.07424236834049225, "step": 3120, "valid_targets_mean": 5951.4, "valid_targets_min": 1569 }, { "epoch": 3.843788437884379, "grad_norm": 0.4684034499426382, "learning_rate": 2.007975121316922e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.07539427280426025, "step": 3125, "valid_targets_mean": 4030.0, "valid_targets_min": 1276 }, { "epoch": 3.8499384993849937, "grad_norm": 0.6164204572353755, "learning_rate": 2.001840417229183e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.10436895489692688, "step": 3130, "valid_targets_mean": 3733.4, "valid_targets_min": 1172 }, { "epoch": 3.856088560885609, "grad_norm": 0.5447316028660181, "learning_rate": 1.9957056958255006e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.07176276296377182, "step": 3135, "valid_targets_mean": 2725.9, "valid_targets_min": 633 }, { "epoch": 3.862238622386224, "grad_norm": 0.6220840240687876, "learning_rate": 1.9895710148256604e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.07579903304576874, "step": 3140, "valid_targets_mean": 3683.9, "valid_targets_min": 780 }, { "epoch": 3.868388683886839, "grad_norm": 0.4723313772442079, "learning_rate": 1.983436431949067e-05, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.08690563589334488, "step": 3145, "valid_targets_mean": 4245.1, "valid_targets_min": 1241 }, { "epoch": 3.874538745387454, "grad_norm": 0.44998138559908374, "learning_rate": 1.9773020049142033e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.09968946874141693, "step": 3150, "valid_targets_mean": 5583.9, "valid_targets_min": 797 }, { "epoch": 3.880688806888069, "grad_norm": 0.5270122631047541, "learning_rate": 1.9711677914380845e-05, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.05509759113192558, "step": 3155, "valid_targets_mean": 2708.1, "valid_targets_min": 711 }, { "epoch": 3.8868388683886836, "grad_norm": 0.6017459760924264, "learning_rate": 1.9650338492357157e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.07726362347602844, "step": 3160, "valid_targets_mean": 3143.1, "valid_targets_min": 901 }, { "epoch": 3.892988929889299, "grad_norm": 0.4913540549541257, "learning_rate": 1.9589002360195527e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.10274532437324524, "step": 3165, "valid_targets_mean": 4914.6, "valid_targets_min": 1125 }, { "epoch": 3.899138991389914, "grad_norm": 0.5000331800334817, "learning_rate": 1.952767009498953e-05, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.08059678971767426, "step": 3170, "valid_targets_mean": 3745.5, "valid_targets_min": 672 }, { "epoch": 3.905289052890529, "grad_norm": 0.5358154194004562, "learning_rate": 1.9466342273796385e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.07104428112506866, "step": 3175, "valid_targets_mean": 2510.0, "valid_targets_min": 876 }, { "epoch": 3.911439114391144, "grad_norm": 0.47974465495498386, "learning_rate": 1.9405019473631466e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.05414709821343422, "step": 3180, "valid_targets_mean": 3689.9, "valid_targets_min": 798 }, { "epoch": 3.917589175891759, "grad_norm": 0.49317410562980474, "learning_rate": 1.9343702271462927e-05, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.08570997416973114, "step": 3185, "valid_targets_mean": 3915.9, "valid_targets_min": 1071 }, { "epoch": 3.923739237392374, "grad_norm": 0.4983831118883738, "learning_rate": 1.9282391244206252e-05, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.06947653740644455, "step": 3190, "valid_targets_mean": 3173.9, "valid_targets_min": 1035 }, { "epoch": 3.9298892988929888, "grad_norm": 0.42952770240863514, "learning_rate": 1.9221086968718815e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.08404210209846497, "step": 3195, "valid_targets_mean": 4930.2, "valid_targets_min": 1347 }, { "epoch": 3.936039360393604, "grad_norm": 0.5037826105508637, "learning_rate": 1.9159790021794488e-05, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.10758716613054276, "step": 3200, "valid_targets_mean": 4524.2, "valid_targets_min": 1207 }, { "epoch": 3.942189421894219, "grad_norm": 0.5039306598479385, "learning_rate": 1.9098500980158165e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.10665933787822723, "step": 3205, "valid_targets_mean": 5237.8, "valid_targets_min": 1391 }, { "epoch": 3.948339483394834, "grad_norm": 0.5782200309582292, "learning_rate": 1.903722042046036e-05, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.04807044193148613, "step": 3210, "valid_targets_mean": 1499.4, "valid_targets_min": 816 }, { "epoch": 3.954489544895449, "grad_norm": 0.5505302590778401, "learning_rate": 1.8975948919271817e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.06564323604106903, "step": 3215, "valid_targets_mean": 2359.0, "valid_targets_min": 918 }, { "epoch": 3.960639606396064, "grad_norm": 0.5823874931921458, "learning_rate": 1.8914687053078017e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.09324459731578827, "step": 3220, "valid_targets_mean": 2751.1, "valid_targets_min": 678 }, { "epoch": 3.9667896678966788, "grad_norm": 0.5394851856779528, "learning_rate": 1.8853435398273805e-05, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.09117894619703293, "step": 3225, "valid_targets_mean": 3691.9, "valid_targets_min": 1051 }, { "epoch": 3.972939729397294, "grad_norm": 0.5944595285182408, "learning_rate": 1.879219453115794e-05, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.07047883421182632, "step": 3230, "valid_targets_mean": 1868.2, "valid_targets_min": 656 }, { "epoch": 3.979089790897909, "grad_norm": 0.5173724487631877, "learning_rate": 1.8730965027927688e-05, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.040990497916936874, "step": 3235, "valid_targets_mean": 2296.6, "valid_targets_min": 623 }, { "epoch": 3.985239852398524, "grad_norm": 0.5605418502623941, "learning_rate": 1.86697474646734e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.13732434809207916, "step": 3240, "valid_targets_mean": 5050.0, "valid_targets_min": 1148 }, { "epoch": 3.991389913899139, "grad_norm": 0.44586039014335926, "learning_rate": 1.860854241737307e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.07586301863193512, "step": 3245, "valid_targets_mean": 4287.8, "valid_targets_min": 1059 }, { "epoch": 3.997539975399754, "grad_norm": 0.542761234042047, "learning_rate": 1.8547350461886966e-05, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.07270455360412598, "step": 3250, "valid_targets_mean": 2833.1, "valid_targets_min": 1292 }, { "epoch": 4.003690036900369, "grad_norm": 0.4847126362528262, "learning_rate": 1.8486172173952154e-05, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.05783306062221527, "step": 3255, "valid_targets_mean": 3117.8, "valid_targets_min": 771 }, { "epoch": 4.009840098400984, "grad_norm": 0.4659779631141483, "learning_rate": 1.8425008129177087e-05, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.06389324367046356, "step": 3260, "valid_targets_mean": 4502.9, "valid_targets_min": 1231 }, { "epoch": 4.015990159901599, "grad_norm": 0.5220612005602768, "learning_rate": 1.8363858903036266e-05, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.06980709731578827, "step": 3265, "valid_targets_mean": 4072.8, "valid_targets_min": 1473 }, { "epoch": 4.022140221402214, "grad_norm": 0.5686219625154181, "learning_rate": 1.830272507086471e-05, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.057837411761283875, "step": 3270, "valid_targets_mean": 2812.2, "valid_targets_min": 700 }, { "epoch": 4.028290282902829, "grad_norm": 0.5946771596994455, "learning_rate": 1.824160720785264e-05, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.07070808112621307, "step": 3275, "valid_targets_mean": 3078.5, "valid_targets_min": 1386 }, { "epoch": 4.0344403444034445, "grad_norm": 0.5318470710013258, "learning_rate": 1.8180505889040005e-05, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.08657799661159515, "step": 3280, "valid_targets_mean": 6241.5, "valid_targets_min": 3439 }, { "epoch": 4.040590405904059, "grad_norm": 0.4914685824750089, "learning_rate": 1.8119421689311095e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.06925514340400696, "step": 3285, "valid_targets_mean": 3738.2, "valid_targets_min": 534 }, { "epoch": 4.046740467404674, "grad_norm": 0.4782442048405698, "learning_rate": 1.8058355183389152e-05, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.0859822928905487, "step": 3290, "valid_targets_mean": 5769.8, "valid_targets_min": 1397 }, { "epoch": 4.052890528905289, "grad_norm": 0.515649616238079, "learning_rate": 1.7997306945830915e-05, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.05107033625245094, "step": 3295, "valid_targets_mean": 3106.2, "valid_targets_min": 788 }, { "epoch": 4.059040590405904, "grad_norm": 0.5148130506672726, "learning_rate": 1.793627755102127e-05, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.06403973698616028, "step": 3300, "valid_targets_mean": 3715.0, "valid_targets_min": 968 }, { "epoch": 4.065190651906519, "grad_norm": 0.4606342811052093, "learning_rate": 1.78752675731678e-05, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.04643998295068741, "step": 3305, "valid_targets_mean": 3245.9, "valid_targets_min": 1078 }, { "epoch": 4.071340713407134, "grad_norm": 0.5665502646313025, "learning_rate": 1.7814277586295386e-05, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.061585765331983566, "step": 3310, "valid_targets_mean": 3092.4, "valid_targets_min": 742 }, { "epoch": 4.077490774907749, "grad_norm": 0.529629767598369, "learning_rate": 1.7753308164240858e-05, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.08363986015319824, "step": 3315, "valid_targets_mean": 4668.4, "valid_targets_min": 1552 }, { "epoch": 4.083640836408364, "grad_norm": 0.5076912030173814, "learning_rate": 1.7692359880647516e-05, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.08388642966747284, "step": 3320, "valid_targets_mean": 4158.8, "valid_targets_min": 718 }, { "epoch": 4.089790897908979, "grad_norm": 0.4605966844549127, "learning_rate": 1.7631433308959806e-05, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.07828954607248306, "step": 3325, "valid_targets_mean": 5035.4, "valid_targets_min": 746 }, { "epoch": 4.095940959409594, "grad_norm": 0.4461312138135786, "learning_rate": 1.757052902241788e-05, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.08744291216135025, "step": 3330, "valid_targets_mean": 6007.2, "valid_targets_min": 1020 }, { "epoch": 4.102091020910209, "grad_norm": 0.5598340140998831, "learning_rate": 1.7509647594052203e-05, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.07428855448961258, "step": 3335, "valid_targets_mean": 3529.4, "valid_targets_min": 765 }, { "epoch": 4.108241082410824, "grad_norm": 0.5154871811648977, "learning_rate": 1.7448789596678212e-05, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.06815948337316513, "step": 3340, "valid_targets_mean": 3972.1, "valid_targets_min": 652 }, { "epoch": 4.114391143911439, "grad_norm": 0.5583949032793244, "learning_rate": 1.7387955602890832e-05, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.07821419835090637, "step": 3345, "valid_targets_mean": 3239.0, "valid_targets_min": 820 }, { "epoch": 4.120541205412054, "grad_norm": 0.5447759861816874, "learning_rate": 1.732714618505921e-05, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.056116413325071335, "step": 3350, "valid_targets_mean": 2703.5, "valid_targets_min": 745 }, { "epoch": 4.126691266912669, "grad_norm": 0.48743453205826837, "learning_rate": 1.7266361915321216e-05, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.06582196056842804, "step": 3355, "valid_targets_mean": 4326.4, "valid_targets_min": 868 }, { "epoch": 4.132841328413284, "grad_norm": 0.6293436003161086, "learning_rate": 1.7205603365578127e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.09089374542236328, "step": 3360, "valid_targets_mean": 5472.0, "valid_targets_min": 1015 }, { "epoch": 4.138991389913899, "grad_norm": 0.5382810078608156, "learning_rate": 1.714487110748923e-05, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.07424285262823105, "step": 3365, "valid_targets_mean": 3461.8, "valid_targets_min": 892 }, { "epoch": 4.145141451414514, "grad_norm": 0.5767847704595052, "learning_rate": 1.708416571246643e-05, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.1102609783411026, "step": 3370, "valid_targets_mean": 4746.8, "valid_targets_min": 1181 }, { "epoch": 4.1512915129151295, "grad_norm": 0.46094385862132126, "learning_rate": 1.702348775166891e-05, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.07355746626853943, "step": 3375, "valid_targets_mean": 4858.4, "valid_targets_min": 1289 }, { "epoch": 4.157441574415744, "grad_norm": 0.5273851457039939, "learning_rate": 1.6962837795997705e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.09516991674900055, "step": 3380, "valid_targets_mean": 4578.5, "valid_targets_min": 868 }, { "epoch": 4.163591635916359, "grad_norm": 0.5286780077419035, "learning_rate": 1.6902216416090362e-05, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.0736001580953598, "step": 3385, "valid_targets_mean": 3672.8, "valid_targets_min": 711 }, { "epoch": 4.169741697416974, "grad_norm": 0.5467773637077603, "learning_rate": 1.6841624182315596e-05, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.08320039510726929, "step": 3390, "valid_targets_mean": 3863.8, "valid_targets_min": 820 }, { "epoch": 4.175891758917589, "grad_norm": 0.6869246997323394, "learning_rate": 1.678106166476785e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.07946888357400894, "step": 3395, "valid_targets_mean": 4235.1, "valid_targets_min": 1112 }, { "epoch": 4.182041820418204, "grad_norm": 0.5351371705595994, "learning_rate": 1.6720529433262018e-05, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.06436219811439514, "step": 3400, "valid_targets_mean": 3413.6, "valid_targets_min": 748 }, { "epoch": 4.1881918819188195, "grad_norm": 0.6706465654635336, "learning_rate": 1.666002805732801e-05, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.1119987964630127, "step": 3405, "valid_targets_mean": 3152.4, "valid_targets_min": 548 }, { "epoch": 4.194341943419434, "grad_norm": 0.5760810844110383, "learning_rate": 1.6599558106205437e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.09893061220645905, "step": 3410, "valid_targets_mean": 4299.2, "valid_targets_min": 790 }, { "epoch": 4.200492004920049, "grad_norm": 0.585926878387223, "learning_rate": 1.653912014883825e-05, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.07614987343549728, "step": 3415, "valid_targets_mean": 3813.8, "valid_targets_min": 1001 }, { "epoch": 4.206642066420664, "grad_norm": 0.49494454301990404, "learning_rate": 1.6478714753869376e-05, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.05910831317305565, "step": 3420, "valid_targets_mean": 3775.0, "valid_targets_min": 868 }, { "epoch": 4.212792127921279, "grad_norm": 0.5288842145540353, "learning_rate": 1.641834248963536e-05, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.08476749807596207, "step": 3425, "valid_targets_mean": 4581.8, "valid_targets_min": 1024 }, { "epoch": 4.218942189421894, "grad_norm": 0.5350594055627105, "learning_rate": 1.6358003924161047e-05, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.060208383947610855, "step": 3430, "valid_targets_mean": 3581.1, "valid_targets_min": 1411 }, { "epoch": 4.2250922509225095, "grad_norm": 0.6304659363350698, "learning_rate": 1.62976996251542e-05, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.04790829122066498, "step": 3435, "valid_targets_mean": 2364.8, "valid_targets_min": 1056 }, { "epoch": 4.231242312423125, "grad_norm": 0.5985644536258957, "learning_rate": 1.623743016000021e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.07500965893268585, "step": 3440, "valid_targets_mean": 3000.0, "valid_targets_min": 567 }, { "epoch": 4.237392373923739, "grad_norm": 0.43664098310110033, "learning_rate": 1.6177196095756706e-05, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.034630633890628815, "step": 3445, "valid_targets_mean": 3722.4, "valid_targets_min": 714 }, { "epoch": 4.243542435424354, "grad_norm": 0.47513847632255607, "learning_rate": 1.6116997999148223e-05, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.05792335420846939, "step": 3450, "valid_targets_mean": 3704.1, "valid_targets_min": 744 }, { "epoch": 4.249692496924969, "grad_norm": 0.5558353421338394, "learning_rate": 1.6056836436560927e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.11340054124593735, "step": 3455, "valid_targets_mean": 4209.2, "valid_targets_min": 1221 }, { "epoch": 4.255842558425584, "grad_norm": 0.5852000452078986, "learning_rate": 1.5996711974037212e-05, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.05671136826276779, "step": 3460, "valid_targets_mean": 2514.8, "valid_targets_min": 765 }, { "epoch": 4.2619926199261995, "grad_norm": 0.4988603396819256, "learning_rate": 1.593662517727044e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.08585044741630554, "step": 3465, "valid_targets_mean": 4800.9, "valid_targets_min": 1273 }, { "epoch": 4.268142681426815, "grad_norm": 0.5201371521678605, "learning_rate": 1.587657661159955e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.05396566540002823, "step": 3470, "valid_targets_mean": 3181.5, "valid_targets_min": 950 }, { "epoch": 4.274292742927429, "grad_norm": 0.49471240095979996, "learning_rate": 1.5816566842003805e-05, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.049535416066646576, "step": 3475, "valid_targets_mean": 3328.4, "valid_targets_min": 1111 }, { "epoch": 4.280442804428044, "grad_norm": 0.5347155449526627, "learning_rate": 1.5756596433097436e-05, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.039694249629974365, "step": 3480, "valid_targets_mean": 1989.2, "valid_targets_min": 635 }, { "epoch": 4.286592865928659, "grad_norm": 0.4963480566458479, "learning_rate": 1.5696665949124333e-05, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.051367416977882385, "step": 3485, "valid_targets_mean": 3011.5, "valid_targets_min": 1073 }, { "epoch": 4.292742927429274, "grad_norm": 0.563274477988766, "learning_rate": 1.563677595395277e-05, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.07458598166704178, "step": 3490, "valid_targets_mean": 3607.5, "valid_targets_min": 746 }, { "epoch": 4.2988929889298895, "grad_norm": 0.5506382266547923, "learning_rate": 1.557692701107005e-05, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.07375942170619965, "step": 3495, "valid_targets_mean": 3713.5, "valid_targets_min": 831 }, { "epoch": 4.305043050430505, "grad_norm": 0.562915106596071, "learning_rate": 1.5517119683577228e-05, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.07103714346885681, "step": 3500, "valid_targets_mean": 2919.8, "valid_targets_min": 815 }, { "epoch": 4.31119311193112, "grad_norm": 0.5284114186722062, "learning_rate": 1.5457354534183825e-05, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.06331208348274231, "step": 3505, "valid_targets_mean": 3634.5, "valid_targets_min": 634 }, { "epoch": 4.317343173431734, "grad_norm": 0.5424417577852826, "learning_rate": 1.5397632125202505e-05, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.06771031022071838, "step": 3510, "valid_targets_mean": 3430.8, "valid_targets_min": 861 }, { "epoch": 4.323493234932349, "grad_norm": 0.5595521906404591, "learning_rate": 1.5337953018543824e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.0629117339849472, "step": 3515, "valid_targets_mean": 3504.6, "valid_targets_min": 1385 }, { "epoch": 4.329643296432964, "grad_norm": 0.4804400726372417, "learning_rate": 1.527831777571089e-05, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.0816967785358429, "step": 3520, "valid_targets_mean": 4754.1, "valid_targets_min": 1030 }, { "epoch": 4.3357933579335795, "grad_norm": 0.552143026803764, "learning_rate": 1.5218726957794125e-05, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.08584423363208771, "step": 3525, "valid_targets_mean": 4075.2, "valid_targets_min": 765 }, { "epoch": 4.341943419434195, "grad_norm": 0.4550423203649379, "learning_rate": 1.5159181125465983e-05, "loss": 0.1395, "loss_nan_ranks": 0, "loss_rank_avg": 0.07080920785665512, "step": 3530, "valid_targets_mean": 4762.4, "valid_targets_min": 1447 }, { "epoch": 4.34809348093481, "grad_norm": 0.4731313758684058, "learning_rate": 1.5099680838975623e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.10025142133235931, "step": 3535, "valid_targets_mean": 6244.4, "valid_targets_min": 2427 }, { "epoch": 4.354243542435424, "grad_norm": 0.5099627239673542, "learning_rate": 1.5040226658143724e-05, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.08871401101350784, "step": 3540, "valid_targets_mean": 4634.8, "valid_targets_min": 1485 }, { "epoch": 4.360393603936039, "grad_norm": 0.4938553918682398, "learning_rate": 1.4980819142357137e-05, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.064915731549263, "step": 3545, "valid_targets_mean": 3435.2, "valid_targets_min": 309 }, { "epoch": 4.366543665436654, "grad_norm": 0.5428877092509158, "learning_rate": 1.4921458850563661e-05, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.09234040230512619, "step": 3550, "valid_targets_mean": 4554.2, "valid_targets_min": 704 }, { "epoch": 4.372693726937269, "grad_norm": 0.4750006082582889, "learning_rate": 1.4862146341266795e-05, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.058801207691431046, "step": 3555, "valid_targets_mean": 4011.9, "valid_targets_min": 726 }, { "epoch": 4.378843788437885, "grad_norm": 0.48944255581598395, "learning_rate": 1.4802882172520441e-05, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.08306654542684555, "step": 3560, "valid_targets_mean": 4794.6, "valid_targets_min": 995 }, { "epoch": 4.3849938499385, "grad_norm": 0.4962246966604672, "learning_rate": 1.4743666901923704e-05, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.0678686648607254, "step": 3565, "valid_targets_mean": 4336.4, "valid_targets_min": 1269 }, { "epoch": 4.391143911439114, "grad_norm": 0.5577783730998841, "learning_rate": 1.4684501086615606e-05, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.07702550292015076, "step": 3570, "valid_targets_mean": 2855.1, "valid_targets_min": 1222 }, { "epoch": 4.397293972939729, "grad_norm": 0.6315673514546636, "learning_rate": 1.4625385283269848e-05, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.07370610535144806, "step": 3575, "valid_targets_mean": 2643.2, "valid_targets_min": 740 }, { "epoch": 4.403444034440344, "grad_norm": 0.4706672123986462, "learning_rate": 1.4566320048089624e-05, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.07439061999320984, "step": 3580, "valid_targets_mean": 4146.6, "valid_targets_min": 1246 }, { "epoch": 4.409594095940959, "grad_norm": 0.5298482881625111, "learning_rate": 1.45073059368023e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.0937977135181427, "step": 3585, "valid_targets_mean": 4273.1, "valid_targets_min": 1177 }, { "epoch": 4.415744157441575, "grad_norm": 0.49894653084638463, "learning_rate": 1.4448343504654262e-05, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.0636676624417305, "step": 3590, "valid_targets_mean": 3722.4, "valid_targets_min": 895 }, { "epoch": 4.42189421894219, "grad_norm": 0.5852816524531729, "learning_rate": 1.4389433306405653e-05, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.07260304689407349, "step": 3595, "valid_targets_mean": 2942.8, "valid_targets_min": 974 }, { "epoch": 4.428044280442805, "grad_norm": 0.6045345485972843, "learning_rate": 1.4330575896325152e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.09738698601722717, "step": 3600, "valid_targets_mean": 3473.6, "valid_targets_min": 949 }, { "epoch": 4.434194341943419, "grad_norm": 0.5317173258708445, "learning_rate": 1.4271771828184796e-05, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.08094622194766998, "step": 3605, "valid_targets_mean": 3401.8, "valid_targets_min": 934 }, { "epoch": 4.440344403444034, "grad_norm": 0.5677701759120205, "learning_rate": 1.4213021655254707e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.059883564710617065, "step": 3610, "valid_targets_mean": 2934.5, "valid_targets_min": 722 }, { "epoch": 4.446494464944649, "grad_norm": 0.5829831762933306, "learning_rate": 1.415432593029797e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.08871051669120789, "step": 3615, "valid_targets_mean": 3333.5, "valid_targets_min": 1255 }, { "epoch": 4.4526445264452645, "grad_norm": 0.5222148556635265, "learning_rate": 1.4095685205565342e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.08161695301532745, "step": 3620, "valid_targets_mean": 4200.1, "valid_targets_min": 1356 }, { "epoch": 4.45879458794588, "grad_norm": 0.4255139007077249, "learning_rate": 1.4037100032790107e-05, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.06346962600946426, "step": 3625, "valid_targets_mean": 4612.5, "valid_targets_min": 750 }, { "epoch": 4.464944649446495, "grad_norm": 0.5914681178825688, "learning_rate": 1.397857096318291e-05, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.06928400695323944, "step": 3630, "valid_targets_mean": 2383.4, "valid_targets_min": 1175 }, { "epoch": 4.471094710947109, "grad_norm": 0.5686194327258245, "learning_rate": 1.3920098547426491e-05, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.09494592994451523, "step": 3635, "valid_targets_mean": 3825.9, "valid_targets_min": 1518 }, { "epoch": 4.477244772447724, "grad_norm": 0.5694822397512799, "learning_rate": 1.386168333567059e-05, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.09039486944675446, "step": 3640, "valid_targets_mean": 3836.8, "valid_targets_min": 869 }, { "epoch": 4.483394833948339, "grad_norm": 0.47822365496970226, "learning_rate": 1.3803325877526703e-05, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.06846988201141357, "step": 3645, "valid_targets_mean": 4471.9, "valid_targets_min": 750 }, { "epoch": 4.4895448954489545, "grad_norm": 0.5026771497972639, "learning_rate": 1.3745026722062956e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.07252183556556702, "step": 3650, "valid_targets_mean": 4237.2, "valid_targets_min": 1263 }, { "epoch": 4.49569495694957, "grad_norm": 0.47401726649085274, "learning_rate": 1.3686786417798916e-05, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.06462505459785461, "step": 3655, "valid_targets_mean": 4246.4, "valid_targets_min": 1076 }, { "epoch": 4.501845018450185, "grad_norm": 0.49458926492319905, "learning_rate": 1.3628605512700431e-05, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.08224207162857056, "step": 3660, "valid_targets_mean": 4970.0, "valid_targets_min": 655 }, { "epoch": 4.507995079950799, "grad_norm": 0.5147416213357333, "learning_rate": 1.3570484554174505e-05, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.07062176614999771, "step": 3665, "valid_targets_mean": 3785.0, "valid_targets_min": 1201 }, { "epoch": 4.514145141451414, "grad_norm": 0.5636561095129219, "learning_rate": 1.3512424089064088e-05, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.08134806901216507, "step": 3670, "valid_targets_mean": 3404.5, "valid_targets_min": 746 }, { "epoch": 4.520295202952029, "grad_norm": 0.6062136107490886, "learning_rate": 1.3454424663642977e-05, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.07669124007225037, "step": 3675, "valid_targets_mean": 2703.5, "valid_targets_min": 1078 }, { "epoch": 4.5264452644526445, "grad_norm": 0.5138410760038257, "learning_rate": 1.3396486823610682e-05, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.07008562982082367, "step": 3680, "valid_targets_mean": 3448.0, "valid_targets_min": 1073 }, { "epoch": 4.53259532595326, "grad_norm": 0.5258186936308812, "learning_rate": 1.3338611114087252e-05, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.07793732732534409, "step": 3685, "valid_targets_mean": 3311.5, "valid_targets_min": 1538 }, { "epoch": 4.538745387453875, "grad_norm": 0.48558932245633596, "learning_rate": 1.3280798079608181e-05, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.07997334748506546, "step": 3690, "valid_targets_mean": 4464.2, "valid_targets_min": 727 }, { "epoch": 4.54489544895449, "grad_norm": 0.4972841188317051, "learning_rate": 1.3223048264119269e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.06024523079395294, "step": 3695, "valid_targets_mean": 4078.1, "valid_targets_min": 808 }, { "epoch": 4.551045510455104, "grad_norm": 0.465057621006943, "learning_rate": 1.3165362210971501e-05, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.068995401263237, "step": 3700, "valid_targets_mean": 3970.1, "valid_targets_min": 773 }, { "epoch": 4.557195571955719, "grad_norm": 0.49976069741713, "learning_rate": 1.3107740462915953e-05, "loss": 0.1407, "loss_nan_ranks": 0, "loss_rank_avg": 0.05405917018651962, "step": 3705, "valid_targets_mean": 3382.1, "valid_targets_min": 627 }, { "epoch": 4.5633456334563345, "grad_norm": 0.47422656680463937, "learning_rate": 1.3050183562098653e-05, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.05915185436606407, "step": 3710, "valid_targets_mean": 4194.0, "valid_targets_min": 754 }, { "epoch": 4.56949569495695, "grad_norm": 0.5928831954299879, "learning_rate": 1.299269205005553e-05, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.05791758745908737, "step": 3715, "valid_targets_mean": 1995.2, "valid_targets_min": 656 }, { "epoch": 4.575645756457565, "grad_norm": 0.4831304370797475, "learning_rate": 1.2935266467707275e-05, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.06728240847587585, "step": 3720, "valid_targets_mean": 5017.4, "valid_targets_min": 1511 }, { "epoch": 4.58179581795818, "grad_norm": 0.5776107680657485, "learning_rate": 1.287790735535424e-05, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.04329244792461395, "step": 3725, "valid_targets_mean": 2134.9, "valid_targets_min": 829 }, { "epoch": 4.587945879458795, "grad_norm": 0.4449963835783109, "learning_rate": 1.2820615252671434e-05, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.061272963881492615, "step": 3730, "valid_targets_mean": 4642.6, "valid_targets_min": 1366 }, { "epoch": 4.594095940959409, "grad_norm": 0.5235970561683299, "learning_rate": 1.2763390698703341e-05, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.07071864604949951, "step": 3735, "valid_targets_mean": 3672.9, "valid_targets_min": 1062 }, { "epoch": 4.6002460024600245, "grad_norm": 0.6572220272058902, "learning_rate": 1.2706234231858932e-05, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.07880595326423645, "step": 3740, "valid_targets_mean": 2513.5, "valid_targets_min": 796 }, { "epoch": 4.60639606396064, "grad_norm": 0.582577179421199, "learning_rate": 1.2649146389906553e-05, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.07004042714834213, "step": 3745, "valid_targets_mean": 2945.9, "valid_targets_min": 825 }, { "epoch": 4.612546125461255, "grad_norm": 0.5720410190558141, "learning_rate": 1.259212770996887e-05, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.10302242636680603, "step": 3750, "valid_targets_mean": 5194.1, "valid_targets_min": 975 }, { "epoch": 4.61869618696187, "grad_norm": 0.4896174083665472, "learning_rate": 1.2535178728517852e-05, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.07344147562980652, "step": 3755, "valid_targets_mean": 4385.2, "valid_targets_min": 848 }, { "epoch": 4.624846248462484, "grad_norm": 0.5756366891167546, "learning_rate": 1.2478299981369667e-05, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.0843324139714241, "step": 3760, "valid_targets_mean": 4323.6, "valid_targets_min": 888 }, { "epoch": 4.630996309963099, "grad_norm": 0.6237415331280456, "learning_rate": 1.2421492003679671e-05, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.08802750706672668, "step": 3765, "valid_targets_mean": 3715.6, "valid_targets_min": 818 }, { "epoch": 4.6371463714637144, "grad_norm": 0.4992602705757155, "learning_rate": 1.2364755329937403e-05, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.07272461801767349, "step": 3770, "valid_targets_mean": 4209.1, "valid_targets_min": 993 }, { "epoch": 4.64329643296433, "grad_norm": 0.47324861839611904, "learning_rate": 1.2308090493961484e-05, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.06892076879739761, "step": 3775, "valid_targets_mean": 4364.8, "valid_targets_min": 1213 }, { "epoch": 4.649446494464945, "grad_norm": 0.5144479425298557, "learning_rate": 1.2251498028894658e-05, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.06068869307637215, "step": 3780, "valid_targets_mean": 3596.5, "valid_targets_min": 1265 }, { "epoch": 4.65559655596556, "grad_norm": 0.543136696144552, "learning_rate": 1.2194978467198748e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.062472306191921234, "step": 3785, "valid_targets_mean": 3187.6, "valid_targets_min": 626 }, { "epoch": 4.661746617466175, "grad_norm": 0.5286524894298498, "learning_rate": 1.2138532340649638e-05, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.07963377237319946, "step": 3790, "valid_targets_mean": 4249.2, "valid_targets_min": 902 }, { "epoch": 4.667896678966789, "grad_norm": 0.6567560149626056, "learning_rate": 1.2082160180332308e-05, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.09163267910480499, "step": 3795, "valid_targets_mean": 3868.6, "valid_targets_min": 777 }, { "epoch": 4.674046740467404, "grad_norm": 0.46351341634770754, "learning_rate": 1.2025862516635782e-05, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.07743068784475327, "step": 3800, "valid_targets_mean": 4704.1, "valid_targets_min": 911 }, { "epoch": 4.68019680196802, "grad_norm": 0.6354546361725474, "learning_rate": 1.19696398792482e-05, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.09236712753772736, "step": 3805, "valid_targets_mean": 4463.0, "valid_targets_min": 1009 }, { "epoch": 4.686346863468635, "grad_norm": 0.6435358425703358, "learning_rate": 1.1913492797151772e-05, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.08572517335414886, "step": 3810, "valid_targets_mean": 3627.5, "valid_targets_min": 804 }, { "epoch": 4.69249692496925, "grad_norm": 0.4901786337459368, "learning_rate": 1.1857421798617837e-05, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.07259362936019897, "step": 3815, "valid_targets_mean": 3976.0, "valid_targets_min": 938 }, { "epoch": 4.698646986469865, "grad_norm": 0.48477130636044624, "learning_rate": 1.1801427411201903e-05, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.06874503195285797, "step": 3820, "valid_targets_mean": 4498.1, "valid_targets_min": 1256 }, { "epoch": 4.70479704797048, "grad_norm": 0.6168880714679651, "learning_rate": 1.1745510161738646e-05, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.07084785401821136, "step": 3825, "valid_targets_mean": 2575.5, "valid_targets_min": 1390 }, { "epoch": 4.710947109471094, "grad_norm": 0.5195154399095956, "learning_rate": 1.1689670576336991e-05, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.0658005028963089, "step": 3830, "valid_targets_mean": 3332.1, "valid_targets_min": 449 }, { "epoch": 4.7170971709717096, "grad_norm": 0.5136729697158225, "learning_rate": 1.1633909180375138e-05, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.03681659698486328, "step": 3835, "valid_targets_mean": 1849.9, "valid_targets_min": 1062 }, { "epoch": 4.723247232472325, "grad_norm": 0.44969242982556784, "learning_rate": 1.1578226498495608e-05, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.06825601309537888, "step": 3840, "valid_targets_mean": 5380.5, "valid_targets_min": 1812 }, { "epoch": 4.72939729397294, "grad_norm": 0.5221717431192702, "learning_rate": 1.1522623054600355e-05, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.08411978930234909, "step": 3845, "valid_targets_mean": 4392.5, "valid_targets_min": 1174 }, { "epoch": 4.735547355473555, "grad_norm": 0.5960531445910542, "learning_rate": 1.1467099371845783e-05, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.08852316439151764, "step": 3850, "valid_targets_mean": 3556.5, "valid_targets_min": 908 }, { "epoch": 4.741697416974169, "grad_norm": 0.6081536661118019, "learning_rate": 1.1411655972637865e-05, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.08051259815692902, "step": 3855, "valid_targets_mean": 3077.5, "valid_targets_min": 1030 }, { "epoch": 4.747847478474784, "grad_norm": 0.5274281577052315, "learning_rate": 1.13562933786272e-05, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.07737687230110168, "step": 3860, "valid_targets_mean": 3497.4, "valid_targets_min": 660 }, { "epoch": 4.7539975399753995, "grad_norm": 0.41390929742086996, "learning_rate": 1.1301012110704105e-05, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.056217439472675323, "step": 3865, "valid_targets_mean": 5030.4, "valid_targets_min": 1301 }, { "epoch": 4.760147601476015, "grad_norm": 0.5075257633026137, "learning_rate": 1.1245812688993741e-05, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.07909762859344482, "step": 3870, "valid_targets_mean": 5072.0, "valid_targets_min": 1457 }, { "epoch": 4.76629766297663, "grad_norm": 0.6056323717965811, "learning_rate": 1.1190695632851187e-05, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.06616080552339554, "step": 3875, "valid_targets_mean": 3140.9, "valid_targets_min": 697 }, { "epoch": 4.772447724477245, "grad_norm": 0.4882086217169741, "learning_rate": 1.1135661460856589e-05, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.055649369955062866, "step": 3880, "valid_targets_mean": 3043.1, "valid_targets_min": 1408 }, { "epoch": 4.77859778597786, "grad_norm": 0.5413567443991248, "learning_rate": 1.1080710690810244e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.10606395453214645, "step": 3885, "valid_targets_mean": 5074.6, "valid_targets_min": 1719 }, { "epoch": 4.784747847478474, "grad_norm": 0.5624429541241354, "learning_rate": 1.1025843839727735e-05, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.085678331553936, "step": 3890, "valid_targets_mean": 4083.0, "valid_targets_min": 1050 }, { "epoch": 4.7908979089790895, "grad_norm": 0.49625521938538614, "learning_rate": 1.0971061423835113e-05, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.0709814801812172, "step": 3895, "valid_targets_mean": 4170.6, "valid_targets_min": 874 }, { "epoch": 4.797047970479705, "grad_norm": 0.5077584404709818, "learning_rate": 1.0916363958563967e-05, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.06389714032411575, "step": 3900, "valid_targets_mean": 3698.9, "valid_targets_min": 1368 }, { "epoch": 4.80319803198032, "grad_norm": 0.5067180682852067, "learning_rate": 1.0861751958546626e-05, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.06770926713943481, "step": 3905, "valid_targets_mean": 3907.0, "valid_targets_min": 888 }, { "epoch": 4.809348093480935, "grad_norm": 0.53237355606112, "learning_rate": 1.0807225937611299e-05, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.06792059540748596, "step": 3910, "valid_targets_mean": 3627.5, "valid_targets_min": 851 }, { "epoch": 4.81549815498155, "grad_norm": 0.5204671492605579, "learning_rate": 1.0752786408777238e-05, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.08350042998790741, "step": 3915, "valid_targets_mean": 4186.5, "valid_targets_min": 829 }, { "epoch": 4.821648216482165, "grad_norm": 0.5312367760073929, "learning_rate": 1.0698433884249933e-05, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.0519859679043293, "step": 3920, "valid_targets_mean": 2146.4, "valid_targets_min": 906 }, { "epoch": 4.8277982779827795, "grad_norm": 0.499503075851238, "learning_rate": 1.0644168875416252e-05, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.07208546996116638, "step": 3925, "valid_targets_mean": 4055.0, "valid_targets_min": 1222 }, { "epoch": 4.833948339483395, "grad_norm": 0.6885457068358782, "learning_rate": 1.0589991892839683e-05, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.0665866881608963, "step": 3930, "valid_targets_mean": 2886.0, "valid_targets_min": 1019 }, { "epoch": 4.84009840098401, "grad_norm": 0.48038254936054964, "learning_rate": 1.0535903446255475e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.08551338315010071, "step": 3935, "valid_targets_mean": 6053.8, "valid_targets_min": 1559 }, { "epoch": 4.846248462484625, "grad_norm": 0.4855937379594069, "learning_rate": 1.0481904044565881e-05, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.0735793262720108, "step": 3940, "valid_targets_mean": 4364.6, "valid_targets_min": 684 }, { "epoch": 4.85239852398524, "grad_norm": 0.6220477710887902, "learning_rate": 1.0427994195835347e-05, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.07010868936777115, "step": 3945, "valid_targets_mean": 2520.4, "valid_targets_min": 789 }, { "epoch": 4.858548585485855, "grad_norm": 0.5554550711680113, "learning_rate": 1.0374174407285747e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.07773833721876144, "step": 3950, "valid_targets_mean": 3834.2, "valid_targets_min": 801 }, { "epoch": 4.8646986469864695, "grad_norm": 0.4748342627057833, "learning_rate": 1.0320445185291617e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.08634714037179947, "step": 3955, "valid_targets_mean": 4488.9, "valid_targets_min": 2086 }, { "epoch": 4.870848708487085, "grad_norm": 0.5360432120626524, "learning_rate": 1.0266807035375361e-05, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.07135751098394394, "step": 3960, "valid_targets_mean": 3104.8, "valid_targets_min": 737 }, { "epoch": 4.8769987699877, "grad_norm": 0.5569738960572754, "learning_rate": 1.0213260462202516e-05, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.08494162559509277, "step": 3965, "valid_targets_mean": 3775.0, "valid_targets_min": 1197 }, { "epoch": 4.883148831488315, "grad_norm": 0.6288639728621314, "learning_rate": 1.0159805969577023e-05, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.09134040772914886, "step": 3970, "valid_targets_mean": 2802.6, "valid_targets_min": 810 }, { "epoch": 4.88929889298893, "grad_norm": 0.5331710918825406, "learning_rate": 1.0106444060436418e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.06761527061462402, "step": 3975, "valid_targets_mean": 2761.5, "valid_targets_min": 822 }, { "epoch": 4.895448954489545, "grad_norm": 0.5242148922223903, "learning_rate": 1.0053175236847194e-05, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.09052105247974396, "step": 3980, "valid_targets_mean": 4687.2, "valid_targets_min": 1014 }, { "epoch": 4.9015990159901595, "grad_norm": 0.573693513407013, "learning_rate": 1.0000000000000006e-05, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.06895217299461365, "step": 3985, "valid_targets_mean": 3968.4, "valid_targets_min": 1162 }, { "epoch": 4.907749077490775, "grad_norm": 0.5349411087388412, "learning_rate": 9.94691885020497e-06, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.055875398218631744, "step": 3990, "valid_targets_mean": 2503.1, "valid_targets_min": 1200 }, { "epoch": 4.91389913899139, "grad_norm": 0.46427537558278087, "learning_rate": 9.893932286886994e-06, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.08818367123603821, "step": 3995, "valid_targets_mean": 5586.0, "valid_targets_min": 773 }, { "epoch": 4.920049200492005, "grad_norm": 0.48713774481651195, "learning_rate": 9.841040808581023e-06, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.09311980754137039, "step": 4000, "valid_targets_mean": 5138.4, "valid_targets_min": 1622 }, { "epoch": 4.92619926199262, "grad_norm": 0.5352749285926348, "learning_rate": 9.78824491292739e-06, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.08384846150875092, "step": 4005, "valid_targets_mean": 4028.9, "valid_targets_min": 809 }, { "epoch": 4.932349323493235, "grad_norm": 0.5282980096403203, "learning_rate": 9.73554509666711e-06, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.08767678588628769, "step": 4010, "valid_targets_mean": 4881.1, "valid_targets_min": 1480 }, { "epoch": 4.93849938499385, "grad_norm": 0.5586423840236229, "learning_rate": 9.682941855637212e-06, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.07774870097637177, "step": 4015, "valid_targets_mean": 3326.1, "valid_targets_min": 733 }, { "epoch": 4.944649446494465, "grad_norm": 0.441482304162159, "learning_rate": 9.6304356847661e-06, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.0827236920595169, "step": 4020, "valid_targets_mean": 5296.1, "valid_targets_min": 1661 }, { "epoch": 4.95079950799508, "grad_norm": 0.5388929133942453, "learning_rate": 9.57802707806884e-06, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.08114897459745407, "step": 4025, "valid_targets_mean": 3976.1, "valid_targets_min": 1091 }, { "epoch": 4.956949569495695, "grad_norm": 0.4526069870272038, "learning_rate": 9.525716528642586e-06, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.06927553564310074, "step": 4030, "valid_targets_mean": 4801.6, "valid_targets_min": 1166 }, { "epoch": 4.96309963099631, "grad_norm": 0.4454345323251501, "learning_rate": 9.473504528661861e-06, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.06050243228673935, "step": 4035, "valid_targets_mean": 4023.6, "valid_targets_min": 1017 }, { "epoch": 4.969249692496925, "grad_norm": 0.5575436642753206, "learning_rate": 9.421391569373985e-06, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.10379059612751007, "step": 4040, "valid_targets_mean": 4639.4, "valid_targets_min": 1339 }, { "epoch": 4.97539975399754, "grad_norm": 0.504681637684389, "learning_rate": 9.369378141094432e-06, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.041682638227939606, "step": 4045, "valid_targets_mean": 2344.9, "valid_targets_min": 747 }, { "epoch": 4.9815498154981555, "grad_norm": 0.5032705259761875, "learning_rate": 9.31746473320221e-06, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.0683014988899231, "step": 4050, "valid_targets_mean": 3720.0, "valid_targets_min": 647 }, { "epoch": 4.98769987699877, "grad_norm": 0.44183651131256785, "learning_rate": 9.265651834135269e-06, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.061229877173900604, "step": 4055, "valid_targets_mean": 3820.8, "valid_targets_min": 889 }, { "epoch": 4.993849938499385, "grad_norm": 0.5175046321055239, "learning_rate": 9.213939931385916e-06, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.06363791227340698, "step": 4060, "valid_targets_mean": 3328.5, "valid_targets_min": 1207 }, { "epoch": 5.0, "grad_norm": 0.5287980278487949, "learning_rate": 9.162329511496186e-06, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.04995204508304596, "step": 4065, "valid_targets_mean": 2923.9, "valid_targets_min": 659 }, { "epoch": 5.006150061500615, "grad_norm": 0.4785771117273528, "learning_rate": 9.110821060053316e-06, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.06151096150279045, "step": 4070, "valid_targets_mean": 3563.6, "valid_targets_min": 642 }, { "epoch": 5.01230012300123, "grad_norm": 0.5049824641002617, "learning_rate": 9.059415061685148e-06, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.08826617151498795, "step": 4075, "valid_targets_mean": 4935.4, "valid_targets_min": 727 }, { "epoch": 5.018450184501845, "grad_norm": 0.6469695131202428, "learning_rate": 9.008112000055542e-06, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.04977300763130188, "step": 4080, "valid_targets_mean": 2149.4, "valid_targets_min": 567 }, { "epoch": 5.02460024600246, "grad_norm": 0.5712167917407098, "learning_rate": 8.956912357859904e-06, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.039753835648298264, "step": 4085, "valid_targets_mean": 2464.6, "valid_targets_min": 920 }, { "epoch": 5.030750307503075, "grad_norm": 0.6081788808312366, "learning_rate": 8.90581661682056e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.06659470498561859, "step": 4090, "valid_targets_mean": 2849.0, "valid_targets_min": 613 }, { "epoch": 5.03690036900369, "grad_norm": 0.5628471620837191, "learning_rate": 8.854825257682287e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.0829765647649765, "step": 4095, "valid_targets_mean": 4282.0, "valid_targets_min": 772 }, { "epoch": 5.043050430504305, "grad_norm": 0.5910867284637292, "learning_rate": 8.803938760207748e-06, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.05292678251862526, "step": 4100, "valid_targets_mean": 2229.6, "valid_targets_min": 780 }, { "epoch": 5.04920049200492, "grad_norm": 0.6923670551347763, "learning_rate": 8.753157603172997e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.07180257141590118, "step": 4105, "valid_targets_mean": 2584.1, "valid_targets_min": 1083 }, { "epoch": 5.055350553505535, "grad_norm": 0.5399803857583291, "learning_rate": 8.70248226436297e-06, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.05704289674758911, "step": 4110, "valid_targets_mean": 3451.8, "valid_targets_min": 790 }, { "epoch": 5.06150061500615, "grad_norm": 0.6178170330499573, "learning_rate": 8.651913220566985e-06, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.05068812146782875, "step": 4115, "valid_targets_mean": 2423.1, "valid_targets_min": 889 }, { "epoch": 5.067650676506765, "grad_norm": 0.6070925996863827, "learning_rate": 8.601450947574281e-06, "loss": 0.1356, "loss_nan_ranks": 0, "loss_rank_avg": 0.0549185574054718, "step": 4120, "valid_targets_mean": 2540.6, "valid_targets_min": 1157 }, { "epoch": 5.07380073800738, "grad_norm": 0.6557178619364926, "learning_rate": 8.551095920169505e-06, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.06462284922599792, "step": 4125, "valid_targets_mean": 2918.8, "valid_targets_min": 874 }, { "epoch": 5.079950799507995, "grad_norm": 0.48332087977767, "learning_rate": 8.500848612128256e-06, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.06660201400518417, "step": 4130, "valid_targets_mean": 4803.1, "valid_targets_min": 1570 }, { "epoch": 5.08610086100861, "grad_norm": 0.5603027314423431, "learning_rate": 8.450709496212656e-06, "loss": 0.1326, "loss_nan_ranks": 0, "loss_rank_avg": 0.06227262318134308, "step": 4135, "valid_targets_mean": 3059.6, "valid_targets_min": 810 }, { "epoch": 5.092250922509225, "grad_norm": 0.5464937469808374, "learning_rate": 8.400679044166866e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.06879455596208572, "step": 4140, "valid_targets_mean": 3663.6, "valid_targets_min": 844 }, { "epoch": 5.0984009840098405, "grad_norm": 0.49805111101150573, "learning_rate": 8.350757726712654e-06, "loss": 0.1346, "loss_nan_ranks": 0, "loss_rank_avg": 0.0746736004948616, "step": 4145, "valid_targets_mean": 4985.0, "valid_targets_min": 888 }, { "epoch": 5.104551045510455, "grad_norm": 0.5473078398477096, "learning_rate": 8.300946013544986e-06, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.05511518940329552, "step": 4150, "valid_targets_mean": 3267.4, "valid_targets_min": 711 }, { "epoch": 5.11070110701107, "grad_norm": 0.4790352465578367, "learning_rate": 8.251244373327575e-06, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.05356874689459801, "step": 4155, "valid_targets_mean": 3838.9, "valid_targets_min": 698 }, { "epoch": 5.116851168511685, "grad_norm": 0.5173429050043004, "learning_rate": 8.201653273688518e-06, "loss": 0.1356, "loss_nan_ranks": 0, "loss_rank_avg": 0.06376117467880249, "step": 4160, "valid_targets_mean": 3924.8, "valid_targets_min": 682 }, { "epoch": 5.1230012300123, "grad_norm": 0.49619999281719224, "learning_rate": 8.15217318121584e-06, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.0763036385178566, "step": 4165, "valid_targets_mean": 5031.5, "valid_targets_min": 1159 }, { "epoch": 5.129151291512915, "grad_norm": 0.6886197883366834, "learning_rate": 8.10280456145316e-06, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.06304652988910675, "step": 4170, "valid_targets_mean": 2223.1, "valid_targets_min": 933 }, { "epoch": 5.1353013530135305, "grad_norm": 0.6353351707891169, "learning_rate": 8.053547878895262e-06, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.08870084583759308, "step": 4175, "valid_targets_mean": 5869.8, "valid_targets_min": 1660 }, { "epoch": 5.141451414514145, "grad_norm": 0.5427256920132474, "learning_rate": 8.00440359698375e-06, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.06112075224518776, "step": 4180, "valid_targets_mean": 3706.9, "valid_targets_min": 799 }, { "epoch": 5.14760147601476, "grad_norm": 0.4931303708484275, "learning_rate": 7.955372178102686e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.0511876679956913, "step": 4185, "valid_targets_mean": 3994.8, "valid_targets_min": 657 }, { "epoch": 5.153751537515375, "grad_norm": 0.7230617633736471, "learning_rate": 7.906454083574226e-06, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.05878932774066925, "step": 4190, "valid_targets_mean": 1831.1, "valid_targets_min": 642 }, { "epoch": 5.15990159901599, "grad_norm": 0.6599402185288566, "learning_rate": 7.857649773654322e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.09495142102241516, "step": 4195, "valid_targets_mean": 3926.4, "valid_targets_min": 881 }, { "epoch": 5.166051660516605, "grad_norm": 0.5648942987083065, "learning_rate": 7.808959707528327e-06, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.06887968629598618, "step": 4200, "valid_targets_mean": 3425.8, "valid_targets_min": 1495 }, { "epoch": 5.1722017220172205, "grad_norm": 0.5372484579852459, "learning_rate": 7.760384343306715e-06, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.06378699094057083, "step": 4205, "valid_targets_mean": 4489.6, "valid_targets_min": 1153 }, { "epoch": 5.178351783517835, "grad_norm": 0.5609304848272691, "learning_rate": 7.711924138020784e-06, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.09759139269590378, "step": 4210, "valid_targets_mean": 3769.9, "valid_targets_min": 750 }, { "epoch": 5.18450184501845, "grad_norm": 0.4818577511888391, "learning_rate": 7.663579547618311e-06, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.050046101212501526, "step": 4215, "valid_targets_mean": 3101.2, "valid_targets_min": 1367 }, { "epoch": 5.190651906519065, "grad_norm": 0.6574419406424697, "learning_rate": 7.615351026959299e-06, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.06832084059715271, "step": 4220, "valid_targets_mean": 2211.8, "valid_targets_min": 861 }, { "epoch": 5.19680196801968, "grad_norm": 0.534102056865247, "learning_rate": 7.567239029811677e-06, "loss": 0.1253, "loss_nan_ranks": 0, "loss_rank_avg": 0.07990866899490356, "step": 4225, "valid_targets_mean": 4538.5, "valid_targets_min": 948 }, { "epoch": 5.202952029520295, "grad_norm": 0.5459890166096859, "learning_rate": 7.519244008847042e-06, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.059343911707401276, "step": 4230, "valid_targets_mean": 3617.5, "valid_targets_min": 1149 }, { "epoch": 5.2091020910209105, "grad_norm": 0.4965065159797279, "learning_rate": 7.471366415636407e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.07250720262527466, "step": 4235, "valid_targets_mean": 4636.0, "valid_targets_min": 1207 }, { "epoch": 5.215252152521526, "grad_norm": 0.5368507598251694, "learning_rate": 7.423606700645924e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.05517926812171936, "step": 4240, "valid_targets_mean": 2792.1, "valid_targets_min": 710 }, { "epoch": 5.22140221402214, "grad_norm": 0.5627823490501318, "learning_rate": 7.375965313232689e-06, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.08396650850772858, "step": 4245, "valid_targets_mean": 4103.9, "valid_targets_min": 607 }, { "epoch": 5.227552275522755, "grad_norm": 0.6026850979363331, "learning_rate": 7.328442701640455e-06, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.07790623605251312, "step": 4250, "valid_targets_mean": 3153.5, "valid_targets_min": 987 }, { "epoch": 5.23370233702337, "grad_norm": 0.5268265024874609, "learning_rate": 7.281039312995462e-06, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.06084034591913223, "step": 4255, "valid_targets_mean": 3125.0, "valid_targets_min": 1157 }, { "epoch": 5.239852398523985, "grad_norm": 0.5854489793935117, "learning_rate": 7.233755593302236e-06, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.0571461096405983, "step": 4260, "valid_targets_mean": 2466.8, "valid_targets_min": 936 }, { "epoch": 5.2460024600246005, "grad_norm": 0.49665126539240234, "learning_rate": 7.186591987439344e-06, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.05833997204899788, "step": 4265, "valid_targets_mean": 4250.1, "valid_targets_min": 1311 }, { "epoch": 5.252152521525216, "grad_norm": 0.6149568899035343, "learning_rate": 7.139548939155265e-06, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.08298102021217346, "step": 4270, "valid_targets_mean": 3524.6, "valid_targets_min": 862 }, { "epoch": 5.25830258302583, "grad_norm": 0.49986537787060903, "learning_rate": 7.09262689106416e-06, "loss": 0.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.08084630221128464, "step": 4275, "valid_targets_mean": 5082.0, "valid_targets_min": 807 }, { "epoch": 5.264452644526445, "grad_norm": 0.5095804577841002, "learning_rate": 7.045826284641755e-06, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.09113496541976929, "step": 4280, "valid_targets_mean": 5525.5, "valid_targets_min": 1838 }, { "epoch": 5.27060270602706, "grad_norm": 0.5800095036467529, "learning_rate": 6.999147560221155e-06, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.08298463374376297, "step": 4285, "valid_targets_mean": 4589.1, "valid_targets_min": 722 }, { "epoch": 5.276752767527675, "grad_norm": 0.5008947329331649, "learning_rate": 6.952591156988715e-06, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.07245397567749023, "step": 4290, "valid_targets_mean": 4993.2, "valid_targets_min": 1222 }, { "epoch": 5.2829028290282904, "grad_norm": 0.5695620281334599, "learning_rate": 6.906157512979919e-06, "loss": 0.1392, "loss_nan_ranks": 0, "loss_rank_avg": 0.06223241984844208, "step": 4295, "valid_targets_mean": 3146.4, "valid_targets_min": 694 }, { "epoch": 5.289052890528906, "grad_norm": 0.497306924306098, "learning_rate": 6.859847065075229e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.08233607560396194, "step": 4300, "valid_targets_mean": 5098.9, "valid_targets_min": 988 }, { "epoch": 5.29520295202952, "grad_norm": 0.6017082112417436, "learning_rate": 6.813660248995995e-06, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.04814864322543144, "step": 4305, "valid_targets_mean": 2045.5, "valid_targets_min": 1095 }, { "epoch": 5.301353013530135, "grad_norm": 0.7031164675781172, "learning_rate": 6.767597499300363e-06, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.061618953943252563, "step": 4310, "valid_targets_mean": 2244.2, "valid_targets_min": 898 }, { "epoch": 5.30750307503075, "grad_norm": 0.5773205611506669, "learning_rate": 6.72165924937916e-06, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.06138886511325836, "step": 4315, "valid_targets_mean": 3077.6, "valid_targets_min": 1029 }, { "epoch": 5.313653136531365, "grad_norm": 0.5994567554792678, "learning_rate": 6.675845931451841e-06, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.05309034883975983, "step": 4320, "valid_targets_mean": 2592.4, "valid_targets_min": 592 }, { "epoch": 5.31980319803198, "grad_norm": 0.6920774165003466, "learning_rate": 6.630157976562408e-06, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.08477108180522919, "step": 4325, "valid_targets_mean": 3603.5, "valid_targets_min": 1029 }, { "epoch": 5.325953259532596, "grad_norm": 0.4847184821128782, "learning_rate": 6.584595814575352e-06, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.05919899791479111, "step": 4330, "valid_targets_mean": 4405.2, "valid_targets_min": 1264 }, { "epoch": 5.332103321033211, "grad_norm": 0.5523701905851736, "learning_rate": 6.539159874171639e-06, "loss": 0.1323, "loss_nan_ranks": 0, "loss_rank_avg": 0.08438067883253098, "step": 4335, "valid_targets_mean": 4468.0, "valid_targets_min": 825 }, { "epoch": 5.338253382533825, "grad_norm": 0.5526060489777394, "learning_rate": 6.493850582844628e-06, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.0591844879090786, "step": 4340, "valid_targets_mean": 4367.8, "valid_targets_min": 716 }, { "epoch": 5.34440344403444, "grad_norm": 0.4843090875685017, "learning_rate": 6.448668366896092e-06, "loss": 0.1407, "loss_nan_ranks": 0, "loss_rank_avg": 0.05962533876299858, "step": 4345, "valid_targets_mean": 4170.4, "valid_targets_min": 744 }, { "epoch": 5.350553505535055, "grad_norm": 0.47936663965824555, "learning_rate": 6.403613651432177e-06, "loss": 0.1323, "loss_nan_ranks": 0, "loss_rank_avg": 0.058356355875730515, "step": 4350, "valid_targets_mean": 3903.0, "valid_targets_min": 963 }, { "epoch": 5.35670356703567, "grad_norm": 0.622003720893813, "learning_rate": 6.358686860359422e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.0567665621638298, "step": 4355, "valid_targets_mean": 2604.9, "valid_targets_min": 1221 }, { "epoch": 5.3628536285362856, "grad_norm": 0.6083992416127505, "learning_rate": 6.31388841638076e-06, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.0629962831735611, "step": 4360, "valid_targets_mean": 3218.0, "valid_targets_min": 949 }, { "epoch": 5.369003690036901, "grad_norm": 0.5733667189845008, "learning_rate": 6.2692187409915425e-06, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.05322912707924843, "step": 4365, "valid_targets_mean": 2994.6, "valid_targets_min": 985 }, { "epoch": 5.375153751537516, "grad_norm": 0.574028849732009, "learning_rate": 6.224678254475573e-06, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.0691322386264801, "step": 4370, "valid_targets_mean": 3420.0, "valid_targets_min": 439 }, { "epoch": 5.38130381303813, "grad_norm": 0.468878348756875, "learning_rate": 6.18026737590117e-06, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.06864840537309647, "step": 4375, "valid_targets_mean": 5576.8, "valid_targets_min": 1082 }, { "epoch": 5.387453874538745, "grad_norm": 0.6297761784013611, "learning_rate": 6.1359865231171876e-06, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.07104820013046265, "step": 4380, "valid_targets_mean": 3394.8, "valid_targets_min": 744 }, { "epoch": 5.39360393603936, "grad_norm": 0.5762979148080327, "learning_rate": 6.091836112749134e-06, "loss": 0.1346, "loss_nan_ranks": 0, "loss_rank_avg": 0.06590209156274796, "step": 4385, "valid_targets_mean": 3324.1, "valid_targets_min": 742 }, { "epoch": 5.3997539975399755, "grad_norm": 0.5124388311977301, "learning_rate": 6.047816560195188e-06, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.09571660310029984, "step": 4390, "valid_targets_mean": 6296.0, "valid_targets_min": 1787 }, { "epoch": 5.405904059040591, "grad_norm": 0.5825350183593732, "learning_rate": 6.003928279622342e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.08598175644874573, "step": 4395, "valid_targets_mean": 4390.6, "valid_targets_min": 1616 }, { "epoch": 5.412054120541206, "grad_norm": 0.4763543026437352, "learning_rate": 5.960171683962504e-06, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.06651069968938828, "step": 4400, "valid_targets_mean": 5291.0, "valid_targets_min": 605 }, { "epoch": 5.41820418204182, "grad_norm": 0.44617040766394106, "learning_rate": 5.91654718490857e-06, "loss": 0.1338, "loss_nan_ranks": 0, "loss_rank_avg": 0.05469570681452751, "step": 4405, "valid_targets_mean": 4090.4, "valid_targets_min": 1062 }, { "epoch": 5.424354243542435, "grad_norm": 0.5840963047069434, "learning_rate": 5.873055192910606e-06, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.07961584627628326, "step": 4410, "valid_targets_mean": 3863.9, "valid_targets_min": 727 }, { "epoch": 5.43050430504305, "grad_norm": 0.4937156422148364, "learning_rate": 5.829696117171935e-06, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.05776210129261017, "step": 4415, "valid_targets_mean": 4145.0, "valid_targets_min": 1323 }, { "epoch": 5.4366543665436655, "grad_norm": 0.5040308641158776, "learning_rate": 5.786470365645323e-06, "loss": 0.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.06853733956813812, "step": 4420, "valid_targets_mean": 4661.2, "valid_targets_min": 721 }, { "epoch": 5.442804428044281, "grad_norm": 0.6975362471017391, "learning_rate": 5.743378345029121e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.07282223552465439, "step": 4425, "valid_targets_mean": 2467.2, "valid_targets_min": 818 }, { "epoch": 5.448954489544896, "grad_norm": 0.5033536112795816, "learning_rate": 5.700420460763441e-06, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.05807007849216461, "step": 4430, "valid_targets_mean": 4276.6, "valid_targets_min": 1434 }, { "epoch": 5.45510455104551, "grad_norm": 0.5345278681133446, "learning_rate": 5.6575971170263676e-06, "loss": 0.1327, "loss_nan_ranks": 0, "loss_rank_avg": 0.06748709082603455, "step": 4435, "valid_targets_mean": 3936.2, "valid_targets_min": 1017 }, { "epoch": 5.461254612546125, "grad_norm": 0.5181312098885833, "learning_rate": 5.614908716730112e-06, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.06790114939212799, "step": 4440, "valid_targets_mean": 4764.8, "valid_targets_min": 753 }, { "epoch": 5.46740467404674, "grad_norm": 0.5265881025472253, "learning_rate": 5.572355661517242e-06, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.0549679771065712, "step": 4445, "valid_targets_mean": 4789.5, "valid_targets_min": 557 }, { "epoch": 5.4735547355473555, "grad_norm": 0.546448417139361, "learning_rate": 5.529938351756921e-06, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.07799028605222702, "step": 4450, "valid_targets_mean": 4369.8, "valid_targets_min": 1012 }, { "epoch": 5.479704797047971, "grad_norm": 0.6404295613832135, "learning_rate": 5.487657186541109e-06, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.05156659334897995, "step": 4455, "valid_targets_mean": 2518.1, "valid_targets_min": 1004 }, { "epoch": 5.485854858548586, "grad_norm": 0.6350534594087568, "learning_rate": 5.445512563680824e-06, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.08964598923921585, "step": 4460, "valid_targets_mean": 3464.0, "valid_targets_min": 809 }, { "epoch": 5.492004920049201, "grad_norm": 0.57284220136077, "learning_rate": 5.403504879702402e-06, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.0627598911523819, "step": 4465, "valid_targets_mean": 3355.9, "valid_targets_min": 1519 }, { "epoch": 5.498154981549815, "grad_norm": 0.5670977260623126, "learning_rate": 5.361634529843746e-06, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.07299600541591644, "step": 4470, "valid_targets_mean": 4018.2, "valid_targets_min": 1028 }, { "epoch": 5.50430504305043, "grad_norm": 0.47708220603647616, "learning_rate": 5.319901908050653e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.09748424589633942, "step": 4475, "valid_targets_mean": 5790.4, "valid_targets_min": 2550 }, { "epoch": 5.5104551045510455, "grad_norm": 0.5521838855870443, "learning_rate": 5.278307406973044e-06, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.05909402668476105, "step": 4480, "valid_targets_mean": 3219.6, "valid_targets_min": 1101 }, { "epoch": 5.516605166051661, "grad_norm": 0.5188394648038602, "learning_rate": 5.236851417961335e-06, "loss": 0.1348, "loss_nan_ranks": 0, "loss_rank_avg": 0.06519473344087601, "step": 4485, "valid_targets_mean": 4415.0, "valid_targets_min": 809 }, { "epoch": 5.522755227552276, "grad_norm": 0.6118574496274587, "learning_rate": 5.1955343310627e-06, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.08431139588356018, "step": 4490, "valid_targets_mean": 3424.8, "valid_targets_min": 1116 }, { "epoch": 5.528905289052891, "grad_norm": 0.5583995118932806, "learning_rate": 5.1543565350174156e-06, "loss": 0.1327, "loss_nan_ranks": 0, "loss_rank_avg": 0.058837100863456726, "step": 4495, "valid_targets_mean": 3215.4, "valid_targets_min": 1072 }, { "epoch": 5.535055350553505, "grad_norm": 0.6267388804666768, "learning_rate": 5.1133184172552415e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.07143986225128174, "step": 4500, "valid_targets_mean": 3486.0, "valid_targets_min": 1197 }, { "epoch": 5.54120541205412, "grad_norm": 0.6270834284286618, "learning_rate": 5.072420363891721e-06, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.09735643118619919, "step": 4505, "valid_targets_mean": 3999.5, "valid_targets_min": 1181 }, { "epoch": 5.5473554735547355, "grad_norm": 0.5358570615128295, "learning_rate": 5.031662759724594e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.04467421770095825, "step": 4510, "valid_targets_mean": 2465.5, "valid_targets_min": 620 }, { "epoch": 5.553505535055351, "grad_norm": 0.6280043730155115, "learning_rate": 4.991045988230137e-06, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.06517910212278366, "step": 4515, "valid_targets_mean": 2457.2, "valid_targets_min": 821 }, { "epoch": 5.559655596555966, "grad_norm": 0.5400057725876789, "learning_rate": 4.950570431559578e-06, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.0681416317820549, "step": 4520, "valid_targets_mean": 3514.8, "valid_targets_min": 783 }, { "epoch": 5.565805658056581, "grad_norm": 0.4846347741343395, "learning_rate": 4.910236470535501e-06, "loss": 0.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.06555978208780289, "step": 4525, "valid_targets_mean": 4478.2, "valid_targets_min": 689 }, { "epoch": 5.571955719557195, "grad_norm": 0.4842509174019338, "learning_rate": 4.870044484648246e-06, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.06658433377742767, "step": 4530, "valid_targets_mean": 4445.2, "valid_targets_min": 549 }, { "epoch": 5.57810578105781, "grad_norm": 0.49339619825987036, "learning_rate": 4.829994852052378e-06, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.07952606678009033, "step": 4535, "valid_targets_mean": 3233.0, "valid_targets_min": 1082 }, { "epoch": 5.584255842558425, "grad_norm": 0.5644561862473277, "learning_rate": 4.790087949563071e-06, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.049260400235652924, "step": 4540, "valid_targets_mean": 2309.9, "valid_targets_min": 841 }, { "epoch": 5.590405904059041, "grad_norm": 0.5936110749163102, "learning_rate": 4.750324152652608e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.058592405170202255, "step": 4545, "valid_targets_mean": 2652.8, "valid_targets_min": 634 }, { "epoch": 5.596555965559656, "grad_norm": 0.5907395277430468, "learning_rate": 4.710703835446837e-06, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.06237831711769104, "step": 4550, "valid_targets_mean": 3264.0, "valid_targets_min": 1100 }, { "epoch": 5.602706027060271, "grad_norm": 0.4940489453365208, "learning_rate": 4.671227370721643e-06, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.0626446008682251, "step": 4555, "valid_targets_mean": 4216.4, "valid_targets_min": 685 }, { "epoch": 5.608856088560886, "grad_norm": 0.790661869914746, "learning_rate": 4.6318951298994415e-06, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.06247299537062645, "step": 4560, "valid_targets_mean": 3516.4, "valid_targets_min": 1220 }, { "epoch": 5.6150061500615, "grad_norm": 0.533525633898037, "learning_rate": 4.592707483045695e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.05781655013561249, "step": 4565, "valid_targets_mean": 3576.8, "valid_targets_min": 784 }, { "epoch": 5.621156211562115, "grad_norm": 0.6447467253790201, "learning_rate": 4.553664798865414e-06, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.08398255705833435, "step": 4570, "valid_targets_mean": 3295.8, "valid_targets_min": 801 }, { "epoch": 5.627306273062731, "grad_norm": 0.6726510656316983, "learning_rate": 4.514767444699715e-06, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.05583667755126953, "step": 4575, "valid_targets_mean": 2771.9, "valid_targets_min": 930 }, { "epoch": 5.633456334563346, "grad_norm": 0.5999660895339212, "learning_rate": 4.476015786522325e-06, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.05261404067277908, "step": 4580, "valid_targets_mean": 2810.2, "valid_targets_min": 669 }, { "epoch": 5.639606396063961, "grad_norm": 0.5405223268016334, "learning_rate": 4.4374101889361884e-06, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.08601601421833038, "step": 4585, "valid_targets_mean": 5179.4, "valid_targets_min": 1207 }, { "epoch": 5.645756457564576, "grad_norm": 0.49448784969381876, "learning_rate": 4.398951015169983e-06, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.06781433522701263, "step": 4590, "valid_targets_mean": 4570.5, "valid_targets_min": 551 }, { "epoch": 5.651906519065191, "grad_norm": 0.6608146757310736, "learning_rate": 4.360638627074738e-06, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.05293276906013489, "step": 4595, "valid_targets_mean": 1845.6, "valid_targets_min": 803 }, { "epoch": 5.658056580565805, "grad_norm": 0.4406119277585125, "learning_rate": 4.32247338512042e-06, "loss": 0.1253, "loss_nan_ranks": 0, "loss_rank_avg": 0.07278837263584137, "step": 4600, "valid_targets_mean": 5933.4, "valid_targets_min": 1701 }, { "epoch": 5.6642066420664205, "grad_norm": 0.5632101252627604, "learning_rate": 4.284455648392536e-06, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.07039278745651245, "step": 4605, "valid_targets_mean": 3400.9, "valid_targets_min": 679 }, { "epoch": 5.670356703567036, "grad_norm": 0.6577996185215177, "learning_rate": 4.246585774588772e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.062012627720832825, "step": 4610, "valid_targets_mean": 2761.6, "valid_targets_min": 826 }, { "epoch": 5.676506765067651, "grad_norm": 0.502880708364359, "learning_rate": 4.208864120015603e-06, "loss": 0.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.05661604925990105, "step": 4615, "valid_targets_mean": 3922.2, "valid_targets_min": 734 }, { "epoch": 5.682656826568266, "grad_norm": 0.6287154845246335, "learning_rate": 4.17129103958495e-06, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.09337248653173447, "step": 4620, "valid_targets_mean": 4328.6, "valid_targets_min": 969 }, { "epoch": 5.68880688806888, "grad_norm": 0.6110181061383558, "learning_rate": 4.1338668868108645e-06, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.07381390035152435, "step": 4625, "valid_targets_mean": 3711.2, "valid_targets_min": 1120 }, { "epoch": 5.694956949569495, "grad_norm": 0.6601727872764537, "learning_rate": 4.096592013806162e-06, "loss": 0.1333, "loss_nan_ranks": 0, "loss_rank_avg": 0.081791952252388, "step": 4630, "valid_targets_mean": 3901.4, "valid_targets_min": 700 }, { "epoch": 5.7011070110701105, "grad_norm": 0.686233004174092, "learning_rate": 4.059466771279133e-06, "loss": 0.1239, "loss_nan_ranks": 0, "loss_rank_avg": 0.07497609406709671, "step": 4635, "valid_targets_mean": 3973.1, "valid_targets_min": 1371 }, { "epoch": 5.707257072570726, "grad_norm": 0.55563257482993, "learning_rate": 4.022491508530239e-06, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.0771527886390686, "step": 4640, "valid_targets_mean": 2829.2, "valid_targets_min": 1121 }, { "epoch": 5.713407134071341, "grad_norm": 0.48508003873003414, "learning_rate": 3.985666573448828e-06, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.07775989919900894, "step": 4645, "valid_targets_mean": 5275.2, "valid_targets_min": 1079 }, { "epoch": 5.719557195571956, "grad_norm": 0.5094246505079187, "learning_rate": 3.948992312509865e-06, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.06223844364285469, "step": 4650, "valid_targets_mean": 4162.6, "valid_targets_min": 721 }, { "epoch": 5.725707257072571, "grad_norm": 0.59486147494615, "learning_rate": 3.912469070770648e-06, "loss": 0.1284, "loss_nan_ranks": 0, "loss_rank_avg": 0.06888983398675919, "step": 4655, "valid_targets_mean": 3657.1, "valid_targets_min": 839 }, { "epoch": 5.731857318573185, "grad_norm": 0.6260831099269651, "learning_rate": 3.876097191867614e-06, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.09011298418045044, "step": 4660, "valid_targets_mean": 4611.9, "valid_targets_min": 1241 }, { "epoch": 5.7380073800738005, "grad_norm": 0.5069235198944142, "learning_rate": 3.839877018013027e-06, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.07013392448425293, "step": 4665, "valid_targets_mean": 4539.8, "valid_targets_min": 923 }, { "epoch": 5.744157441574416, "grad_norm": 0.5340512819994322, "learning_rate": 3.8038088899918314e-06, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.05745799094438553, "step": 4670, "valid_targets_mean": 3181.0, "valid_targets_min": 1343 }, { "epoch": 5.750307503075031, "grad_norm": 0.49648263165880957, "learning_rate": 3.767893147158419e-06, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.05860132724046707, "step": 4675, "valid_targets_mean": 4163.6, "valid_targets_min": 1068 }, { "epoch": 5.756457564575646, "grad_norm": 0.6294891949820611, "learning_rate": 3.732130127433422e-06, "loss": 0.1323, "loss_nan_ranks": 0, "loss_rank_avg": 0.057297538965940475, "step": 4680, "valid_targets_mean": 1830.6, "valid_targets_min": 818 }, { "epoch": 5.762607626076261, "grad_norm": 0.5564900867827102, "learning_rate": 3.6965201673005456e-06, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.06601780652999878, "step": 4685, "valid_targets_mean": 3625.5, "valid_targets_min": 744 }, { "epoch": 5.768757687576876, "grad_norm": 0.5910788018371039, "learning_rate": 3.6610636018034183e-06, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.06505535542964935, "step": 4690, "valid_targets_mean": 3133.2, "valid_targets_min": 822 }, { "epoch": 5.7749077490774905, "grad_norm": 0.5093963772024384, "learning_rate": 3.6257607645424052e-06, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.07086948305368423, "step": 4695, "valid_targets_mean": 4104.9, "valid_targets_min": 1144 }, { "epoch": 5.781057810578106, "grad_norm": 0.5469709395305934, "learning_rate": 3.590611987671497e-06, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.09126688539981842, "step": 4700, "valid_targets_mean": 5289.1, "valid_targets_min": 1127 }, { "epoch": 5.787207872078721, "grad_norm": 0.5724591670046765, "learning_rate": 3.555617601895176e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.05370062589645386, "step": 4705, "valid_targets_mean": 2782.0, "valid_targets_min": 629 }, { "epoch": 5.793357933579336, "grad_norm": 0.47231706756273467, "learning_rate": 3.520777936465296e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.04965495318174362, "step": 4710, "valid_targets_mean": 4040.6, "valid_targets_min": 822 }, { "epoch": 5.799507995079951, "grad_norm": 0.6052932463463506, "learning_rate": 3.4860933191780078e-06, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.0728473886847496, "step": 4715, "valid_targets_mean": 3552.5, "valid_targets_min": 501 }, { "epoch": 5.805658056580565, "grad_norm": 0.6178695601121506, "learning_rate": 3.4515640763706394e-06, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.06548146903514862, "step": 4720, "valid_targets_mean": 3125.8, "valid_targets_min": 800 }, { "epoch": 5.8118081180811805, "grad_norm": 0.4909567394923962, "learning_rate": 3.417190532918673e-06, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.0758591815829277, "step": 4725, "valid_targets_mean": 5454.2, "valid_targets_min": 796 }, { "epoch": 5.817958179581796, "grad_norm": 0.5702206919092988, "learning_rate": 3.3829730122326355e-06, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.05891511216759682, "step": 4730, "valid_targets_mean": 3412.4, "valid_targets_min": 818 }, { "epoch": 5.824108241082411, "grad_norm": 0.5290119769717845, "learning_rate": 3.3489118362550954e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.07258553802967072, "step": 4735, "valid_targets_mean": 4466.4, "valid_targets_min": 1280 }, { "epoch": 5.830258302583026, "grad_norm": 0.551055090241482, "learning_rate": 3.3150073254576153e-06, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.06383375823497772, "step": 4740, "valid_targets_mean": 3301.2, "valid_targets_min": 449 }, { "epoch": 5.836408364083641, "grad_norm": 0.504056724244596, "learning_rate": 3.2812597988377413e-06, "loss": 0.1245, "loss_nan_ranks": 0, "loss_rank_avg": 0.05320952832698822, "step": 4745, "valid_targets_mean": 4407.1, "valid_targets_min": 909 }, { "epoch": 5.842558425584256, "grad_norm": 0.49749832350411566, "learning_rate": 3.247669573916008e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.05242083966732025, "step": 4750, "valid_targets_mean": 3587.6, "valid_targets_min": 901 }, { "epoch": 5.8487084870848705, "grad_norm": 0.6416005840428731, "learning_rate": 3.2142369667329377e-06, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.06621767580509186, "step": 4755, "valid_targets_mean": 2420.4, "valid_targets_min": 728 }, { "epoch": 5.854858548585486, "grad_norm": 0.5968103115042238, "learning_rate": 3.1809622918460726e-06, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.0694182813167572, "step": 4760, "valid_targets_mean": 3374.0, "valid_targets_min": 859 }, { "epoch": 5.861008610086101, "grad_norm": 0.6448717684056493, "learning_rate": 3.1478458623270304e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.04484240710735321, "step": 4765, "valid_targets_mean": 1618.8, "valid_targets_min": 984 }, { "epoch": 5.867158671586716, "grad_norm": 0.5519382283696171, "learning_rate": 3.114887989758517e-06, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.07720959931612015, "step": 4770, "valid_targets_mean": 3744.9, "valid_targets_min": 661 }, { "epoch": 5.873308733087331, "grad_norm": 0.4744423674183958, "learning_rate": 3.082088984231455e-06, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.06701827794313431, "step": 4775, "valid_targets_mean": 4775.1, "valid_targets_min": 1345 }, { "epoch": 5.879458794587946, "grad_norm": 0.5294607139263744, "learning_rate": 3.0494491543420147e-06, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.07675887644290924, "step": 4780, "valid_targets_mean": 4780.4, "valid_targets_min": 938 }, { "epoch": 5.885608856088561, "grad_norm": 0.6087599536180349, "learning_rate": 3.016968807188725e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.09123402833938599, "step": 4785, "valid_targets_mean": 5260.0, "valid_targets_min": 1211 }, { "epoch": 5.891758917589176, "grad_norm": 0.5354881993903267, "learning_rate": 2.9846482483696124e-06, "loss": 0.1327, "loss_nan_ranks": 0, "loss_rank_avg": 0.08291329443454742, "step": 4790, "valid_targets_mean": 5136.9, "valid_targets_min": 771 }, { "epoch": 5.897908979089791, "grad_norm": 0.6239045302015143, "learning_rate": 2.9524877819792787e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.09621922671794891, "step": 4795, "valid_targets_mean": 3785.5, "valid_targets_min": 1572 }, { "epoch": 5.904059040590406, "grad_norm": 0.6157717196902334, "learning_rate": 2.920487710606075e-06, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.04875405877828598, "step": 4800, "valid_targets_mean": 2200.9, "valid_targets_min": 753 }, { "epoch": 5.910209102091021, "grad_norm": 0.7551974435501979, "learning_rate": 2.888648335329236e-06, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.06033777818083763, "step": 4805, "valid_targets_mean": 1572.6, "valid_targets_min": 746 }, { "epoch": 5.916359163591636, "grad_norm": 0.5154662886994588, "learning_rate": 2.8569699557160557e-06, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.061547838151454926, "step": 4810, "valid_targets_mean": 4221.2, "valid_targets_min": 869 }, { "epoch": 5.922509225092251, "grad_norm": 0.5457029607797095, "learning_rate": 2.8254528698190765e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.07080341130495071, "step": 4815, "valid_targets_mean": 4031.8, "valid_targets_min": 631 }, { "epoch": 5.928659286592866, "grad_norm": 0.5346075613200031, "learning_rate": 2.7940973741732636e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.07108861207962036, "step": 4820, "valid_targets_mean": 3890.4, "valid_targets_min": 1090 }, { "epoch": 5.934809348093481, "grad_norm": 0.6419688422559524, "learning_rate": 2.7629037637932388e-06, "loss": 0.1337, "loss_nan_ranks": 0, "loss_rank_avg": 0.08232875913381577, "step": 4825, "valid_targets_mean": 3988.0, "valid_targets_min": 998 }, { "epoch": 5.940959409594096, "grad_norm": 0.5889517880633873, "learning_rate": 2.7318723321704845e-06, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.07364372909069061, "step": 4830, "valid_targets_mean": 3616.8, "valid_targets_min": 836 }, { "epoch": 5.947109471094711, "grad_norm": 0.4964907504454752, "learning_rate": 2.7010033712705894e-06, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.05161096528172493, "step": 4835, "valid_targets_mean": 2952.1, "valid_targets_min": 858 }, { "epoch": 5.953259532595326, "grad_norm": 0.6116958954533448, "learning_rate": 2.670297171530509e-06, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.0692531168460846, "step": 4840, "valid_targets_mean": 3255.8, "valid_targets_min": 1167 }, { "epoch": 5.959409594095941, "grad_norm": 0.5857212616293475, "learning_rate": 2.6397540218558227e-06, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.08528057485818863, "step": 4845, "valid_targets_mean": 4222.1, "valid_targets_min": 1389 }, { "epoch": 5.9655596555965555, "grad_norm": 0.5446476829662712, "learning_rate": 2.6093742096180273e-06, "loss": 0.1373, "loss_nan_ranks": 0, "loss_rank_avg": 0.07207009196281433, "step": 4850, "valid_targets_mean": 3742.9, "valid_targets_min": 1058 }, { "epoch": 5.971709717097171, "grad_norm": 0.6322976648443214, "learning_rate": 2.57915802065182e-06, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.06266084313392639, "step": 4855, "valid_targets_mean": 2555.8, "valid_targets_min": 1038 }, { "epoch": 5.977859778597786, "grad_norm": 0.48292079395281423, "learning_rate": 2.5491057392524087e-06, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.059271179139614105, "step": 4860, "valid_targets_mean": 3956.6, "valid_targets_min": 1375 }, { "epoch": 5.984009840098401, "grad_norm": 0.6301550881858835, "learning_rate": 2.5192176481728583e-06, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.09505551308393478, "step": 4865, "valid_targets_mean": 4051.2, "valid_targets_min": 1019 }, { "epoch": 5.990159901599016, "grad_norm": 0.5844004497131141, "learning_rate": 2.489494028621404e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.07588277012109756, "step": 4870, "valid_targets_mean": 3836.9, "valid_targets_min": 842 }, { "epoch": 5.996309963099631, "grad_norm": 0.530198345390078, "learning_rate": 2.4599351602588194e-06, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.07319337874650955, "step": 4875, "valid_targets_mean": 4583.0, "valid_targets_min": 1225 }, { "epoch": 6.002460024600246, "grad_norm": 0.5424770084625548, "learning_rate": 2.430541321195787e-06, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.06289032101631165, "step": 4880, "valid_targets_mean": 3303.5, "valid_targets_min": 1071 }, { "epoch": 6.008610086100861, "grad_norm": 0.5815125365229142, "learning_rate": 2.401312787990264e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.06941921263933182, "step": 4885, "valid_targets_mean": 3812.0, "valid_targets_min": 760 }, { "epoch": 6.014760147601476, "grad_norm": 0.5100325851359603, "learning_rate": 2.372249835644915e-06, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.07263228297233582, "step": 4890, "valid_targets_mean": 5018.5, "valid_targets_min": 722 }, { "epoch": 6.020910209102091, "grad_norm": 0.5804998300235991, "learning_rate": 2.343352737604483e-06, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.04796181991696358, "step": 4895, "valid_targets_mean": 2296.5, "valid_targets_min": 807 }, { "epoch": 6.027060270602706, "grad_norm": 0.5043972229635773, "learning_rate": 2.314621765753251e-06, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.06931351125240326, "step": 4900, "valid_targets_mean": 4836.1, "valid_targets_min": 545 }, { "epoch": 6.033210332103321, "grad_norm": 0.5371257853237565, "learning_rate": 2.286057190412465e-06, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.04863344877958298, "step": 4905, "valid_targets_mean": 3137.8, "valid_targets_min": 1036 }, { "epoch": 6.039360393603936, "grad_norm": 0.48958086204603707, "learning_rate": 2.257659280337783e-06, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.04522975534200668, "step": 4910, "valid_targets_mean": 2998.8, "valid_targets_min": 782 }, { "epoch": 6.045510455104551, "grad_norm": 0.5225596005150376, "learning_rate": 2.2294283027167827e-06, "loss": 0.1278, "loss_nan_ranks": 0, "loss_rank_avg": 0.05581795796751976, "step": 4915, "valid_targets_mean": 3294.5, "valid_targets_min": 662 }, { "epoch": 6.051660516605166, "grad_norm": 0.5779145445466218, "learning_rate": 2.2013645231663983e-06, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.0466914102435112, "step": 4920, "valid_targets_mean": 2584.9, "valid_targets_min": 641 }, { "epoch": 6.057810578105781, "grad_norm": 0.5867639086185799, "learning_rate": 2.173468205730469e-06, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.043185681104660034, "step": 4925, "valid_targets_mean": 2012.4, "valid_targets_min": 798 }, { "epoch": 6.063960639606396, "grad_norm": 0.4720992581177058, "learning_rate": 2.14573961287722e-06, "loss": 0.1201, "loss_nan_ranks": 0, "loss_rank_avg": 0.054659806191921234, "step": 4930, "valid_targets_mean": 4029.0, "valid_targets_min": 802 }, { "epoch": 6.070110701107011, "grad_norm": 0.5422489326157197, "learning_rate": 2.1181790054968033e-06, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.05541398748755455, "step": 4935, "valid_targets_mean": 3444.0, "valid_targets_min": 1318 }, { "epoch": 6.076260762607626, "grad_norm": 0.5206542530264247, "learning_rate": 2.0907866428988544e-06, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.055713292211294174, "step": 4940, "valid_targets_mean": 4180.0, "valid_targets_min": 881 }, { "epoch": 6.082410824108241, "grad_norm": 0.48220785097840313, "learning_rate": 2.0635627828100315e-06, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.06293288618326187, "step": 4945, "valid_targets_mean": 5320.4, "valid_targets_min": 957 }, { "epoch": 6.088560885608856, "grad_norm": 0.5799166793259684, "learning_rate": 2.0365076813716155e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.08323095738887787, "step": 4950, "valid_targets_mean": 4605.6, "valid_targets_min": 902 }, { "epoch": 6.094710947109471, "grad_norm": 0.5465387730589073, "learning_rate": 2.009621593137079e-06, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.0627049133181572, "step": 4955, "valid_targets_mean": 4263.2, "valid_targets_min": 923 }, { "epoch": 6.100861008610086, "grad_norm": 0.5454878652321398, "learning_rate": 1.9829047710696957e-06, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.05662379041314125, "step": 4960, "valid_targets_mean": 3385.6, "valid_targets_min": 916 }, { "epoch": 6.107011070110701, "grad_norm": 0.5227236942685615, "learning_rate": 1.956357466540175e-06, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.059625908732414246, "step": 4965, "valid_targets_mean": 3437.2, "valid_targets_min": 1276 }, { "epoch": 6.113161131611316, "grad_norm": 0.6490963031088945, "learning_rate": 1.9299799293242795e-06, "loss": 0.1338, "loss_nan_ranks": 0, "loss_rank_avg": 0.0674668550491333, "step": 4970, "valid_targets_mean": 2841.2, "valid_targets_min": 1604 }, { "epoch": 6.1193111931119315, "grad_norm": 0.5405801133792902, "learning_rate": 1.9037724076004793e-06, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.07145149260759354, "step": 4975, "valid_targets_mean": 4087.9, "valid_targets_min": 1697 }, { "epoch": 6.125461254612546, "grad_norm": 0.5417643718645909, "learning_rate": 1.8777351479476191e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.06233806908130646, "step": 4980, "valid_targets_mean": 3042.6, "valid_targets_min": 1339 }, { "epoch": 6.131611316113161, "grad_norm": 0.6089532975913663, "learning_rate": 1.8518683953425975e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.05497092008590698, "step": 4985, "valid_targets_mean": 2455.1, "valid_targets_min": 790 }, { "epoch": 6.137761377613776, "grad_norm": 0.5622806251761018, "learning_rate": 1.82617239315807e-06, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.04518791288137436, "step": 4990, "valid_targets_mean": 2354.2, "valid_targets_min": 823 }, { "epoch": 6.143911439114391, "grad_norm": 0.6481181684913966, "learning_rate": 1.8006473831601479e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.06699104607105255, "step": 4995, "valid_targets_mean": 2764.2, "valid_targets_min": 779 }, { "epoch": 6.150061500615006, "grad_norm": 0.7089327493356412, "learning_rate": 1.7752936055061165e-06, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.06491109728813171, "step": 5000, "valid_targets_mean": 1922.2, "valid_targets_min": 505 }, { "epoch": 6.1562115621156215, "grad_norm": 0.5681141076205176, "learning_rate": 1.7501112987422053e-06, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.07124713063240051, "step": 5005, "valid_targets_mean": 3761.8, "valid_targets_min": 945 }, { "epoch": 6.162361623616236, "grad_norm": 0.5032455330376907, "learning_rate": 1.725100699801312e-06, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.0461309440433979, "step": 5010, "valid_targets_mean": 3047.2, "valid_targets_min": 932 }, { "epoch": 6.168511685116851, "grad_norm": 0.674626130208239, "learning_rate": 1.7002620440007888e-06, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.0470353439450264, "step": 5015, "valid_targets_mean": 1651.0, "valid_targets_min": 643 }, { "epoch": 6.174661746617466, "grad_norm": 0.47662425479605447, "learning_rate": 1.6755955650402267e-06, "loss": 0.1283, "loss_nan_ranks": 0, "loss_rank_avg": 0.06650280207395554, "step": 5020, "valid_targets_mean": 5104.5, "valid_targets_min": 869 }, { "epoch": 6.180811808118081, "grad_norm": 0.5045431997111055, "learning_rate": 1.651101494999252e-06, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.06818658113479614, "step": 5025, "valid_targets_mean": 5044.1, "valid_targets_min": 1283 }, { "epoch": 6.186961869618696, "grad_norm": 0.5255677322760391, "learning_rate": 1.626780064335356e-06, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.05097660794854164, "step": 5030, "valid_targets_mean": 3461.8, "valid_targets_min": 730 }, { "epoch": 6.1931119311193115, "grad_norm": 0.553937699562758, "learning_rate": 1.6026315018817017e-06, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.06818796694278717, "step": 5035, "valid_targets_mean": 4351.0, "valid_targets_min": 1414 }, { "epoch": 6.199261992619927, "grad_norm": 0.47568139072291377, "learning_rate": 1.5786560348450054e-06, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.057540006935596466, "step": 5040, "valid_targets_mean": 5034.5, "valid_targets_min": 1841 }, { "epoch": 6.205412054120541, "grad_norm": 0.5209846711292241, "learning_rate": 1.5548538888033605e-06, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.05540771409869194, "step": 5045, "valid_targets_mean": 4044.1, "valid_targets_min": 882 }, { "epoch": 6.211562115621156, "grad_norm": 0.5337563166849851, "learning_rate": 1.531225287704139e-06, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.07083357870578766, "step": 5050, "valid_targets_mean": 4359.1, "valid_targets_min": 718 }, { "epoch": 6.217712177121771, "grad_norm": 0.531098068033974, "learning_rate": 1.5077704538618942e-06, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.04739413037896156, "step": 5055, "valid_targets_mean": 3149.5, "valid_targets_min": 1041 }, { "epoch": 6.223862238622386, "grad_norm": 0.5540770755610535, "learning_rate": 1.4844896079562344e-06, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.057800762355327606, "step": 5060, "valid_targets_mean": 3788.5, "valid_targets_min": 844 }, { "epoch": 6.2300123001230014, "grad_norm": 0.5855322011840497, "learning_rate": 1.4613829690297832e-06, "loss": 0.1333, "loss_nan_ranks": 0, "loss_rank_avg": 0.06619509309530258, "step": 5065, "valid_targets_mean": 3172.5, "valid_targets_min": 841 }, { "epoch": 6.236162361623617, "grad_norm": 0.6015697268239801, "learning_rate": 1.4384507544860937e-06, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.06107232719659805, "step": 5070, "valid_targets_mean": 3098.6, "valid_targets_min": 762 }, { "epoch": 6.242312423124231, "grad_norm": 0.6208420441231545, "learning_rate": 1.4156931800876072e-06, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.05853826552629471, "step": 5075, "valid_targets_mean": 3241.2, "valid_targets_min": 662 }, { "epoch": 6.248462484624846, "grad_norm": 0.5157491131630199, "learning_rate": 1.3931104599536371e-06, "loss": 0.1216, "loss_nan_ranks": 0, "loss_rank_avg": 0.049253273755311966, "step": 5080, "valid_targets_mean": 3172.0, "valid_targets_min": 814 }, { "epoch": 6.254612546125461, "grad_norm": 0.6061095809955876, "learning_rate": 1.370702806558335e-06, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.06068650260567665, "step": 5085, "valid_targets_mean": 2952.6, "valid_targets_min": 684 }, { "epoch": 6.260762607626076, "grad_norm": 0.5870473650514756, "learning_rate": 1.3484704307287145e-06, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.07536955177783966, "step": 5090, "valid_targets_mean": 3981.9, "valid_targets_min": 1097 }, { "epoch": 6.266912669126691, "grad_norm": 0.5418840060025298, "learning_rate": 1.3264135416426416e-06, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.06840242445468903, "step": 5095, "valid_targets_mean": 4178.6, "valid_targets_min": 1192 }, { "epoch": 6.273062730627307, "grad_norm": 0.6720709021096094, "learning_rate": 1.3045323468268788e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.051598817110061646, "step": 5100, "valid_targets_mean": 1979.5, "valid_targets_min": 754 }, { "epoch": 6.279212792127922, "grad_norm": 0.6814971461663389, "learning_rate": 1.2828270521551467e-06, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.05146491155028343, "step": 5105, "valid_targets_mean": 1902.8, "valid_targets_min": 814 }, { "epoch": 6.285362853628536, "grad_norm": 0.5244610038039247, "learning_rate": 1.2612978618461625e-06, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.07176411151885986, "step": 5110, "valid_targets_mean": 4863.8, "valid_targets_min": 1254 }, { "epoch": 6.291512915129151, "grad_norm": 0.5456289000315424, "learning_rate": 1.2399449784617268e-06, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.058985818177461624, "step": 5115, "valid_targets_mean": 3855.1, "valid_targets_min": 1007 }, { "epoch": 6.297662976629766, "grad_norm": 0.6618389501828307, "learning_rate": 1.2187686029048295e-06, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.051307328045368195, "step": 5120, "valid_targets_mean": 2647.4, "valid_targets_min": 1279 }, { "epoch": 6.303813038130381, "grad_norm": 0.5886803833241598, "learning_rate": 1.197768934417738e-06, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.06644248217344284, "step": 5125, "valid_targets_mean": 3766.5, "valid_targets_min": 713 }, { "epoch": 6.3099630996309966, "grad_norm": 0.7661344916145737, "learning_rate": 1.1769461705801533e-06, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.08498349040746689, "step": 5130, "valid_targets_mean": 2529.4, "valid_targets_min": 998 }, { "epoch": 6.316113161131612, "grad_norm": 0.5420320846177908, "learning_rate": 1.1563005073073153e-06, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.07607104629278183, "step": 5135, "valid_targets_mean": 4911.0, "valid_targets_min": 1407 }, { "epoch": 6.322263222632226, "grad_norm": 0.5555350855438084, "learning_rate": 1.1358321388481873e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.06736680865287781, "step": 5140, "valid_targets_mean": 3581.1, "valid_targets_min": 1163 }, { "epoch": 6.328413284132841, "grad_norm": 0.5865304696625325, "learning_rate": 1.1155412577836145e-06, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.08822140097618103, "step": 5145, "valid_targets_mean": 4158.9, "valid_targets_min": 1356 }, { "epoch": 6.334563345633456, "grad_norm": 0.5718301827586693, "learning_rate": 1.0954280550245122e-06, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.06321176886558533, "step": 5150, "valid_targets_mean": 3289.2, "valid_targets_min": 724 }, { "epoch": 6.340713407134071, "grad_norm": 0.5856223256790988, "learning_rate": 1.0754927198100785e-06, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.05578772723674774, "step": 5155, "valid_targets_mean": 3221.1, "valid_targets_min": 1307 }, { "epoch": 6.3468634686346865, "grad_norm": 0.6281303982187476, "learning_rate": 1.0557354397060026e-06, "loss": 0.1303, "loss_nan_ranks": 0, "loss_rank_avg": 0.07257921248674393, "step": 5160, "valid_targets_mean": 3363.1, "valid_targets_min": 943 }, { "epoch": 6.353013530135302, "grad_norm": 0.6029484904933851, "learning_rate": 1.0361564006027126e-06, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.06681361794471741, "step": 5165, "valid_targets_mean": 3008.5, "valid_targets_min": 846 }, { "epoch": 6.359163591635916, "grad_norm": 0.5412048657285767, "learning_rate": 1.0167557867136145e-06, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.07798179984092712, "step": 5170, "valid_targets_mean": 4743.1, "valid_targets_min": 719 }, { "epoch": 6.365313653136531, "grad_norm": 0.5374689567993625, "learning_rate": 9.975337805733654e-07, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.05465513467788696, "step": 5175, "valid_targets_mean": 3842.9, "valid_targets_min": 1105 }, { "epoch": 6.371463714637146, "grad_norm": 0.6524717743607436, "learning_rate": 9.784905630361562e-07, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.07767906785011292, "step": 5180, "valid_targets_mean": 3469.4, "valid_targets_min": 1064 }, { "epoch": 6.377613776137761, "grad_norm": 0.6799806799339971, "learning_rate": 9.596263132740024e-07, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.0618944987654686, "step": 5185, "valid_targets_mean": 2437.5, "valid_targets_min": 1078 }, { "epoch": 6.3837638376383765, "grad_norm": 0.48825175548767674, "learning_rate": 9.409412087750769e-07, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.06350645422935486, "step": 5190, "valid_targets_mean": 5053.9, "valid_targets_min": 1333 }, { "epoch": 6.389913899138992, "grad_norm": 0.4828087282175385, "learning_rate": 9.22435425342012e-07, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.06886067986488342, "step": 5195, "valid_targets_mean": 5354.2, "valid_targets_min": 2076 }, { "epoch": 6.396063960639607, "grad_norm": 0.7221827828864817, "learning_rate": 9.041091370902722e-07, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.04774102196097374, "step": 5200, "valid_targets_mean": 1681.8, "valid_targets_min": 878 }, { "epoch": 6.402214022140221, "grad_norm": 0.5812176892970463, "learning_rate": 8.859625164465013e-07, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.06685419380664825, "step": 5205, "valid_targets_mean": 3608.5, "valid_targets_min": 1181 }, { "epoch": 6.408364083640836, "grad_norm": 0.5345398731915736, "learning_rate": 8.679957341469047e-07, "loss": 0.133, "loss_nan_ranks": 0, "loss_rank_avg": 0.07105870544910431, "step": 5210, "valid_targets_mean": 4142.4, "valid_targets_min": 1101 }, { "epoch": 6.414514145141451, "grad_norm": 0.5878686852754383, "learning_rate": 8.502089592356411e-07, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.05155439302325249, "step": 5215, "valid_targets_mean": 2866.0, "valid_targets_min": 928 }, { "epoch": 6.4206642066420665, "grad_norm": 0.6419035998015323, "learning_rate": 8.326023590632304e-07, "loss": 0.1254, "loss_nan_ranks": 0, "loss_rank_avg": 0.09296417236328125, "step": 5220, "valid_targets_mean": 4123.2, "valid_targets_min": 797 }, { "epoch": 6.426814268142682, "grad_norm": 0.6383297859514876, "learning_rate": 8.1517609928498e-07, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.06617703288793564, "step": 5225, "valid_targets_mean": 3466.5, "valid_targets_min": 720 }, { "epoch": 6.432964329643297, "grad_norm": 0.6064618192893211, "learning_rate": 7.979303438594388e-07, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.07864312082529068, "step": 5230, "valid_targets_mean": 3315.6, "valid_targets_min": 893 }, { "epoch": 6.439114391143911, "grad_norm": 0.5200930400466781, "learning_rate": 7.808652550468299e-07, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.0621294341981411, "step": 5235, "valid_targets_mean": 3840.2, "valid_targets_min": 882 }, { "epoch": 6.445264452644526, "grad_norm": 0.5832419806760687, "learning_rate": 7.63980993407547e-07, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.07488331198692322, "step": 5240, "valid_targets_mean": 3681.5, "valid_targets_min": 816 }, { "epoch": 6.451414514145141, "grad_norm": 0.5963619223693212, "learning_rate": 7.472777178006296e-07, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.0465703159570694, "step": 5245, "valid_targets_mean": 2769.9, "valid_targets_min": 766 }, { "epoch": 6.4575645756457565, "grad_norm": 0.52100211696451, "learning_rate": 7.307555853822745e-07, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.04648655652999878, "step": 5250, "valid_targets_mean": 3330.4, "valid_targets_min": 1024 }, { "epoch": 6.463714637146372, "grad_norm": 0.5336634545046933, "learning_rate": 7.144147516043554e-07, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.048668649047613144, "step": 5255, "valid_targets_mean": 2715.1, "valid_targets_min": 665 }, { "epoch": 6.469864698646987, "grad_norm": 0.6413786231811837, "learning_rate": 6.982553702129568e-07, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.08997328579425812, "step": 5260, "valid_targets_mean": 4145.6, "valid_targets_min": 682 }, { "epoch": 6.476014760147601, "grad_norm": 1.2100250213441113, "learning_rate": 6.822775932469383e-07, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.06279893219470978, "step": 5265, "valid_targets_mean": 4278.0, "valid_targets_min": 791 }, { "epoch": 6.482164821648216, "grad_norm": 0.6726549041937918, "learning_rate": 6.664815710364925e-07, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.083136186003685, "step": 5270, "valid_targets_mean": 4407.0, "valid_targets_min": 1172 }, { "epoch": 6.488314883148831, "grad_norm": 0.565911309079508, "learning_rate": 6.508674522017355e-07, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.08014942705631256, "step": 5275, "valid_targets_mean": 4196.5, "valid_targets_min": 1309 }, { "epoch": 6.4944649446494465, "grad_norm": 0.5733837286075206, "learning_rate": 6.354353836513105e-07, "loss": 0.1268, "loss_nan_ranks": 0, "loss_rank_avg": 0.07294522225856781, "step": 5280, "valid_targets_mean": 3610.2, "valid_targets_min": 935 }, { "epoch": 6.500615006150062, "grad_norm": 0.5329046100371863, "learning_rate": 6.201855105809973e-07, "loss": 0.1379, "loss_nan_ranks": 0, "loss_rank_avg": 0.04123207926750183, "step": 5285, "valid_targets_mean": 2400.8, "valid_targets_min": 881 }, { "epoch": 6.506765067650677, "grad_norm": 0.596372557576995, "learning_rate": 6.051179764723625e-07, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.0468425527215004, "step": 5290, "valid_targets_mean": 2518.8, "valid_targets_min": 889 }, { "epoch": 6.512915129151292, "grad_norm": 0.5121653895720126, "learning_rate": 5.902329230913872e-07, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.0639481246471405, "step": 5295, "valid_targets_mean": 4319.6, "valid_targets_min": 906 }, { "epoch": 6.519065190651906, "grad_norm": 0.542778921187282, "learning_rate": 5.755304904871506e-07, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.06037888675928116, "step": 5300, "valid_targets_mean": 4170.6, "valid_targets_min": 912 }, { "epoch": 6.525215252152521, "grad_norm": 0.5804417258187665, "learning_rate": 5.610108169905104e-07, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.0487140417098999, "step": 5305, "valid_targets_mean": 2688.4, "valid_targets_min": 896 }, { "epoch": 6.531365313653136, "grad_norm": 0.5376900650647904, "learning_rate": 5.466740392127934e-07, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.06433159112930298, "step": 5310, "valid_targets_mean": 4386.4, "valid_targets_min": 750 }, { "epoch": 6.537515375153752, "grad_norm": 0.6848076403496212, "learning_rate": 5.32520292044516e-07, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.04983920603990555, "step": 5315, "valid_targets_mean": 3416.9, "valid_targets_min": 672 }, { "epoch": 6.543665436654367, "grad_norm": 0.4829597523952342, "learning_rate": 5.185497086541125e-07, "loss": 0.1238, "loss_nan_ranks": 0, "loss_rank_avg": 0.05569973587989807, "step": 5320, "valid_targets_mean": 3630.2, "valid_targets_min": 1652 }, { "epoch": 6.549815498154982, "grad_norm": 0.5075676761107347, "learning_rate": 5.047624204866797e-07, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.07317518442869186, "step": 5325, "valid_targets_mean": 6119.2, "valid_targets_min": 1353 }, { "epoch": 6.555965559655597, "grad_norm": 0.5190420641766421, "learning_rate": 4.911585572627541e-07, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.07553472369909286, "step": 5330, "valid_targets_mean": 5454.0, "valid_targets_min": 715 }, { "epoch": 6.562115621156211, "grad_norm": 0.5143181130618779, "learning_rate": 4.777382469770731e-07, "loss": 0.1248, "loss_nan_ranks": 0, "loss_rank_avg": 0.06313024461269379, "step": 5335, "valid_targets_mean": 4874.2, "valid_targets_min": 631 }, { "epoch": 6.568265682656826, "grad_norm": 0.5343703571493038, "learning_rate": 4.64501615897377e-07, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.04912997782230377, "step": 5340, "valid_targets_mean": 2674.8, "valid_targets_min": 1021 }, { "epoch": 6.574415744157442, "grad_norm": 0.6572140767257532, "learning_rate": 4.514487885632268e-07, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.07277044653892517, "step": 5345, "valid_targets_mean": 2919.0, "valid_targets_min": 589 }, { "epoch": 6.580565805658057, "grad_norm": 0.5442828554066622, "learning_rate": 4.385798877848291e-07, "loss": 0.1197, "loss_nan_ranks": 0, "loss_rank_avg": 0.050412461161613464, "step": 5350, "valid_targets_mean": 3338.4, "valid_targets_min": 1261 }, { "epoch": 6.586715867158672, "grad_norm": 0.5302749656503288, "learning_rate": 4.258950346418789e-07, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.06352603435516357, "step": 5355, "valid_targets_mean": 3963.1, "valid_targets_min": 786 }, { "epoch": 6.592865928659286, "grad_norm": 0.6868016969517825, "learning_rate": 4.1339434848241435e-07, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.061369460076093674, "step": 5360, "valid_targets_mean": 2106.0, "valid_targets_min": 1033 }, { "epoch": 6.599015990159901, "grad_norm": 0.5867537186958434, "learning_rate": 4.0107794692171076e-07, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.04071478545665741, "step": 5365, "valid_targets_mean": 2107.9, "valid_targets_min": 917 }, { "epoch": 6.605166051660516, "grad_norm": 0.6335536711997667, "learning_rate": 3.889459458411593e-07, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.062453605234622955, "step": 5370, "valid_targets_mean": 2727.2, "valid_targets_min": 740 }, { "epoch": 6.6113161131611315, "grad_norm": 0.5165876825091585, "learning_rate": 3.7699845938717894e-07, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.06971459090709686, "step": 5375, "valid_targets_mean": 4974.9, "valid_targets_min": 936 }, { "epoch": 6.617466174661747, "grad_norm": 0.6111422469058083, "learning_rate": 3.652355999701529e-07, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.08351373672485352, "step": 5380, "valid_targets_mean": 3744.5, "valid_targets_min": 1267 }, { "epoch": 6.623616236162362, "grad_norm": 0.6026266407522326, "learning_rate": 3.5365747826335616e-07, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.05595562979578972, "step": 5385, "valid_targets_mean": 2574.4, "valid_targets_min": 992 }, { "epoch": 6.629766297662977, "grad_norm": 0.7258469981503565, "learning_rate": 3.422642032019208e-07, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.0903460830450058, "step": 5390, "valid_targets_mean": 3207.4, "valid_targets_min": 867 }, { "epoch": 6.635916359163591, "grad_norm": 0.7245258537744896, "learning_rate": 3.3105588198181435e-07, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.06543657928705215, "step": 5395, "valid_targets_mean": 3652.9, "valid_targets_min": 752 }, { "epoch": 6.642066420664206, "grad_norm": 0.4649500989129253, "learning_rate": 3.200326200588255e-07, "loss": 0.1205, "loss_nan_ranks": 0, "loss_rank_avg": 0.06393611431121826, "step": 5400, "valid_targets_mean": 7006.8, "valid_targets_min": 4825 }, { "epoch": 6.6482164821648215, "grad_norm": 0.6681705676412517, "learning_rate": 3.0919452114758e-07, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.06847294420003891, "step": 5405, "valid_targets_mean": 2410.8, "valid_targets_min": 891 }, { "epoch": 6.654366543665437, "grad_norm": 0.5761711012939229, "learning_rate": 2.985416872205549e-07, "loss": 0.1248, "loss_nan_ranks": 0, "loss_rank_avg": 0.07202339172363281, "step": 5410, "valid_targets_mean": 3844.8, "valid_targets_min": 916 }, { "epoch": 6.660516605166052, "grad_norm": 0.5695579443647555, "learning_rate": 2.880742185071195e-07, "loss": 0.13, "loss_nan_ranks": 0, "loss_rank_avg": 0.07999488711357117, "step": 5415, "valid_targets_mean": 4289.5, "valid_targets_min": 745 }, { "epoch": 6.666666666666667, "grad_norm": 0.590865804864645, "learning_rate": 2.77792213492607e-07, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.07472768425941467, "step": 5420, "valid_targets_mean": 3445.0, "valid_targets_min": 1208 }, { "epoch": 6.672816728167282, "grad_norm": 0.5830789211352447, "learning_rate": 2.6769576891737093e-07, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.07768949866294861, "step": 5425, "valid_targets_mean": 4333.6, "valid_targets_min": 1169 }, { "epoch": 6.678966789667896, "grad_norm": 0.5530267582678328, "learning_rate": 2.5778497977587914e-07, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.05172623693943024, "step": 5430, "valid_targets_mean": 3705.8, "valid_targets_min": 1011 }, { "epoch": 6.6851168511685115, "grad_norm": 0.5348405157600488, "learning_rate": 2.480599393158256e-07, "loss": 0.1337, "loss_nan_ranks": 0, "loss_rank_avg": 0.06197597086429596, "step": 5435, "valid_targets_mean": 4570.2, "valid_targets_min": 1047 }, { "epoch": 6.691266912669127, "grad_norm": 0.7936490731490548, "learning_rate": 2.3852073903725127e-07, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.06336570531129837, "step": 5440, "valid_targets_mean": 1634.6, "valid_targets_min": 853 }, { "epoch": 6.697416974169742, "grad_norm": 0.5113218712957384, "learning_rate": 2.2916746869167782e-07, "loss": 0.133, "loss_nan_ranks": 0, "loss_rank_avg": 0.05810292810201645, "step": 5445, "valid_targets_mean": 3879.2, "valid_targets_min": 820 }, { "epoch": 6.703567035670357, "grad_norm": 0.5944280644108385, "learning_rate": 2.2000021628126867e-07, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.06202930212020874, "step": 5450, "valid_targets_mean": 3255.5, "valid_targets_min": 1384 }, { "epoch": 6.709717097170972, "grad_norm": 0.5764944538982887, "learning_rate": 2.1101906805800265e-07, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.09774152934551239, "step": 5455, "valid_targets_mean": 4486.8, "valid_targets_min": 1426 }, { "epoch": 6.715867158671586, "grad_norm": 0.5749340442728162, "learning_rate": 2.0222410852285046e-07, "loss": 0.1253, "loss_nan_ranks": 0, "loss_rank_avg": 0.06891864538192749, "step": 5460, "valid_targets_mean": 3419.9, "valid_targets_min": 869 }, { "epoch": 6.7220172201722015, "grad_norm": 0.6720160493302868, "learning_rate": 1.9361542042499737e-07, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.05232574790716171, "step": 5465, "valid_targets_mean": 2165.0, "valid_targets_min": 768 }, { "epoch": 6.728167281672817, "grad_norm": 0.7673520029285447, "learning_rate": 1.851930847610528e-07, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.07530073821544647, "step": 5470, "valid_targets_mean": 2495.6, "valid_targets_min": 697 }, { "epoch": 6.734317343173432, "grad_norm": 0.5031763579980356, "learning_rate": 1.7695718077428648e-07, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.07046972215175629, "step": 5475, "valid_targets_mean": 4617.9, "valid_targets_min": 1008 }, { "epoch": 6.740467404674047, "grad_norm": 0.4620356869621955, "learning_rate": 1.6890778595389347e-07, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.04569670557975769, "step": 5480, "valid_targets_mean": 4168.4, "valid_targets_min": 874 }, { "epoch": 6.746617466174662, "grad_norm": 0.4824749420700062, "learning_rate": 1.6104497603425916e-07, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.059134647250175476, "step": 5485, "valid_targets_mean": 5008.5, "valid_targets_min": 744 }, { "epoch": 6.752767527675276, "grad_norm": 0.592863648819326, "learning_rate": 1.5336882499424e-07, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.05972706153988838, "step": 5490, "valid_targets_mean": 2984.4, "valid_targets_min": 683 }, { "epoch": 6.7589175891758915, "grad_norm": 0.632709052179341, "learning_rate": 1.4587940505648158e-07, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.054421160370111465, "step": 5495, "valid_targets_mean": 2370.8, "valid_targets_min": 659 }, { "epoch": 6.765067650676507, "grad_norm": 0.6183396377399092, "learning_rate": 1.385767866867238e-07, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.05898458883166313, "step": 5500, "valid_targets_mean": 2615.6, "valid_targets_min": 681 }, { "epoch": 6.771217712177122, "grad_norm": 0.5737063674951367, "learning_rate": 1.3146103859315694e-07, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.06541895866394043, "step": 5505, "valid_targets_mean": 3901.8, "valid_targets_min": 1068 }, { "epoch": 6.777367773677737, "grad_norm": 0.6368471024753006, "learning_rate": 1.2453222772575103e-07, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.06549682468175888, "step": 5510, "valid_targets_mean": 2812.5, "valid_targets_min": 1190 }, { "epoch": 6.783517835178352, "grad_norm": 0.6358721107315133, "learning_rate": 1.1779041927564739e-07, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.07891295850276947, "step": 5515, "valid_targets_mean": 3044.1, "valid_targets_min": 906 }, { "epoch": 6.789667896678967, "grad_norm": 0.5137882501347547, "learning_rate": 1.1123567667453705e-07, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.05998239666223526, "step": 5520, "valid_targets_mean": 4075.0, "valid_targets_min": 954 }, { "epoch": 6.7958179581795815, "grad_norm": 0.62170856938697, "learning_rate": 1.0486806159405672e-07, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.08012904226779938, "step": 5525, "valid_targets_mean": 3613.6, "valid_targets_min": 748 }, { "epoch": 6.801968019680197, "grad_norm": 0.5735668081419381, "learning_rate": 9.86876339452203e-08, "loss": 0.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.06451477110385895, "step": 5530, "valid_targets_mean": 4471.0, "valid_targets_min": 549 }, { "epoch": 6.808118081180812, "grad_norm": 0.5111385230332108, "learning_rate": 9.269445187785275e-08, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.07112513482570648, "step": 5535, "valid_targets_mean": 4464.1, "valid_targets_min": 615 }, { "epoch": 6.814268142681427, "grad_norm": 0.6264382075580561, "learning_rate": 8.688857178003495e-08, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.0690319836139679, "step": 5540, "valid_targets_mean": 3371.1, "valid_targets_min": 1170 }, { "epoch": 6.820418204182042, "grad_norm": 0.5140239111149651, "learning_rate": 8.127004827757967e-08, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.06056186184287071, "step": 5545, "valid_targets_mean": 4212.4, "valid_targets_min": 859 }, { "epoch": 6.826568265682657, "grad_norm": 0.6772382442570577, "learning_rate": 7.583893423352306e-08, "loss": 0.1337, "loss_nan_ranks": 0, "loss_rank_avg": 0.05224543809890747, "step": 5550, "valid_targets_mean": 1865.4, "valid_targets_min": 772 }, { "epoch": 6.832718327183272, "grad_norm": 0.5895539346948653, "learning_rate": 7.05952807476118e-08, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.04882111772894859, "step": 5555, "valid_targets_mean": 2514.6, "valid_targets_min": 789 }, { "epoch": 6.838868388683887, "grad_norm": 0.48807813825983537, "learning_rate": 6.553913715583671e-08, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.048527151346206665, "step": 5560, "valid_targets_mean": 3977.1, "valid_targets_min": 1117 }, { "epoch": 6.845018450184502, "grad_norm": 0.6078080609130851, "learning_rate": 6.067055102996433e-08, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.06978254020214081, "step": 5565, "valid_targets_mean": 4450.6, "valid_targets_min": 1072 }, { "epoch": 6.851168511685117, "grad_norm": 0.5235762394225727, "learning_rate": 5.59895681770839e-08, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.06056521087884903, "step": 5570, "valid_targets_mean": 4479.1, "valid_targets_min": 208 }, { "epoch": 6.857318573185732, "grad_norm": 0.48851126333272826, "learning_rate": 5.149623263918546e-08, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.07842652499675751, "step": 5575, "valid_targets_mean": 6019.1, "valid_targets_min": 1392 }, { "epoch": 6.863468634686347, "grad_norm": 0.4810864262135866, "learning_rate": 4.719058669273802e-08, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.079092837870121, "step": 5580, "valid_targets_mean": 6218.6, "valid_targets_min": 1701 }, { "epoch": 6.869618696186961, "grad_norm": 0.6973133651374057, "learning_rate": 4.3072670848292034e-08, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.07518057525157928, "step": 5585, "valid_targets_mean": 3752.8, "valid_targets_min": 1118 }, { "epoch": 6.875768757687577, "grad_norm": 0.6585540745246752, "learning_rate": 3.9142523850108635e-08, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.08246316015720367, "step": 5590, "valid_targets_mean": 3989.9, "valid_targets_min": 1062 }, { "epoch": 6.881918819188192, "grad_norm": 0.5374730661090874, "learning_rate": 3.540018267577772e-08, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.046635936945676804, "step": 5595, "valid_targets_mean": 3061.2, "valid_targets_min": 741 }, { "epoch": 6.888068880688807, "grad_norm": 0.510472460842064, "learning_rate": 3.184568253588927e-08, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.07652543485164642, "step": 5600, "valid_targets_mean": 4784.9, "valid_targets_min": 1068 }, { "epoch": 6.894218942189422, "grad_norm": 0.4840025298882532, "learning_rate": 2.8479056873682577e-08, "loss": 0.1145, "loss_nan_ranks": 0, "loss_rank_avg": 0.04297013208270073, "step": 5605, "valid_targets_mean": 3136.8, "valid_targets_min": 965 }, { "epoch": 6.900369003690037, "grad_norm": 0.5842670543442152, "learning_rate": 2.5300337364746462e-08, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.06335698068141937, "step": 5610, "valid_targets_mean": 3246.9, "valid_targets_min": 647 }, { "epoch": 6.906519065190652, "grad_norm": 0.48110269279952494, "learning_rate": 2.2309553916719518e-08, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.057074613869190216, "step": 5615, "valid_targets_mean": 4114.1, "valid_targets_min": 1243 }, { "epoch": 6.9126691266912665, "grad_norm": 0.5175296164711993, "learning_rate": 1.9506734668999217e-08, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.07905285060405731, "step": 5620, "valid_targets_mean": 5416.8, "valid_targets_min": 1756 }, { "epoch": 6.918819188191882, "grad_norm": 0.5664682648051188, "learning_rate": 1.689190599248436e-08, "loss": 0.1229, "loss_nan_ranks": 0, "loss_rank_avg": 0.06515791267156601, "step": 5625, "valid_targets_mean": 4656.8, "valid_targets_min": 838 }, { "epoch": 6.924969249692497, "grad_norm": 0.5480011214181123, "learning_rate": 1.4465092489330812e-08, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.06544838845729828, "step": 5630, "valid_targets_mean": 3923.1, "valid_targets_min": 1042 }, { "epoch": 6.931119311193112, "grad_norm": 1.0905972704554736, "learning_rate": 1.2226316992707266e-08, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.04656635597348213, "step": 5635, "valid_targets_mean": 3093.6, "valid_targets_min": 781 }, { "epoch": 6.937269372693727, "grad_norm": 0.518413117093057, "learning_rate": 1.0175600566593169e-08, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.07991036772727966, "step": 5640, "valid_targets_mean": 5375.9, "valid_targets_min": 3338 }, { "epoch": 6.943419434194342, "grad_norm": 0.5833702797180802, "learning_rate": 8.312962505578893e-09, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.06386210024356842, "step": 5645, "valid_targets_mean": 3400.4, "valid_targets_min": 895 }, { "epoch": 6.949569495694957, "grad_norm": 0.5850004322161442, "learning_rate": 6.638420334672546e-09, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.07902055978775024, "step": 5650, "valid_targets_mean": 3789.1, "valid_targets_min": 1433 }, { "epoch": 6.955719557195572, "grad_norm": 0.5915490092064204, "learning_rate": 5.1519898091489936e-09, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.06437867879867554, "step": 5655, "valid_targets_mean": 2941.4, "valid_targets_min": 935 }, { "epoch": 6.961869618696187, "grad_norm": 0.5980551924311458, "learning_rate": 3.853684914394418e-09, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.06067301332950592, "step": 5660, "valid_targets_mean": 2890.5, "valid_targets_min": 662 }, { "epoch": 6.968019680196802, "grad_norm": 0.6543423176496738, "learning_rate": 2.7435178657797546e-09, "loss": 0.1305, "loss_nan_ranks": 0, "loss_rank_avg": 0.065235935151577, "step": 5665, "valid_targets_mean": 3264.4, "valid_targets_min": 727 }, { "epoch": 6.974169741697417, "grad_norm": 0.5488408784889992, "learning_rate": 1.8214991085341304e-09, "loss": 0.1259, "loss_nan_ranks": 0, "loss_rank_avg": 0.05782807990908623, "step": 5670, "valid_targets_mean": 3813.8, "valid_targets_min": 684 }, { "epoch": 6.980319803198032, "grad_norm": 0.5867867676387645, "learning_rate": 1.0876373176671452e-09, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.06842830777168274, "step": 5675, "valid_targets_mean": 3599.1, "valid_targets_min": 1083 }, { "epoch": 6.9864698646986465, "grad_norm": 0.5561177687249769, "learning_rate": 5.419393978600696e-10, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.07188498973846436, "step": 5680, "valid_targets_mean": 3829.9, "valid_targets_min": 876 }, { "epoch": 6.992619926199262, "grad_norm": 0.616934525736705, "learning_rate": 1.8441048343031953e-10, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.06920751929283142, "step": 5685, "valid_targets_mean": 4424.5, "valid_targets_min": 604 }, { "epoch": 6.998769987699877, "grad_norm": 0.6400642366273652, "learning_rate": 1.5053938260400913e-11, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.04953449219465256, "step": 5690, "valid_targets_mean": 2385.9, "valid_targets_min": 933 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.06432667374610901, "step": 5691, "total_flos": 2.2910895883466834e+18, "train_loss": 0.08254917599345904, "train_runtime": 110755.8081, "train_samples_per_second": 0.822, "train_steps_per_second": 0.051, "valid_targets_mean": 3910.1, "valid_targets_min": 1232 } ], "logging_steps": 5, "max_steps": 5691, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.2910895883466834e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }