{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4375, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008, "grad_norm": 12.374207826720879, "learning_rate": 3.6529680365296803e-07, "loss": 0.673, "loss_nan_ranks": 0, "loss_rank_avg": 0.6549139022827148, "step": 5, "valid_targets_mean": 3321.2, "valid_targets_min": 857 }, { "epoch": 0.016, "grad_norm": 11.43057305648331, "learning_rate": 8.219178082191781e-07, "loss": 0.6633, "loss_nan_ranks": 0, "loss_rank_avg": 0.6954354643821716, "step": 10, "valid_targets_mean": 2652.1, "valid_targets_min": 682 }, { "epoch": 0.024, "grad_norm": 9.570235812016593, "learning_rate": 1.278538812785388e-06, "loss": 0.6271, "loss_nan_ranks": 0, "loss_rank_avg": 0.6770514249801636, "step": 15, "valid_targets_mean": 3358.0, "valid_targets_min": 739 }, { "epoch": 0.032, "grad_norm": 8.170405598762851, "learning_rate": 1.7351598173515982e-06, "loss": 0.6202, "loss_nan_ranks": 0, "loss_rank_avg": 0.5899783372879028, "step": 20, "valid_targets_mean": 4322.4, "valid_targets_min": 743 }, { "epoch": 0.04, "grad_norm": 3.6087283340453133, "learning_rate": 2.191780821917808e-06, "loss": 0.5571, "loss_nan_ranks": 0, "loss_rank_avg": 0.4666231572628021, "step": 25, "valid_targets_mean": 5854.6, "valid_targets_min": 718 }, { "epoch": 0.048, "grad_norm": 2.6527603461614553, "learning_rate": 2.6484018264840183e-06, "loss": 0.5838, "loss_nan_ranks": 0, "loss_rank_avg": 0.5448369979858398, "step": 30, "valid_targets_mean": 4481.5, "valid_targets_min": 920 }, { "epoch": 0.056, "grad_norm": 2.027006540805368, "learning_rate": 3.1050228310502285e-06, "loss": 0.5264, "loss_nan_ranks": 0, "loss_rank_avg": 0.5310207605361938, "step": 35, "valid_targets_mean": 2902.4, "valid_targets_min": 828 }, { "epoch": 0.064, "grad_norm": 1.8084836411086191, "learning_rate": 3.5616438356164386e-06, "loss": 0.5147, "loss_nan_ranks": 0, "loss_rank_avg": 0.5529466867446899, "step": 40, "valid_targets_mean": 2200.1, "valid_targets_min": 732 }, { "epoch": 0.072, "grad_norm": 1.0819999335224122, "learning_rate": 4.018264840182649e-06, "loss": 0.4949, "loss_nan_ranks": 0, "loss_rank_avg": 0.45418739318847656, "step": 45, "valid_targets_mean": 5406.0, "valid_targets_min": 864 }, { "epoch": 0.08, "grad_norm": 0.9962749166883843, "learning_rate": 4.4748858447488585e-06, "loss": 0.5261, "loss_nan_ranks": 0, "loss_rank_avg": 0.5496567487716675, "step": 50, "valid_targets_mean": 3678.8, "valid_targets_min": 902 }, { "epoch": 0.088, "grad_norm": 0.8013005822835737, "learning_rate": 4.931506849315069e-06, "loss": 0.4898, "loss_nan_ranks": 0, "loss_rank_avg": 0.5123369693756104, "step": 55, "valid_targets_mean": 4873.1, "valid_targets_min": 950 }, { "epoch": 0.096, "grad_norm": 0.6575479902865903, "learning_rate": 5.388127853881279e-06, "loss": 0.4628, "loss_nan_ranks": 0, "loss_rank_avg": 0.41041916608810425, "step": 60, "valid_targets_mean": 4923.4, "valid_targets_min": 887 }, { "epoch": 0.104, "grad_norm": 0.7006327660151911, "learning_rate": 5.8447488584474885e-06, "loss": 0.476, "loss_nan_ranks": 0, "loss_rank_avg": 0.4419603943824768, "step": 65, "valid_targets_mean": 3550.9, "valid_targets_min": 954 }, { "epoch": 0.112, "grad_norm": 0.6222761889218557, "learning_rate": 6.301369863013699e-06, "loss": 0.4573, "loss_nan_ranks": 0, "loss_rank_avg": 0.45139503479003906, "step": 70, "valid_targets_mean": 3806.9, "valid_targets_min": 779 }, { "epoch": 0.12, "grad_norm": 0.5620156952847125, "learning_rate": 6.757990867579909e-06, "loss": 0.4339, "loss_nan_ranks": 0, "loss_rank_avg": 0.44665512442588806, "step": 75, "valid_targets_mean": 4951.6, "valid_targets_min": 994 }, { "epoch": 0.128, "grad_norm": 0.49883881664127766, "learning_rate": 7.214611872146119e-06, "loss": 0.4414, "loss_nan_ranks": 0, "loss_rank_avg": 0.42222359776496887, "step": 80, "valid_targets_mean": 5721.9, "valid_targets_min": 909 }, { "epoch": 0.136, "grad_norm": 0.5538426247192075, "learning_rate": 7.671232876712329e-06, "loss": 0.4276, "loss_nan_ranks": 0, "loss_rank_avg": 0.4493791460990906, "step": 85, "valid_targets_mean": 4876.8, "valid_targets_min": 1047 }, { "epoch": 0.144, "grad_norm": 0.5791700438161751, "learning_rate": 8.127853881278539e-06, "loss": 0.4333, "loss_nan_ranks": 0, "loss_rank_avg": 0.4152202606201172, "step": 90, "valid_targets_mean": 3532.4, "valid_targets_min": 959 }, { "epoch": 0.152, "grad_norm": 0.5477499942337496, "learning_rate": 8.584474885844748e-06, "loss": 0.4003, "loss_nan_ranks": 0, "loss_rank_avg": 0.37116068601608276, "step": 95, "valid_targets_mean": 3519.7, "valid_targets_min": 1179 }, { "epoch": 0.16, "grad_norm": 0.5775964980586745, "learning_rate": 9.04109589041096e-06, "loss": 0.4339, "loss_nan_ranks": 0, "loss_rank_avg": 0.40842100977897644, "step": 100, "valid_targets_mean": 3587.7, "valid_targets_min": 875 }, { "epoch": 0.168, "grad_norm": 0.6430856727704666, "learning_rate": 9.49771689497717e-06, "loss": 0.4225, "loss_nan_ranks": 0, "loss_rank_avg": 0.47565746307373047, "step": 105, "valid_targets_mean": 3647.5, "valid_targets_min": 887 }, { "epoch": 0.176, "grad_norm": 0.716966298704087, "learning_rate": 9.95433789954338e-06, "loss": 0.3843, "loss_nan_ranks": 0, "loss_rank_avg": 0.42896223068237305, "step": 110, "valid_targets_mean": 2842.8, "valid_targets_min": 921 }, { "epoch": 0.184, "grad_norm": 0.5301806019840736, "learning_rate": 1.0410958904109589e-05, "loss": 0.3547, "loss_nan_ranks": 0, "loss_rank_avg": 0.3746205270290375, "step": 115, "valid_targets_mean": 3999.1, "valid_targets_min": 1007 }, { "epoch": 0.192, "grad_norm": 0.48241364109719725, "learning_rate": 1.08675799086758e-05, "loss": 0.3868, "loss_nan_ranks": 0, "loss_rank_avg": 0.33790087699890137, "step": 120, "valid_targets_mean": 5485.6, "valid_targets_min": 709 }, { "epoch": 0.2, "grad_norm": 0.38455061918249317, "learning_rate": 1.132420091324201e-05, "loss": 0.3826, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305814862251282, "step": 125, "valid_targets_mean": 7719.6, "valid_targets_min": 865 }, { "epoch": 0.208, "grad_norm": 0.4907444754258652, "learning_rate": 1.178082191780822e-05, "loss": 0.3677, "loss_nan_ranks": 0, "loss_rank_avg": 0.401222288608551, "step": 130, "valid_targets_mean": 4818.7, "valid_targets_min": 961 }, { "epoch": 0.216, "grad_norm": 0.45743331436009144, "learning_rate": 1.223744292237443e-05, "loss": 0.3565, "loss_nan_ranks": 0, "loss_rank_avg": 0.3574488162994385, "step": 135, "valid_targets_mean": 5390.3, "valid_targets_min": 978 }, { "epoch": 0.224, "grad_norm": 0.511011558834825, "learning_rate": 1.2694063926940641e-05, "loss": 0.3764, "loss_nan_ranks": 0, "loss_rank_avg": 0.3379029631614685, "step": 140, "valid_targets_mean": 5142.8, "valid_targets_min": 893 }, { "epoch": 0.232, "grad_norm": 0.5822963240467418, "learning_rate": 1.3150684931506849e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.34744590520858765, "step": 145, "valid_targets_mean": 5302.1, "valid_targets_min": 880 }, { "epoch": 0.24, "grad_norm": 0.6216847277162149, "learning_rate": 1.360730593607306e-05, "loss": 0.3759, "loss_nan_ranks": 0, "loss_rank_avg": 0.3552771210670471, "step": 150, "valid_targets_mean": 4948.8, "valid_targets_min": 814 }, { "epoch": 0.248, "grad_norm": 0.574367767908384, "learning_rate": 1.406392694063927e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.3638104498386383, "step": 155, "valid_targets_mean": 3668.3, "valid_targets_min": 763 }, { "epoch": 0.256, "grad_norm": 0.5264337459661648, "learning_rate": 1.4520547945205482e-05, "loss": 0.3625, "loss_nan_ranks": 0, "loss_rank_avg": 0.3273163437843323, "step": 160, "valid_targets_mean": 4477.4, "valid_targets_min": 926 }, { "epoch": 0.264, "grad_norm": 0.49616555200759516, "learning_rate": 1.497716894977169e-05, "loss": 0.3732, "loss_nan_ranks": 0, "loss_rank_avg": 0.3494306802749634, "step": 165, "valid_targets_mean": 4903.5, "valid_targets_min": 766 }, { "epoch": 0.272, "grad_norm": 0.5183306288028923, "learning_rate": 1.54337899543379e-05, "loss": 0.3495, "loss_nan_ranks": 0, "loss_rank_avg": 0.32361409068107605, "step": 170, "valid_targets_mean": 4151.4, "valid_targets_min": 979 }, { "epoch": 0.28, "grad_norm": 0.6625899937361988, "learning_rate": 1.589041095890411e-05, "loss": 0.3497, "loss_nan_ranks": 0, "loss_rank_avg": 0.3405327796936035, "step": 175, "valid_targets_mean": 2944.8, "valid_targets_min": 843 }, { "epoch": 0.288, "grad_norm": 0.521897584371646, "learning_rate": 1.634703196347032e-05, "loss": 0.3227, "loss_nan_ranks": 0, "loss_rank_avg": 0.3742603063583374, "step": 180, "valid_targets_mean": 4572.4, "valid_targets_min": 872 }, { "epoch": 0.296, "grad_norm": 0.49053163267667843, "learning_rate": 1.680365296803653e-05, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.30405259132385254, "step": 185, "valid_targets_mean": 5678.8, "valid_targets_min": 629 }, { "epoch": 0.304, "grad_norm": 0.9074873265259921, "learning_rate": 1.726027397260274e-05, "loss": 0.3689, "loss_nan_ranks": 0, "loss_rank_avg": 0.5085344314575195, "step": 190, "valid_targets_mean": 2015.6, "valid_targets_min": 976 }, { "epoch": 0.312, "grad_norm": 0.7231403812681834, "learning_rate": 1.771689497716895e-05, "loss": 0.3531, "loss_nan_ranks": 0, "loss_rank_avg": 0.4101080000400543, "step": 195, "valid_targets_mean": 3050.3, "valid_targets_min": 869 }, { "epoch": 0.32, "grad_norm": 0.4901983123951643, "learning_rate": 1.8173515981735163e-05, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.3015870749950409, "step": 200, "valid_targets_mean": 6477.4, "valid_targets_min": 788 }, { "epoch": 0.328, "grad_norm": 0.7091813307576407, "learning_rate": 1.863013698630137e-05, "loss": 0.3278, "loss_nan_ranks": 0, "loss_rank_avg": 0.36794477701187134, "step": 205, "valid_targets_mean": 2819.5, "valid_targets_min": 648 }, { "epoch": 0.336, "grad_norm": 0.6242515345896389, "learning_rate": 1.9086757990867582e-05, "loss": 0.3378, "loss_nan_ranks": 0, "loss_rank_avg": 0.38683176040649414, "step": 210, "valid_targets_mean": 3260.6, "valid_targets_min": 822 }, { "epoch": 0.344, "grad_norm": 0.5367951319766895, "learning_rate": 1.954337899543379e-05, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.31571871042251587, "step": 215, "valid_targets_mean": 4805.6, "valid_targets_min": 1114 }, { "epoch": 0.352, "grad_norm": 0.7441017340177637, "learning_rate": 2e-05, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.35355275869369507, "step": 220, "valid_targets_mean": 2396.6, "valid_targets_min": 889 }, { "epoch": 0.36, "grad_norm": 0.5463780408548322, "learning_rate": 2.045662100456621e-05, "loss": 0.3252, "loss_nan_ranks": 0, "loss_rank_avg": 0.2769712805747986, "step": 225, "valid_targets_mean": 4953.7, "valid_targets_min": 938 }, { "epoch": 0.368, "grad_norm": 0.5117792360088306, "learning_rate": 2.0913242009132424e-05, "loss": 0.334, "loss_nan_ranks": 0, "loss_rank_avg": 0.3192422389984131, "step": 230, "valid_targets_mean": 5398.4, "valid_targets_min": 917 }, { "epoch": 0.376, "grad_norm": 0.6081591338406857, "learning_rate": 2.1369863013698632e-05, "loss": 0.3315, "loss_nan_ranks": 0, "loss_rank_avg": 0.3515390157699585, "step": 235, "valid_targets_mean": 3282.2, "valid_targets_min": 1082 }, { "epoch": 0.384, "grad_norm": 0.5361233007075954, "learning_rate": 2.182648401826484e-05, "loss": 0.327, "loss_nan_ranks": 0, "loss_rank_avg": 0.33629757165908813, "step": 240, "valid_targets_mean": 5654.5, "valid_targets_min": 794 }, { "epoch": 0.392, "grad_norm": 0.4879945295289328, "learning_rate": 2.2283105022831052e-05, "loss": 0.3186, "loss_nan_ranks": 0, "loss_rank_avg": 0.2991241216659546, "step": 245, "valid_targets_mean": 6910.0, "valid_targets_min": 693 }, { "epoch": 0.4, "grad_norm": 0.5818121087256863, "learning_rate": 2.2739726027397263e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.2698156237602234, "step": 250, "valid_targets_mean": 5727.4, "valid_targets_min": 837 }, { "epoch": 0.408, "grad_norm": 0.5484701967234875, "learning_rate": 2.3196347031963475e-05, "loss": 0.3167, "loss_nan_ranks": 0, "loss_rank_avg": 0.2877916991710663, "step": 255, "valid_targets_mean": 3935.9, "valid_targets_min": 908 }, { "epoch": 0.416, "grad_norm": 0.7598295746278937, "learning_rate": 2.3652968036529683e-05, "loss": 0.3256, "loss_nan_ranks": 0, "loss_rank_avg": 0.379886269569397, "step": 260, "valid_targets_mean": 3017.8, "valid_targets_min": 929 }, { "epoch": 0.424, "grad_norm": 0.6292837735711766, "learning_rate": 2.410958904109589e-05, "loss": 0.3291, "loss_nan_ranks": 0, "loss_rank_avg": 0.3254546821117401, "step": 265, "valid_targets_mean": 3521.9, "valid_targets_min": 1022 }, { "epoch": 0.432, "grad_norm": 0.507874716177431, "learning_rate": 2.4566210045662106e-05, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930123805999756, "step": 270, "valid_targets_mean": 4279.1, "valid_targets_min": 845 }, { "epoch": 0.44, "grad_norm": 0.4869811841188768, "learning_rate": 2.5022831050228314e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.295903742313385, "step": 275, "valid_targets_mean": 5994.6, "valid_targets_min": 807 }, { "epoch": 0.448, "grad_norm": 0.618514883028784, "learning_rate": 2.547945205479452e-05, "loss": 0.3316, "loss_nan_ranks": 0, "loss_rank_avg": 0.32905834913253784, "step": 280, "valid_targets_mean": 4779.1, "valid_targets_min": 1148 }, { "epoch": 0.456, "grad_norm": 0.6790060720865024, "learning_rate": 2.593607305936073e-05, "loss": 0.3311, "loss_nan_ranks": 0, "loss_rank_avg": 0.3841496706008911, "step": 285, "valid_targets_mean": 3403.9, "valid_targets_min": 723 }, { "epoch": 0.464, "grad_norm": 1.3404239047851452, "learning_rate": 2.6392694063926944e-05, "loss": 0.3167, "loss_nan_ranks": 0, "loss_rank_avg": 0.29200658202171326, "step": 290, "valid_targets_mean": 4245.9, "valid_targets_min": 657 }, { "epoch": 0.472, "grad_norm": 0.5708709470409948, "learning_rate": 2.6849315068493153e-05, "loss": 0.3095, "loss_nan_ranks": 0, "loss_rank_avg": 0.30335745215415955, "step": 295, "valid_targets_mean": 4115.2, "valid_targets_min": 1058 }, { "epoch": 0.48, "grad_norm": 0.601194220459844, "learning_rate": 2.7305936073059364e-05, "loss": 0.3138, "loss_nan_ranks": 0, "loss_rank_avg": 0.4048035740852356, "step": 300, "valid_targets_mean": 5644.8, "valid_targets_min": 1055 }, { "epoch": 0.488, "grad_norm": 0.5494984385782556, "learning_rate": 2.7762557077625572e-05, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.29575061798095703, "step": 305, "valid_targets_mean": 5261.0, "valid_targets_min": 734 }, { "epoch": 0.496, "grad_norm": 0.5098156256599904, "learning_rate": 2.8219178082191783e-05, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.3082813024520874, "step": 310, "valid_targets_mean": 6082.6, "valid_targets_min": 826 }, { "epoch": 0.504, "grad_norm": 0.5159281940057138, "learning_rate": 2.8675799086757995e-05, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.3101263642311096, "step": 315, "valid_targets_mean": 5008.8, "valid_targets_min": 806 }, { "epoch": 0.512, "grad_norm": 0.6804451743074025, "learning_rate": 2.9132420091324203e-05, "loss": 0.3051, "loss_nan_ranks": 0, "loss_rank_avg": 0.29619288444519043, "step": 320, "valid_targets_mean": 4585.7, "valid_targets_min": 1016 }, { "epoch": 0.52, "grad_norm": 0.5850935505815877, "learning_rate": 2.958904109589041e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.28627079725265503, "step": 325, "valid_targets_mean": 3302.2, "valid_targets_min": 966 }, { "epoch": 0.528, "grad_norm": 0.965007545709362, "learning_rate": 3.0045662100456626e-05, "loss": 0.3114, "loss_nan_ranks": 0, "loss_rank_avg": 0.35180073976516724, "step": 330, "valid_targets_mean": 3250.3, "valid_targets_min": 829 }, { "epoch": 0.536, "grad_norm": 0.5381764485997723, "learning_rate": 3.0502283105022834e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.2976144552230835, "step": 335, "valid_targets_mean": 4887.6, "valid_targets_min": 827 }, { "epoch": 0.544, "grad_norm": 0.648507415849347, "learning_rate": 3.0958904109589045e-05, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.3534129858016968, "step": 340, "valid_targets_mean": 4146.6, "valid_targets_min": 1034 }, { "epoch": 0.552, "grad_norm": 0.5712482499204495, "learning_rate": 3.141552511415525e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.25627678632736206, "step": 345, "valid_targets_mean": 4196.8, "valid_targets_min": 917 }, { "epoch": 0.56, "grad_norm": 0.44280064147997866, "learning_rate": 3.187214611872147e-05, "loss": 0.2947, "loss_nan_ranks": 0, "loss_rank_avg": 0.29131901264190674, "step": 350, "valid_targets_mean": 6720.6, "valid_targets_min": 1054 }, { "epoch": 0.568, "grad_norm": 0.5998227591824579, "learning_rate": 3.2328767123287676e-05, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.2890249192714691, "step": 355, "valid_targets_mean": 3408.9, "valid_targets_min": 973 }, { "epoch": 0.576, "grad_norm": 0.7483944088873048, "learning_rate": 3.2785388127853884e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.3844132721424103, "step": 360, "valid_targets_mean": 4073.4, "valid_targets_min": 893 }, { "epoch": 0.584, "grad_norm": 0.5805802611531444, "learning_rate": 3.324200913242009e-05, "loss": 0.2985, "loss_nan_ranks": 0, "loss_rank_avg": 0.31355297565460205, "step": 365, "valid_targets_mean": 3970.4, "valid_targets_min": 796 }, { "epoch": 0.592, "grad_norm": 0.6042096610158246, "learning_rate": 3.369863013698631e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.2948343753814697, "step": 370, "valid_targets_mean": 3084.6, "valid_targets_min": 677 }, { "epoch": 0.6, "grad_norm": 0.6461668885744746, "learning_rate": 3.4155251141552515e-05, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.2847023010253906, "step": 375, "valid_targets_mean": 3152.9, "valid_targets_min": 827 }, { "epoch": 0.608, "grad_norm": 0.6252813642439993, "learning_rate": 3.461187214611872e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.31125932931900024, "step": 380, "valid_targets_mean": 3398.4, "valid_targets_min": 714 }, { "epoch": 0.616, "grad_norm": 0.5513266421188043, "learning_rate": 3.506849315068493e-05, "loss": 0.302, "loss_nan_ranks": 0, "loss_rank_avg": 0.3118017315864563, "step": 385, "valid_targets_mean": 4706.7, "valid_targets_min": 870 }, { "epoch": 0.624, "grad_norm": 0.5782519741863913, "learning_rate": 3.5525114155251146e-05, "loss": 0.3088, "loss_nan_ranks": 0, "loss_rank_avg": 0.272940993309021, "step": 390, "valid_targets_mean": 3489.2, "valid_targets_min": 855 }, { "epoch": 0.632, "grad_norm": 0.4835190489595145, "learning_rate": 3.5981735159817354e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.24451082944869995, "step": 395, "valid_targets_mean": 6700.7, "valid_targets_min": 865 }, { "epoch": 0.64, "grad_norm": 0.5678926388355849, "learning_rate": 3.643835616438356e-05, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.27626603841781616, "step": 400, "valid_targets_mean": 3785.8, "valid_targets_min": 662 }, { "epoch": 0.648, "grad_norm": 0.5159242200400144, "learning_rate": 3.689497716894977e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.26561927795410156, "step": 405, "valid_targets_mean": 4753.9, "valid_targets_min": 870 }, { "epoch": 0.656, "grad_norm": 0.6417729066274248, "learning_rate": 3.7351598173515985e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.36154353618621826, "step": 410, "valid_targets_mean": 3772.2, "valid_targets_min": 1060 }, { "epoch": 0.664, "grad_norm": 0.5052939522988528, "learning_rate": 3.780821917808219e-05, "loss": 0.2794, "loss_nan_ranks": 0, "loss_rank_avg": 0.2737759053707123, "step": 415, "valid_targets_mean": 6162.9, "valid_targets_min": 978 }, { "epoch": 0.672, "grad_norm": 0.41783612659228964, "learning_rate": 3.82648401826484e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.2618584930896759, "step": 420, "valid_targets_mean": 9499.0, "valid_targets_min": 1090 }, { "epoch": 0.68, "grad_norm": 1.0340429120195325, "learning_rate": 3.8721461187214615e-05, "loss": 0.311, "loss_nan_ranks": 0, "loss_rank_avg": 0.3576170802116394, "step": 425, "valid_targets_mean": 3117.8, "valid_targets_min": 1019 }, { "epoch": 0.688, "grad_norm": 0.6432463334293257, "learning_rate": 3.9178082191780823e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.31897398829460144, "step": 430, "valid_targets_mean": 2963.1, "valid_targets_min": 845 }, { "epoch": 0.696, "grad_norm": 0.6510917417085519, "learning_rate": 3.963470319634704e-05, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.3051530718803406, "step": 435, "valid_targets_mean": 3365.6, "valid_targets_min": 974 }, { "epoch": 0.704, "grad_norm": 0.5340165987215613, "learning_rate": 3.99999936325009e-05, "loss": 0.3129, "loss_nan_ranks": 0, "loss_rank_avg": 0.3342752456665039, "step": 440, "valid_targets_mean": 4853.4, "valid_targets_min": 1068 }, { "epoch": 0.712, "grad_norm": 0.5677728076782123, "learning_rate": 3.9999770770457856e-05, "loss": 0.3128, "loss_nan_ranks": 0, "loss_rank_avg": 0.2853566110134125, "step": 445, "valid_targets_mean": 4938.3, "valid_targets_min": 910 }, { "epoch": 0.72, "grad_norm": 0.566650322028894, "learning_rate": 3.9999229537513936e-05, "loss": 0.2989, "loss_nan_ranks": 0, "loss_rank_avg": 0.27975791692733765, "step": 450, "valid_targets_mean": 3907.8, "valid_targets_min": 793 }, { "epoch": 0.728, "grad_norm": 0.512996855287856, "learning_rate": 3.999836994228487e-05, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.2654213011264801, "step": 455, "valid_targets_mean": 3657.9, "valid_targets_min": 976 }, { "epoch": 0.736, "grad_norm": 0.5712508862988912, "learning_rate": 3.999719199845432e-05, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.28030380606651306, "step": 460, "valid_targets_mean": 3826.2, "valid_targets_min": 791 }, { "epoch": 0.744, "grad_norm": 0.550763618650829, "learning_rate": 3.999569572477366e-05, "loss": 0.3016, "loss_nan_ranks": 0, "loss_rank_avg": 0.2925485074520111, "step": 465, "valid_targets_mean": 3767.2, "valid_targets_min": 1074 }, { "epoch": 0.752, "grad_norm": 0.4844778100988879, "learning_rate": 3.999388114506166e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.28359127044677734, "step": 470, "valid_targets_mean": 5441.2, "valid_targets_min": 1040 }, { "epoch": 0.76, "grad_norm": 0.5223336482223219, "learning_rate": 3.999174828820413e-05, "loss": 0.3165, "loss_nan_ranks": 0, "loss_rank_avg": 0.2604113817214966, "step": 475, "valid_targets_mean": 4254.1, "valid_targets_min": 662 }, { "epoch": 0.768, "grad_norm": 0.7085323476959958, "learning_rate": 3.998929718815341e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.366795152425766, "step": 480, "valid_targets_mean": 3101.3, "valid_targets_min": 941 }, { "epoch": 0.776, "grad_norm": 0.5280273815145139, "learning_rate": 3.998652788392792e-05, "loss": 0.2805, "loss_nan_ranks": 0, "loss_rank_avg": 0.2906476855278015, "step": 485, "valid_targets_mean": 4255.8, "valid_targets_min": 968 }, { "epoch": 0.784, "grad_norm": 0.45090956227053314, "learning_rate": 3.9983440419611445e-05, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.23735715448856354, "step": 490, "valid_targets_mean": 4642.8, "valid_targets_min": 868 }, { "epoch": 0.792, "grad_norm": 0.4683162495835124, "learning_rate": 3.9980034844352494e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.268685519695282, "step": 495, "valid_targets_mean": 6424.1, "valid_targets_min": 1279 }, { "epoch": 0.8, "grad_norm": 0.517351165125786, "learning_rate": 3.9976311212363495e-05, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.3032742142677307, "step": 500, "valid_targets_mean": 4640.5, "valid_targets_min": 738 }, { "epoch": 0.808, "grad_norm": 0.5071613397785332, "learning_rate": 3.997226958291992e-05, "loss": 0.3027, "loss_nan_ranks": 0, "loss_rank_avg": 0.26866069436073303, "step": 505, "valid_targets_mean": 5655.1, "valid_targets_min": 905 }, { "epoch": 0.816, "grad_norm": 0.6466486162647562, "learning_rate": 3.996791002035937e-05, "loss": 0.3158, "loss_nan_ranks": 0, "loss_rank_avg": 0.4299527406692505, "step": 510, "valid_targets_mean": 3593.1, "valid_targets_min": 859 }, { "epoch": 0.824, "grad_norm": 0.5443624306552559, "learning_rate": 3.996323259408055e-05, "loss": 0.3062, "loss_nan_ranks": 0, "loss_rank_avg": 0.2630675435066223, "step": 515, "valid_targets_mean": 7815.6, "valid_targets_min": 532 }, { "epoch": 0.832, "grad_norm": 0.6243451089128813, "learning_rate": 3.995823737854211e-05, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.3227846622467041, "step": 520, "valid_targets_mean": 3138.6, "valid_targets_min": 757 }, { "epoch": 0.84, "grad_norm": 0.6022810456897381, "learning_rate": 3.9952924453261534e-05, "loss": 0.3032, "loss_nan_ranks": 0, "loss_rank_avg": 0.3212684988975525, "step": 525, "valid_targets_mean": 3576.4, "valid_targets_min": 914 }, { "epoch": 0.848, "grad_norm": 0.5723242679917651, "learning_rate": 3.994729390281384e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.2988251745700836, "step": 530, "valid_targets_mean": 4023.6, "valid_targets_min": 722 }, { "epoch": 0.856, "grad_norm": 0.5462336841915116, "learning_rate": 3.994134581683021e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.2816080152988434, "step": 535, "valid_targets_mean": 3982.4, "valid_targets_min": 1090 }, { "epoch": 0.864, "grad_norm": 0.4918215735498511, "learning_rate": 3.9935080289996626e-05, "loss": 0.298, "loss_nan_ranks": 0, "loss_rank_avg": 0.26696616411209106, "step": 540, "valid_targets_mean": 5292.1, "valid_targets_min": 839 }, { "epoch": 0.872, "grad_norm": 0.6349909083508697, "learning_rate": 3.992849742205228e-05, "loss": 0.281, "loss_nan_ranks": 0, "loss_rank_avg": 0.32703348994255066, "step": 545, "valid_targets_mean": 3155.8, "valid_targets_min": 712 }, { "epoch": 0.88, "grad_norm": 0.455853550279736, "learning_rate": 3.9921597317788065e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.2557429075241089, "step": 550, "valid_targets_mean": 4919.1, "valid_targets_min": 767 }, { "epoch": 0.888, "grad_norm": 0.6086037931430966, "learning_rate": 3.991438008704486e-05, "loss": 0.281, "loss_nan_ranks": 0, "loss_rank_avg": 0.33778220415115356, "step": 555, "valid_targets_mean": 3085.8, "valid_targets_min": 820 }, { "epoch": 0.896, "grad_norm": 0.5213582280989516, "learning_rate": 3.990684584471179e-05, "loss": 0.2946, "loss_nan_ranks": 0, "loss_rank_avg": 0.29489654302597046, "step": 560, "valid_targets_mean": 4436.3, "valid_targets_min": 779 }, { "epoch": 0.904, "grad_norm": 0.5843714438083748, "learning_rate": 3.989899471072441e-05, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.26970839500427246, "step": 565, "valid_targets_mean": 2767.6, "valid_targets_min": 835 }, { "epoch": 0.912, "grad_norm": 0.541008479057164, "learning_rate": 3.9890826810062784e-05, "loss": 0.2861, "loss_nan_ranks": 0, "loss_rank_avg": 0.25051432847976685, "step": 570, "valid_targets_mean": 3267.8, "valid_targets_min": 901 }, { "epoch": 0.92, "grad_norm": 0.44648718657516523, "learning_rate": 3.988234227274949e-05, "loss": 0.2902, "loss_nan_ranks": 0, "loss_rank_avg": 0.28003740310668945, "step": 575, "valid_targets_mean": 5206.3, "valid_targets_min": 616 }, { "epoch": 0.928, "grad_norm": 0.5963913155091053, "learning_rate": 3.987354123384757e-05, "loss": 0.2813, "loss_nan_ranks": 0, "loss_rank_avg": 0.27831757068634033, "step": 580, "valid_targets_mean": 3726.2, "valid_targets_min": 1063 }, { "epoch": 0.936, "grad_norm": 0.5529862065194503, "learning_rate": 3.9864423833458364e-05, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.33845236897468567, "step": 585, "valid_targets_mean": 3352.5, "valid_targets_min": 1010 }, { "epoch": 0.944, "grad_norm": 0.5276685630923462, "learning_rate": 3.9854990216719285e-05, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.30608147382736206, "step": 590, "valid_targets_mean": 3963.6, "valid_targets_min": 960 }, { "epoch": 0.952, "grad_norm": 0.5761410220991169, "learning_rate": 3.98452405338015e-05, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.3611443042755127, "step": 595, "valid_targets_mean": 3870.4, "valid_targets_min": 670 }, { "epoch": 0.96, "grad_norm": 0.43161899888992733, "learning_rate": 3.983517493990756e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.2567683458328247, "step": 600, "valid_targets_mean": 5753.8, "valid_targets_min": 1022 }, { "epoch": 0.968, "grad_norm": 0.5174699444690888, "learning_rate": 3.982479359526892e-05, "loss": 0.2846, "loss_nan_ranks": 0, "loss_rank_avg": 0.31545543670654297, "step": 605, "valid_targets_mean": 4297.7, "valid_targets_min": 1026 }, { "epoch": 0.976, "grad_norm": 0.5582649393151906, "learning_rate": 3.981409666514336e-05, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.28723669052124023, "step": 610, "valid_targets_mean": 3499.9, "valid_targets_min": 730 }, { "epoch": 0.984, "grad_norm": 0.4569144879632991, "learning_rate": 3.98030843198124e-05, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.26559823751449585, "step": 615, "valid_targets_mean": 3593.3, "valid_targets_min": 764 }, { "epoch": 0.992, "grad_norm": 0.5364468262792286, "learning_rate": 3.979175673457858e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.2658482491970062, "step": 620, "valid_targets_mean": 3494.4, "valid_targets_min": 670 }, { "epoch": 1.0, "grad_norm": 0.589932569473527, "learning_rate": 3.9780114089762616e-05, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.2865822911262512, "step": 625, "valid_targets_mean": 3167.1, "valid_targets_min": 924 }, { "epoch": 1.008, "grad_norm": 0.4223733533410392, "learning_rate": 3.976815657070062e-05, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.24453572928905487, "step": 630, "valid_targets_mean": 5350.5, "valid_targets_min": 909 }, { "epoch": 1.016, "grad_norm": 0.5617173103201819, "learning_rate": 3.975588436774107e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.2646633982658386, "step": 635, "valid_targets_mean": 3123.4, "valid_targets_min": 1007 }, { "epoch": 1.024, "grad_norm": 0.5490235878628557, "learning_rate": 3.9743297676241826e-05, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.2878129184246063, "step": 640, "valid_targets_mean": 4515.7, "valid_targets_min": 784 }, { "epoch": 1.032, "grad_norm": 0.8694303583221871, "learning_rate": 3.9730396696566994e-05, "loss": 0.299, "loss_nan_ranks": 0, "loss_rank_avg": 0.39216941595077515, "step": 645, "valid_targets_mean": 1941.7, "valid_targets_min": 1014 }, { "epoch": 1.04, "grad_norm": 0.5176313613959357, "learning_rate": 3.971718163408375e-05, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930067777633667, "step": 650, "valid_targets_mean": 4818.8, "valid_targets_min": 1106 }, { "epoch": 1.048, "grad_norm": 0.44358594950793484, "learning_rate": 3.9703652699159093e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.30579259991645813, "step": 655, "valid_targets_mean": 5172.5, "valid_targets_min": 871 }, { "epoch": 1.056, "grad_norm": 0.5740468844331686, "learning_rate": 3.9689810107156425e-05, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.3474939167499542, "step": 660, "valid_targets_mean": 4049.9, "valid_targets_min": 821 }, { "epoch": 1.064, "grad_norm": 0.5556529187566539, "learning_rate": 3.967565407843222e-05, "loss": 0.2977, "loss_nan_ranks": 0, "loss_rank_avg": 0.29836633801460266, "step": 665, "valid_targets_mean": 4204.5, "valid_targets_min": 1348 }, { "epoch": 1.072, "grad_norm": 0.5024698593720891, "learning_rate": 3.966118483833242e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.26958394050598145, "step": 670, "valid_targets_mean": 4268.8, "valid_targets_min": 1033 }, { "epoch": 1.08, "grad_norm": 0.4842800380286951, "learning_rate": 3.964640261718893e-05, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.26958194375038147, "step": 675, "valid_targets_mean": 3595.6, "valid_targets_min": 862 }, { "epoch": 1.088, "grad_norm": 0.5273262657978705, "learning_rate": 3.963130765031589e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.2689908444881439, "step": 680, "valid_targets_mean": 3801.2, "valid_targets_min": 1022 }, { "epoch": 1.096, "grad_norm": 0.5751221396165925, "learning_rate": 3.961590017800598e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.2882736027240753, "step": 685, "valid_targets_mean": 3101.3, "valid_targets_min": 664 }, { "epoch": 1.104, "grad_norm": 0.5471508339834354, "learning_rate": 3.960018044552653e-05, "loss": 0.2994, "loss_nan_ranks": 0, "loss_rank_avg": 0.31060564517974854, "step": 690, "valid_targets_mean": 3763.3, "valid_targets_min": 846 }, { "epoch": 1.112, "grad_norm": 0.5792478778548963, "learning_rate": 3.9584148703115704e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.2743430435657501, "step": 695, "valid_targets_mean": 2966.4, "valid_targets_min": 1021 }, { "epoch": 1.12, "grad_norm": 0.5701845098447167, "learning_rate": 3.956780520597842e-05, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.31023383140563965, "step": 700, "valid_targets_mean": 3593.6, "valid_targets_min": 748 }, { "epoch": 1.1280000000000001, "grad_norm": 0.4243313433223685, "learning_rate": 3.955115021428236e-05, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508736550807953, "step": 705, "valid_targets_mean": 5902.2, "valid_targets_min": 912 }, { "epoch": 1.1360000000000001, "grad_norm": 0.4790109609572266, "learning_rate": 3.95341839931538e-05, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.2982293367385864, "step": 710, "valid_targets_mean": 5286.7, "valid_targets_min": 1022 }, { "epoch": 1.144, "grad_norm": 0.5585199616419411, "learning_rate": 3.95169068126734e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.2889254093170166, "step": 715, "valid_targets_mean": 2680.4, "valid_targets_min": 822 }, { "epoch": 1.152, "grad_norm": 0.393666834541853, "learning_rate": 3.949931894787187e-05, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.22171318531036377, "step": 720, "valid_targets_mean": 6140.5, "valid_targets_min": 913 }, { "epoch": 1.16, "grad_norm": 0.4554560378266813, "learning_rate": 3.948142067872565e-05, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.276266485452652, "step": 725, "valid_targets_mean": 4809.1, "valid_targets_min": 1074 }, { "epoch": 1.168, "grad_norm": 0.4943688708217394, "learning_rate": 3.946321229015241e-05, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.2835407853126526, "step": 730, "valid_targets_mean": 4429.9, "valid_targets_min": 1050 }, { "epoch": 1.176, "grad_norm": 0.4477093216825828, "learning_rate": 3.944469407200652e-05, "loss": 0.2788, "loss_nan_ranks": 0, "loss_rank_avg": 0.23854275047779083, "step": 735, "valid_targets_mean": 4396.1, "valid_targets_min": 855 }, { "epoch": 1.184, "grad_norm": 0.5896727157094116, "learning_rate": 3.942586631907444e-05, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.2517150044441223, "step": 740, "valid_targets_mean": 3115.4, "valid_targets_min": 850 }, { "epoch": 1.192, "grad_norm": 0.5289038060630349, "learning_rate": 3.9406729331070054e-05, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.2541031539440155, "step": 745, "valid_targets_mean": 3815.3, "valid_targets_min": 962 }, { "epoch": 1.2, "grad_norm": 0.44733647620635336, "learning_rate": 3.938728341262985e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.2868531048297882, "step": 750, "valid_targets_mean": 4895.9, "valid_targets_min": 623 }, { "epoch": 1.208, "grad_norm": 0.7202988131820695, "learning_rate": 3.936752887330812e-05, "loss": 0.289, "loss_nan_ranks": 0, "loss_rank_avg": 0.3202763497829437, "step": 755, "valid_targets_mean": 2302.6, "valid_targets_min": 929 }, { "epoch": 1.216, "grad_norm": 0.5140036991263218, "learning_rate": 3.9347466027571975e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.2578458786010742, "step": 760, "valid_targets_mean": 4010.8, "valid_targets_min": 832 }, { "epoch": 1.224, "grad_norm": 0.5537418130011722, "learning_rate": 3.932709519479639e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.2952079176902771, "step": 765, "valid_targets_mean": 3206.0, "valid_targets_min": 800 }, { "epoch": 1.232, "grad_norm": 0.49323600062823847, "learning_rate": 3.930641669925911e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.264598548412323, "step": 770, "valid_targets_mean": 3837.5, "valid_targets_min": 878 }, { "epoch": 1.24, "grad_norm": 0.46711652952383553, "learning_rate": 3.928543087013546e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.27722471952438354, "step": 775, "valid_targets_mean": 4181.8, "valid_targets_min": 877 }, { "epoch": 1.248, "grad_norm": 0.43556151715805724, "learning_rate": 3.926413804149315e-05, "loss": 0.2631, "loss_nan_ranks": 0, "loss_rank_avg": 0.21522939205169678, "step": 780, "valid_targets_mean": 4802.7, "valid_targets_min": 978 }, { "epoch": 1.256, "grad_norm": 0.6366361986050708, "learning_rate": 3.9242538552286894e-05, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.32596951723098755, "step": 785, "valid_targets_mean": 2695.1, "valid_targets_min": 707 }, { "epoch": 1.264, "grad_norm": 0.5512190834498045, "learning_rate": 3.9220632746353096e-05, "loss": 0.2994, "loss_nan_ranks": 0, "loss_rank_avg": 0.3354596495628357, "step": 790, "valid_targets_mean": 3169.8, "valid_targets_min": 714 }, { "epoch": 1.272, "grad_norm": 0.4994124792250944, "learning_rate": 3.91984209724043e-05, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.24309590458869934, "step": 795, "valid_targets_mean": 3187.5, "valid_targets_min": 717 }, { "epoch": 1.28, "grad_norm": 0.5058818429479062, "learning_rate": 3.917590358402369e-05, "loss": 0.2748, "loss_nan_ranks": 0, "loss_rank_avg": 0.2896243929862976, "step": 800, "valid_targets_mean": 4368.1, "valid_targets_min": 662 }, { "epoch": 1.288, "grad_norm": 0.5741606754229182, "learning_rate": 3.915308093965943e-05, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.31103113293647766, "step": 805, "valid_targets_mean": 3463.2, "valid_targets_min": 1093 }, { "epoch": 1.296, "grad_norm": 0.5269169994703332, "learning_rate": 3.9129953402618976e-05, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.28437525033950806, "step": 810, "valid_targets_mean": 3127.5, "valid_targets_min": 768 }, { "epoch": 1.304, "grad_norm": 0.5105272259938182, "learning_rate": 3.91065213410633e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.27728912234306335, "step": 815, "valid_targets_mean": 3164.8, "valid_targets_min": 954 }, { "epoch": 1.312, "grad_norm": 0.7068657863624991, "learning_rate": 3.908278512800098e-05, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.30154961347579956, "step": 820, "valid_targets_mean": 2021.1, "valid_targets_min": 771 }, { "epoch": 1.32, "grad_norm": 0.43262404009468025, "learning_rate": 3.905874514128235e-05, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.22265702486038208, "step": 825, "valid_targets_mean": 5069.6, "valid_targets_min": 1046 }, { "epoch": 1.328, "grad_norm": 0.4833800812123599, "learning_rate": 3.903440176359338e-05, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.2597518265247345, "step": 830, "valid_targets_mean": 4273.6, "valid_targets_min": 642 }, { "epoch": 1.336, "grad_norm": 0.495986902645752, "learning_rate": 3.90097553824497e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.26148658990859985, "step": 835, "valid_targets_mean": 3473.2, "valid_targets_min": 558 }, { "epoch": 1.3439999999999999, "grad_norm": 0.51848462208148, "learning_rate": 3.8984806390190304e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.30521005392074585, "step": 840, "valid_targets_mean": 3706.1, "valid_targets_min": 1051 }, { "epoch": 1.3519999999999999, "grad_norm": 0.557804275665896, "learning_rate": 3.895955518397141e-05, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.2697344124317169, "step": 845, "valid_targets_mean": 2746.5, "valid_targets_min": 976 }, { "epoch": 1.3599999999999999, "grad_norm": 0.4866612431488525, "learning_rate": 3.893400216576011e-05, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.24589639902114868, "step": 850, "valid_targets_mean": 3582.2, "valid_targets_min": 765 }, { "epoch": 1.3679999999999999, "grad_norm": 0.46312511696658815, "learning_rate": 3.89081477423279e-05, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.25814926624298096, "step": 855, "valid_targets_mean": 4407.3, "valid_targets_min": 820 }, { "epoch": 1.376, "grad_norm": 0.4559151598342351, "learning_rate": 3.888199232524434e-05, "loss": 0.2737, "loss_nan_ranks": 0, "loss_rank_avg": 0.27635207772254944, "step": 860, "valid_targets_mean": 4211.1, "valid_targets_min": 840 }, { "epoch": 1.384, "grad_norm": 0.42662571052348236, "learning_rate": 3.8855536330870354e-05, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.27323490381240845, "step": 865, "valid_targets_mean": 5150.4, "valid_targets_min": 851 }, { "epoch": 1.392, "grad_norm": 0.43724344437427815, "learning_rate": 3.882878018035173e-05, "loss": 0.2682, "loss_nan_ranks": 0, "loss_rank_avg": 0.298825204372406, "step": 870, "valid_targets_mean": 4823.4, "valid_targets_min": 648 }, { "epoch": 1.4, "grad_norm": 0.4513041544448632, "learning_rate": 3.880172429961232e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.2363213747739792, "step": 875, "valid_targets_mean": 4356.6, "valid_targets_min": 676 }, { "epoch": 1.408, "grad_norm": 0.4023862024488909, "learning_rate": 3.877436911934733e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.26997482776641846, "step": 880, "valid_targets_mean": 5533.5, "valid_targets_min": 904 }, { "epoch": 1.416, "grad_norm": 0.7080890847938507, "learning_rate": 3.874671507501641e-05, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.3377278745174408, "step": 885, "valid_targets_mean": 2200.1, "valid_targets_min": 912 }, { "epoch": 1.424, "grad_norm": 0.5267587721617124, "learning_rate": 3.871876260683677e-05, "loss": 0.2809, "loss_nan_ranks": 0, "loss_rank_avg": 0.2512984275817871, "step": 890, "valid_targets_mean": 3473.6, "valid_targets_min": 810 }, { "epoch": 1.432, "grad_norm": 0.5790695758130487, "learning_rate": 3.869051215977612e-05, "loss": 0.2884, "loss_nan_ranks": 0, "loss_rank_avg": 0.32350438833236694, "step": 895, "valid_targets_mean": 3247.3, "valid_targets_min": 822 }, { "epoch": 1.44, "grad_norm": 0.4803005137644847, "learning_rate": 3.8661964183545634e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.27841246128082275, "step": 900, "valid_targets_mean": 4475.9, "valid_targets_min": 948 }, { "epoch": 1.448, "grad_norm": 0.475901655735222, "learning_rate": 3.863311913259276e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.33764156699180603, "step": 905, "valid_targets_mean": 5242.4, "valid_targets_min": 826 }, { "epoch": 1.456, "grad_norm": 0.748149672688827, "learning_rate": 3.860397746609402e-05, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.31807559728622437, "step": 910, "valid_targets_mean": 2950.9, "valid_targets_min": 816 }, { "epoch": 1.464, "grad_norm": 0.37580443450106377, "learning_rate": 3.857453964794764e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.2712574005126953, "step": 915, "valid_targets_mean": 6658.7, "valid_targets_min": 1186 }, { "epoch": 1.472, "grad_norm": 0.45030105000964843, "learning_rate": 3.854480614676624e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.272754043340683, "step": 920, "valid_targets_mean": 3925.5, "valid_targets_min": 788 }, { "epoch": 1.48, "grad_norm": 0.34923108926716045, "learning_rate": 3.851477743586932e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.2357773333787918, "step": 925, "valid_targets_mean": 6845.4, "valid_targets_min": 998 }, { "epoch": 1.488, "grad_norm": 0.5115811479757503, "learning_rate": 3.8484453993275746e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.23984485864639282, "step": 930, "valid_targets_mean": 3133.7, "valid_targets_min": 774 }, { "epoch": 1.496, "grad_norm": 0.48452858019317047, "learning_rate": 3.8453836301696134e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.2921665608882904, "step": 935, "valid_targets_mean": 3872.1, "valid_targets_min": 830 }, { "epoch": 1.504, "grad_norm": 0.5141883495932179, "learning_rate": 3.842292484852518e-05, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.2862679958343506, "step": 940, "valid_targets_mean": 4214.1, "valid_targets_min": 898 }, { "epoch": 1.512, "grad_norm": 0.46283592158032705, "learning_rate": 3.8391720125833875e-05, "loss": 0.282, "loss_nan_ranks": 0, "loss_rank_avg": 0.2581455707550049, "step": 945, "valid_targets_mean": 3914.6, "valid_targets_min": 987 }, { "epoch": 1.52, "grad_norm": 0.48706765716515343, "learning_rate": 3.83602226303617e-05, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.2788928747177124, "step": 950, "valid_targets_mean": 4213.4, "valid_targets_min": 839 }, { "epoch": 1.528, "grad_norm": 0.585464765294358, "learning_rate": 3.83284328635087e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.2879747152328491, "step": 955, "valid_targets_mean": 3057.9, "valid_targets_min": 932 }, { "epoch": 1.536, "grad_norm": 0.5315853015293113, "learning_rate": 3.829635133132751e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.2610795199871063, "step": 960, "valid_targets_mean": 3284.8, "valid_targets_min": 733 }, { "epoch": 1.544, "grad_norm": 0.5296944336561442, "learning_rate": 3.8263978544515304e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.26374924182891846, "step": 965, "valid_targets_mean": 3174.6, "valid_targets_min": 824 }, { "epoch": 1.552, "grad_norm": 0.4659744673324122, "learning_rate": 3.823131501840565e-05, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.27271947264671326, "step": 970, "valid_targets_mean": 3992.8, "valid_targets_min": 786 }, { "epoch": 1.56, "grad_norm": 0.41130937508304954, "learning_rate": 3.819836127296032e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.26125800609588623, "step": 975, "valid_targets_mean": 4572.8, "valid_targets_min": 587 }, { "epoch": 1.568, "grad_norm": 0.5146658247796757, "learning_rate": 3.8165117832761016e-05, "loss": 0.2861, "loss_nan_ranks": 0, "loss_rank_avg": 0.3052479326725006, "step": 980, "valid_targets_mean": 3267.8, "valid_targets_min": 963 }, { "epoch": 1.576, "grad_norm": 0.5707618643836874, "learning_rate": 3.813158522700098e-05, "loss": 0.2592, "loss_nan_ranks": 0, "loss_rank_avg": 0.3040449619293213, "step": 985, "valid_targets_mean": 3492.4, "valid_targets_min": 995 }, { "epoch": 1.584, "grad_norm": 0.45611771016792524, "learning_rate": 3.809776398947665e-05, "loss": 0.2721, "loss_nan_ranks": 0, "loss_rank_avg": 0.2837957441806793, "step": 990, "valid_targets_mean": 4701.9, "valid_targets_min": 1074 }, { "epoch": 1.592, "grad_norm": 0.4630680235085982, "learning_rate": 3.806365465857908e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.2922239601612091, "step": 995, "valid_targets_mean": 3976.1, "valid_targets_min": 918 }, { "epoch": 1.6, "grad_norm": 0.399096117534781, "learning_rate": 3.802925777728541e-05, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.2673601806163788, "step": 1000, "valid_targets_mean": 5512.1, "valid_targets_min": 840 }, { "epoch": 1.608, "grad_norm": 0.41627336969619316, "learning_rate": 3.799457389315023e-05, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.2412080317735672, "step": 1005, "valid_targets_mean": 4379.9, "valid_targets_min": 1023 }, { "epoch": 1.616, "grad_norm": 0.440295852006296, "learning_rate": 3.795960355829683e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.2329067587852478, "step": 1010, "valid_targets_mean": 4429.0, "valid_targets_min": 1099 }, { "epoch": 1.624, "grad_norm": 0.5318475478532778, "learning_rate": 3.7924347329408444e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.2775961756706238, "step": 1015, "valid_targets_mean": 2742.1, "valid_targets_min": 857 }, { "epoch": 1.6320000000000001, "grad_norm": 0.4161727759675333, "learning_rate": 3.788880576771937e-05, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.24313268065452576, "step": 1020, "valid_targets_mean": 5492.8, "valid_targets_min": 978 }, { "epoch": 1.6400000000000001, "grad_norm": 0.7999546972605147, "learning_rate": 3.785297943900605e-05, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.28334081172943115, "step": 1025, "valid_targets_mean": 5762.0, "valid_targets_min": 852 }, { "epoch": 1.6480000000000001, "grad_norm": 0.48331284388571666, "learning_rate": 3.7816868913578044e-05, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.2545091509819031, "step": 1030, "valid_targets_mean": 3178.3, "valid_targets_min": 728 }, { "epoch": 1.6560000000000001, "grad_norm": 0.45991402061064773, "learning_rate": 3.778047476626897e-05, "loss": 0.2936, "loss_nan_ranks": 0, "loss_rank_avg": 0.25272148847579956, "step": 1035, "valid_targets_mean": 4338.1, "valid_targets_min": 1049 }, { "epoch": 1.6640000000000001, "grad_norm": 0.3451764939977074, "learning_rate": 3.7743797576427335e-05, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.2401534467935562, "step": 1040, "valid_targets_mean": 6253.1, "valid_targets_min": 712 }, { "epoch": 1.6720000000000002, "grad_norm": 0.4111940706574221, "learning_rate": 3.770683792790733e-05, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.2934751510620117, "step": 1045, "valid_targets_mean": 4744.1, "valid_targets_min": 1059 }, { "epoch": 1.6800000000000002, "grad_norm": 0.4087263278002059, "learning_rate": 3.766959640905954e-05, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.2707015872001648, "step": 1050, "valid_targets_mean": 5591.9, "valid_targets_min": 710 }, { "epoch": 1.688, "grad_norm": 0.5089485422227342, "learning_rate": 3.763207361272153e-05, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.27094948291778564, "step": 1055, "valid_targets_mean": 3115.1, "valid_targets_min": 787 }, { "epoch": 1.696, "grad_norm": 0.39668167250416864, "learning_rate": 3.759427013620849e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.23788487911224365, "step": 1060, "valid_targets_mean": 4781.2, "valid_targets_min": 1059 }, { "epoch": 1.704, "grad_norm": 0.4307058651279445, "learning_rate": 3.755618658130366e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.2379121482372284, "step": 1065, "valid_targets_mean": 3575.8, "valid_targets_min": 730 }, { "epoch": 1.712, "grad_norm": 0.6248314289543657, "learning_rate": 3.751782355424877e-05, "loss": 0.3129, "loss_nan_ranks": 0, "loss_rank_avg": 0.33632132411003113, "step": 1070, "valid_targets_mean": 2413.9, "valid_targets_min": 919 }, { "epoch": 1.72, "grad_norm": 0.3832687956684591, "learning_rate": 3.7479181665734395e-05, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.27428677678108215, "step": 1075, "valid_targets_mean": 5823.8, "valid_targets_min": 795 }, { "epoch": 1.728, "grad_norm": 0.4146423424953804, "learning_rate": 3.7440261530890213e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.24523381888866425, "step": 1080, "valid_targets_mean": 5357.3, "valid_targets_min": 1045 }, { "epoch": 1.736, "grad_norm": 0.4881475237391791, "learning_rate": 3.740106376927527e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.25967293977737427, "step": 1085, "valid_targets_mean": 3166.9, "valid_targets_min": 756 }, { "epoch": 1.744, "grad_norm": 0.4001288366939507, "learning_rate": 3.7361589004868035e-05, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.2417476922273636, "step": 1090, "valid_targets_mean": 4840.1, "valid_targets_min": 693 }, { "epoch": 1.752, "grad_norm": 0.4845852844999974, "learning_rate": 3.7321837866056535e-05, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.28427213430404663, "step": 1095, "valid_targets_mean": 3742.1, "valid_targets_min": 993 }, { "epoch": 1.76, "grad_norm": 0.44706609607667686, "learning_rate": 3.728181098562831e-05, "loss": 0.2547, "loss_nan_ranks": 0, "loss_rank_avg": 0.23905465006828308, "step": 1100, "valid_targets_mean": 4081.2, "valid_targets_min": 888 }, { "epoch": 1.768, "grad_norm": 0.4606642272123344, "learning_rate": 3.7241509000760355e-05, "loss": 0.2919, "loss_nan_ranks": 0, "loss_rank_avg": 0.2809835374355316, "step": 1105, "valid_targets_mean": 4572.8, "valid_targets_min": 790 }, { "epoch": 1.776, "grad_norm": 0.44374131291191704, "learning_rate": 3.720093255300899e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.23165518045425415, "step": 1110, "valid_targets_mean": 5182.4, "valid_targets_min": 898 }, { "epoch": 1.784, "grad_norm": 0.39542261654137617, "learning_rate": 3.7160082288299645e-05, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.26467621326446533, "step": 1115, "valid_targets_mean": 6130.7, "valid_targets_min": 1011 }, { "epoch": 1.792, "grad_norm": 0.40912132064625895, "learning_rate": 3.7118958856916534e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.25465548038482666, "step": 1120, "valid_targets_mean": 6377.2, "valid_targets_min": 1032 }, { "epoch": 1.8, "grad_norm": 0.39755902551807576, "learning_rate": 3.707756291349237e-05, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.2527580261230469, "step": 1125, "valid_targets_mean": 5014.4, "valid_targets_min": 1094 }, { "epoch": 1.808, "grad_norm": 0.514457815285411, "learning_rate": 3.703589511699787e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2838781476020813, "step": 1130, "valid_targets_mean": 3433.5, "valid_targets_min": 975 }, { "epoch": 1.8159999999999998, "grad_norm": 0.44550270673299985, "learning_rate": 3.6993956130731355e-05, "loss": 0.2586, "loss_nan_ranks": 0, "loss_rank_avg": 0.2567026615142822, "step": 1135, "valid_targets_mean": 3949.9, "valid_targets_min": 976 }, { "epoch": 1.8239999999999998, "grad_norm": 0.5422815583872076, "learning_rate": 3.6951746622308106e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.2764151692390442, "step": 1140, "valid_targets_mean": 2868.9, "valid_targets_min": 1072 }, { "epoch": 1.8319999999999999, "grad_norm": 0.41869577320813534, "learning_rate": 3.69092672636498e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.28278565406799316, "step": 1145, "valid_targets_mean": 5837.7, "valid_targets_min": 1035 }, { "epoch": 1.8399999999999999, "grad_norm": 0.3757713903865787, "learning_rate": 3.686651873097375e-05, "loss": 0.2985, "loss_nan_ranks": 0, "loss_rank_avg": 0.23112526535987854, "step": 1150, "valid_targets_mean": 6685.0, "valid_targets_min": 932 }, { "epoch": 1.8479999999999999, "grad_norm": 0.4409326357854815, "learning_rate": 3.682350170478223e-05, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.23602645099163055, "step": 1155, "valid_targets_mean": 5068.7, "valid_targets_min": 1197 }, { "epoch": 1.8559999999999999, "grad_norm": 0.40528589174751617, "learning_rate": 3.678021686985153e-05, "loss": 0.2737, "loss_nan_ranks": 0, "loss_rank_avg": 0.2743171453475952, "step": 1160, "valid_targets_mean": 4716.9, "valid_targets_min": 1127 }, { "epoch": 1.8639999999999999, "grad_norm": 0.41676048150188805, "learning_rate": 3.6736664915221144e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.23870986700057983, "step": 1165, "valid_targets_mean": 4469.6, "valid_targets_min": 843 }, { "epoch": 1.8719999999999999, "grad_norm": 0.5284619471071941, "learning_rate": 3.669284653418278e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.29566067457199097, "step": 1170, "valid_targets_mean": 3079.8, "valid_targets_min": 710 }, { "epoch": 1.88, "grad_norm": 0.47907263465195665, "learning_rate": 3.6648762424269306e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.2716890275478363, "step": 1175, "valid_targets_mean": 3397.4, "valid_targets_min": 884 }, { "epoch": 1.888, "grad_norm": 0.41124099809929116, "learning_rate": 3.660441328724365e-05, "loss": 0.2859, "loss_nan_ranks": 0, "loss_rank_avg": 0.26922544836997986, "step": 1180, "valid_targets_mean": 5981.5, "valid_targets_min": 1078 }, { "epoch": 1.896, "grad_norm": 0.46088125238526284, "learning_rate": 3.655979982908764e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.25594204664230347, "step": 1185, "valid_targets_mean": 3616.8, "valid_targets_min": 719 }, { "epoch": 1.904, "grad_norm": 0.4543017272146403, "learning_rate": 3.6514922759990756e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.26674598455429077, "step": 1190, "valid_targets_mean": 3739.4, "valid_targets_min": 1079 }, { "epoch": 1.912, "grad_norm": 0.4192846645781652, "learning_rate": 3.646978279433883e-05, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.2927936911582947, "step": 1195, "valid_targets_mean": 5007.6, "valid_targets_min": 938 }, { "epoch": 1.92, "grad_norm": 0.4436459924254246, "learning_rate": 3.6424380650702685e-05, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.26739734411239624, "step": 1200, "valid_targets_mean": 4250.5, "valid_targets_min": 721 }, { "epoch": 1.928, "grad_norm": 0.4240018692969433, "learning_rate": 3.637871705182667e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.24744366109371185, "step": 1205, "valid_targets_mean": 5123.5, "valid_targets_min": 968 }, { "epoch": 1.936, "grad_norm": 0.36924402152142755, "learning_rate": 3.633279272461717e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.23109649121761322, "step": 1210, "valid_targets_mean": 5121.6, "valid_targets_min": 710 }, { "epoch": 1.944, "grad_norm": 0.3870106636312311, "learning_rate": 3.628660840013102e-05, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.24079151451587677, "step": 1215, "valid_targets_mean": 5143.0, "valid_targets_min": 916 }, { "epoch": 1.952, "grad_norm": 0.47018664339123123, "learning_rate": 3.624016481356392e-05, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.28172844648361206, "step": 1220, "valid_targets_mean": 3450.4, "valid_targets_min": 616 }, { "epoch": 1.96, "grad_norm": 0.46397233622758055, "learning_rate": 3.619346270423866e-05, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.2602039575576782, "step": 1225, "valid_targets_mean": 3486.5, "valid_targets_min": 815 }, { "epoch": 1.968, "grad_norm": 0.43784857356480683, "learning_rate": 3.6146502815593384e-05, "loss": 0.2578, "loss_nan_ranks": 0, "loss_rank_avg": 0.26954376697540283, "step": 1230, "valid_targets_mean": 4244.4, "valid_targets_min": 897 }, { "epoch": 1.976, "grad_norm": 0.3574426307276786, "learning_rate": 3.609928589516977e-05, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.2643759846687317, "step": 1235, "valid_targets_mean": 5850.1, "valid_targets_min": 1066 }, { "epoch": 1.984, "grad_norm": 0.38025251874050797, "learning_rate": 3.6051812694601114e-05, "loss": 0.2714, "loss_nan_ranks": 0, "loss_rank_avg": 0.2867104411125183, "step": 1240, "valid_targets_mean": 6052.6, "valid_targets_min": 796 }, { "epoch": 1.992, "grad_norm": 0.4749876308252262, "learning_rate": 3.6004083969600346e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.2491377741098404, "step": 1245, "valid_targets_mean": 3096.4, "valid_targets_min": 881 }, { "epoch": 2.0, "grad_norm": 0.39416119445325465, "learning_rate": 3.595610047994804e-05, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.21893836557865143, "step": 1250, "valid_targets_mean": 4368.7, "valid_targets_min": 685 }, { "epoch": 2.008, "grad_norm": 0.4997159356103167, "learning_rate": 3.5907862989480285e-05, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.24703270196914673, "step": 1255, "valid_targets_mean": 3216.5, "valid_targets_min": 943 }, { "epoch": 2.016, "grad_norm": 0.537153879112119, "learning_rate": 3.585937226607656e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.24673984944820404, "step": 1260, "valid_targets_mean": 3123.9, "valid_targets_min": 626 }, { "epoch": 2.024, "grad_norm": 0.5137006043744009, "learning_rate": 3.5810629081647476e-05, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.25879064202308655, "step": 1265, "valid_targets_mean": 2930.7, "valid_targets_min": 830 }, { "epoch": 2.032, "grad_norm": 0.39071865921634885, "learning_rate": 3.576163421212249e-05, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.21474619209766388, "step": 1270, "valid_targets_mean": 5110.3, "valid_targets_min": 879 }, { "epoch": 2.04, "grad_norm": 0.42220001994538664, "learning_rate": 3.5712388437437576e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.2964683473110199, "step": 1275, "valid_targets_mean": 5167.3, "valid_targets_min": 918 }, { "epoch": 2.048, "grad_norm": 0.49759776720417487, "learning_rate": 3.566289254152283e-05, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.25483906269073486, "step": 1280, "valid_targets_mean": 3432.9, "valid_targets_min": 850 }, { "epoch": 2.056, "grad_norm": 0.43733797744170083, "learning_rate": 3.56131473122899e-05, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.2655543386936188, "step": 1285, "valid_targets_mean": 4495.1, "valid_targets_min": 973 }, { "epoch": 2.064, "grad_norm": 0.4421965923645115, "learning_rate": 3.556315354161955e-05, "loss": 0.2412, "loss_nan_ranks": 0, "loss_rank_avg": 0.23384560644626617, "step": 1290, "valid_targets_mean": 4117.4, "valid_targets_min": 828 }, { "epoch": 2.072, "grad_norm": 0.3725666055720055, "learning_rate": 3.551291202534899e-05, "loss": 0.2543, "loss_nan_ranks": 0, "loss_rank_avg": 0.2299247682094574, "step": 1295, "valid_targets_mean": 5426.9, "valid_targets_min": 1115 }, { "epoch": 2.08, "grad_norm": 0.6713941175950688, "learning_rate": 3.546242356325922e-05, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.29278409481048584, "step": 1300, "valid_targets_mean": 2013.2, "valid_targets_min": 782 }, { "epoch": 2.088, "grad_norm": 0.557278656484483, "learning_rate": 3.5411688959062323e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.2544538080692291, "step": 1305, "valid_targets_mean": 3579.6, "valid_targets_min": 762 }, { "epoch": 2.096, "grad_norm": 0.3687842744740229, "learning_rate": 3.5360709020388625e-05, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.25263142585754395, "step": 1310, "valid_targets_mean": 6351.1, "valid_targets_min": 905 }, { "epoch": 2.104, "grad_norm": 0.3793263690857251, "learning_rate": 3.530948455877388e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.24786485731601715, "step": 1315, "valid_targets_mean": 5880.1, "valid_targets_min": 910 }, { "epoch": 2.112, "grad_norm": 0.47916929111479617, "learning_rate": 3.525801638964634e-05, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.2757444679737091, "step": 1320, "valid_targets_mean": 3739.0, "valid_targets_min": 685 }, { "epoch": 2.12, "grad_norm": 0.5444709991468958, "learning_rate": 3.520630533231376e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.3086904287338257, "step": 1325, "valid_targets_mean": 3999.2, "valid_targets_min": 974 }, { "epoch": 2.128, "grad_norm": 0.48962862421008274, "learning_rate": 3.5154352209950376e-05, "loss": 0.2585, "loss_nan_ranks": 0, "loss_rank_avg": 0.27979689836502075, "step": 1330, "valid_targets_mean": 3676.9, "valid_targets_min": 825 }, { "epoch": 2.136, "grad_norm": 0.45083380728163236, "learning_rate": 3.510215784958376e-05, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.2559383511543274, "step": 1335, "valid_targets_mean": 4485.2, "valid_targets_min": 779 }, { "epoch": 2.144, "grad_norm": 0.33484746429649287, "learning_rate": 3.5049723082081755e-05, "loss": 0.244, "loss_nan_ranks": 0, "loss_rank_avg": 0.2397380918264389, "step": 1340, "valid_targets_mean": 6896.4, "valid_targets_min": 629 }, { "epoch": 2.152, "grad_norm": 0.5512883869808385, "learning_rate": 3.49970487421391e-05, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.2993601858615875, "step": 1345, "valid_targets_mean": 3205.4, "valid_targets_min": 988 }, { "epoch": 2.16, "grad_norm": 0.42190102820629805, "learning_rate": 3.494413566826427e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.2174837589263916, "step": 1350, "valid_targets_mean": 4768.2, "valid_targets_min": 972 }, { "epoch": 2.168, "grad_norm": 0.5081581527596065, "learning_rate": 3.489098470276608e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.23775967955589294, "step": 1355, "valid_targets_mean": 2642.8, "valid_targets_min": 845 }, { "epoch": 2.176, "grad_norm": 0.40826096131920026, "learning_rate": 3.483759669174024e-05, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.27968931198120117, "step": 1360, "valid_targets_mean": 4708.7, "valid_targets_min": 797 }, { "epoch": 2.184, "grad_norm": 0.4485915411385824, "learning_rate": 3.478397248505598e-05, "loss": 0.2486, "loss_nan_ranks": 0, "loss_rank_avg": 0.2608921527862549, "step": 1365, "valid_targets_mean": 4368.9, "valid_targets_min": 1052 }, { "epoch": 2.192, "grad_norm": 0.5512019565130977, "learning_rate": 3.473011293634241e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.2932088375091553, "step": 1370, "valid_targets_mean": 3872.3, "valid_targets_min": 1022 }, { "epoch": 2.2, "grad_norm": 0.42038314886774936, "learning_rate": 3.467601890297502e-05, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.23290091753005981, "step": 1375, "valid_targets_mean": 3820.8, "valid_targets_min": 862 }, { "epoch": 2.208, "grad_norm": 0.486361040619312, "learning_rate": 3.4621691246061976e-05, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.2654815912246704, "step": 1380, "valid_targets_mean": 2967.8, "valid_targets_min": 748 }, { "epoch": 2.216, "grad_norm": 0.3689995882810626, "learning_rate": 3.456713083043046e-05, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.2481921762228012, "step": 1385, "valid_targets_mean": 6700.3, "valid_targets_min": 766 }, { "epoch": 2.224, "grad_norm": 0.3741844661161578, "learning_rate": 3.451233852461285e-05, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.2775578498840332, "step": 1390, "valid_targets_mean": 6166.1, "valid_targets_min": 1012 }, { "epoch": 2.232, "grad_norm": 0.4690171509050791, "learning_rate": 3.4457315200832935e-05, "loss": 0.2537, "loss_nan_ranks": 0, "loss_rank_avg": 0.27017349004745483, "step": 1395, "valid_targets_mean": 3758.4, "valid_targets_min": 916 }, { "epoch": 2.24, "grad_norm": 0.46502707551837297, "learning_rate": 3.440206173499201e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.24808195233345032, "step": 1400, "valid_targets_mean": 3311.0, "valid_targets_min": 919 }, { "epoch": 2.248, "grad_norm": 0.5358873234497143, "learning_rate": 3.4346579006654945e-05, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.28968346118927, "step": 1405, "valid_targets_mean": 3115.9, "valid_targets_min": 556 }, { "epoch": 2.2560000000000002, "grad_norm": 0.42084243548194467, "learning_rate": 3.4290867899036166e-05, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.22804833948612213, "step": 1410, "valid_targets_mean": 3692.8, "valid_targets_min": 753 }, { "epoch": 2.2640000000000002, "grad_norm": 0.4001618784605517, "learning_rate": 3.4234929298985614e-05, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.23770037293434143, "step": 1415, "valid_targets_mean": 5107.0, "valid_targets_min": 1186 }, { "epoch": 2.2720000000000002, "grad_norm": 0.5080158679760888, "learning_rate": 3.417876409697463e-05, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.20453549921512604, "step": 1420, "valid_targets_mean": 2835.4, "valid_targets_min": 690 }, { "epoch": 2.2800000000000002, "grad_norm": 0.4168243110819609, "learning_rate": 3.412237318708175e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.23663721978664398, "step": 1425, "valid_targets_mean": 4147.2, "valid_targets_min": 957 }, { "epoch": 2.288, "grad_norm": 0.45954399327365, "learning_rate": 3.4065757466978504e-05, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.2507503926753998, "step": 1430, "valid_targets_mean": 3781.1, "valid_targets_min": 808 }, { "epoch": 2.296, "grad_norm": 0.4702539653734292, "learning_rate": 3.400891783791511e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.27482253313064575, "step": 1435, "valid_targets_mean": 3705.0, "valid_targets_min": 1032 }, { "epoch": 2.304, "grad_norm": 0.40026868215420613, "learning_rate": 3.395185520470614e-05, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.24075943231582642, "step": 1440, "valid_targets_mean": 5237.6, "valid_targets_min": 760 }, { "epoch": 2.312, "grad_norm": 0.3905513051922005, "learning_rate": 3.38945704757161e-05, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.22074247896671295, "step": 1445, "valid_targets_mean": 4402.3, "valid_targets_min": 756 }, { "epoch": 2.32, "grad_norm": 0.4882416307667647, "learning_rate": 3.383706456284498e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.2848014533519745, "step": 1450, "valid_targets_mean": 3364.2, "valid_targets_min": 901 }, { "epoch": 2.328, "grad_norm": 0.45445708291864306, "learning_rate": 3.377933838151374e-05, "loss": 0.2603, "loss_nan_ranks": 0, "loss_rank_avg": 0.27066075801849365, "step": 1455, "valid_targets_mean": 3707.1, "valid_targets_min": 1017 }, { "epoch": 2.336, "grad_norm": 0.6608392796917465, "learning_rate": 3.3721392850649714e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.33999860286712646, "step": 1460, "valid_targets_mean": 2394.0, "valid_targets_min": 1063 }, { "epoch": 2.344, "grad_norm": 0.47360622747404885, "learning_rate": 3.3663228892672034e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.2844492197036743, "step": 1465, "valid_targets_mean": 4209.1, "valid_targets_min": 1020 }, { "epoch": 2.352, "grad_norm": 0.37445807515235896, "learning_rate": 3.36048474334769e-05, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.21594926714897156, "step": 1470, "valid_targets_mean": 4527.0, "valid_targets_min": 1016 }, { "epoch": 2.36, "grad_norm": 0.4066613926869203, "learning_rate": 3.3546249402422834e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.2440742552280426, "step": 1475, "valid_targets_mean": 4281.1, "valid_targets_min": 884 }, { "epoch": 2.368, "grad_norm": 0.450872690024147, "learning_rate": 3.3487435732315944e-05, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.23967817425727844, "step": 1480, "valid_targets_mean": 3973.4, "valid_targets_min": 815 }, { "epoch": 2.376, "grad_norm": 0.4373336501281426, "learning_rate": 3.342840735939501e-05, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.28060564398765564, "step": 1485, "valid_targets_mean": 3881.0, "valid_targets_min": 1006 }, { "epoch": 2.384, "grad_norm": 0.41616555215578727, "learning_rate": 3.33691652233166e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.23200851678848267, "step": 1490, "valid_targets_mean": 4087.1, "valid_targets_min": 682 }, { "epoch": 2.392, "grad_norm": 0.4741632763884423, "learning_rate": 3.330971026714016e-05, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.2454630434513092, "step": 1495, "valid_targets_mean": 3751.9, "valid_targets_min": 1012 }, { "epoch": 2.4, "grad_norm": 0.44777751707599694, "learning_rate": 3.325004343731292e-05, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.2585783004760742, "step": 1500, "valid_targets_mean": 4000.0, "valid_targets_min": 897 }, { "epoch": 2.408, "grad_norm": 0.4838887067897237, "learning_rate": 3.3190165683654885e-05, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.27823567390441895, "step": 1505, "valid_targets_mean": 3297.0, "valid_targets_min": 1109 }, { "epoch": 2.416, "grad_norm": 0.42450262258661076, "learning_rate": 3.31300779593437e-05, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.25310438871383667, "step": 1510, "valid_targets_mean": 4192.0, "valid_targets_min": 1057 }, { "epoch": 2.424, "grad_norm": 0.4114223292664404, "learning_rate": 3.306978122089948e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.23483526706695557, "step": 1515, "valid_targets_mean": 4129.9, "valid_targets_min": 785 }, { "epoch": 2.432, "grad_norm": 0.4382457699711022, "learning_rate": 3.300927642816957e-05, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.25855690240859985, "step": 1520, "valid_targets_mean": 3935.2, "valid_targets_min": 765 }, { "epoch": 2.44, "grad_norm": 0.37454574276197367, "learning_rate": 3.294856454431328e-05, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.2558472752571106, "step": 1525, "valid_targets_mean": 4478.7, "valid_targets_min": 845 }, { "epoch": 2.448, "grad_norm": 0.6185855420387542, "learning_rate": 3.288764653578653e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.3244587182998657, "step": 1530, "valid_targets_mean": 2447.6, "valid_targets_min": 946 }, { "epoch": 2.456, "grad_norm": 0.41449538190334706, "learning_rate": 3.2826523372326516e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.22788169980049133, "step": 1535, "valid_targets_mean": 4480.9, "valid_targets_min": 930 }, { "epoch": 2.464, "grad_norm": 0.3844395691586439, "learning_rate": 3.276519602693621e-05, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.2364940345287323, "step": 1540, "valid_targets_mean": 4955.6, "valid_targets_min": 1039 }, { "epoch": 2.472, "grad_norm": 0.37710049485157016, "learning_rate": 3.270366547586892e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.24367119371891022, "step": 1545, "valid_targets_mean": 5767.8, "valid_targets_min": 1061 }, { "epoch": 2.48, "grad_norm": 0.38894525582252293, "learning_rate": 3.2641932698612715e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.23194950819015503, "step": 1550, "valid_targets_mean": 4335.3, "valid_targets_min": 726 }, { "epoch": 2.488, "grad_norm": 0.3982220790804564, "learning_rate": 3.2579998677874855e-05, "loss": 0.2463, "loss_nan_ranks": 0, "loss_rank_avg": 0.23282426595687866, "step": 1555, "valid_targets_mean": 4442.9, "valid_targets_min": 890 }, { "epoch": 2.496, "grad_norm": 0.3920266130118298, "learning_rate": 3.251786439956614e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.22500693798065186, "step": 1560, "valid_targets_mean": 3975.3, "valid_targets_min": 638 }, { "epoch": 2.504, "grad_norm": 0.5374661523331783, "learning_rate": 3.2455530852785206e-05, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.3037063479423523, "step": 1565, "valid_targets_mean": 3909.3, "valid_targets_min": 1022 }, { "epoch": 2.512, "grad_norm": 0.42133581754576677, "learning_rate": 3.239299902980281e-05, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.27413496375083923, "step": 1570, "valid_targets_mean": 4875.9, "valid_targets_min": 1016 }, { "epoch": 2.52, "grad_norm": 0.4540812695017237, "learning_rate": 3.2330269926046e-05, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.3003402054309845, "step": 1575, "valid_targets_mean": 4698.6, "valid_targets_min": 1056 }, { "epoch": 2.528, "grad_norm": 0.48721669960386377, "learning_rate": 3.2267344540082284e-05, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.2769826650619507, "step": 1580, "valid_targets_mean": 3544.6, "valid_targets_min": 959 }, { "epoch": 2.536, "grad_norm": 0.44779354854153475, "learning_rate": 3.220422387360373e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.23960761725902557, "step": 1585, "valid_targets_mean": 4160.4, "valid_targets_min": 1206 }, { "epoch": 2.544, "grad_norm": 0.36624305776785404, "learning_rate": 3.2140908931411026e-05, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.24884971976280212, "step": 1590, "valid_targets_mean": 5886.5, "valid_targets_min": 777 }, { "epoch": 2.552, "grad_norm": 0.4205442975727069, "learning_rate": 3.207740072139748e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.2376871556043625, "step": 1595, "valid_targets_mean": 4554.3, "valid_targets_min": 807 }, { "epoch": 2.56, "grad_norm": 0.4390164861743431, "learning_rate": 3.2013700254532996e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.2751956582069397, "step": 1600, "valid_targets_mean": 3900.7, "valid_targets_min": 722 }, { "epoch": 2.568, "grad_norm": 0.45059040166393205, "learning_rate": 3.194980854484794e-05, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.24145694077014923, "step": 1605, "valid_targets_mean": 3108.7, "valid_targets_min": 1069 }, { "epoch": 2.576, "grad_norm": 0.38498385041200234, "learning_rate": 3.188572660941702e-05, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.25530481338500977, "step": 1610, "valid_targets_mean": 4882.4, "valid_targets_min": 630 }, { "epoch": 2.584, "grad_norm": 0.45078053611552554, "learning_rate": 3.182145546834311e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.23659245669841766, "step": 1615, "valid_targets_mean": 3979.6, "valid_targets_min": 933 }, { "epoch": 2.592, "grad_norm": 0.4873505068621663, "learning_rate": 3.1756996144740994e-05, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.24679982662200928, "step": 1620, "valid_targets_mean": 2844.8, "valid_targets_min": 728 }, { "epoch": 2.6, "grad_norm": 0.375889816303558, "learning_rate": 3.1692349664721074e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.25449809432029724, "step": 1625, "valid_targets_mean": 5291.6, "valid_targets_min": 1192 }, { "epoch": 2.608, "grad_norm": 0.43710999498519076, "learning_rate": 3.1627517057373046e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.2557065486907959, "step": 1630, "valid_targets_mean": 4127.9, "valid_targets_min": 906 }, { "epoch": 2.616, "grad_norm": 0.47479745259245676, "learning_rate": 3.156249935474953e-05, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.2876622974872589, "step": 1635, "valid_targets_mean": 4105.4, "valid_targets_min": 739 }, { "epoch": 2.624, "grad_norm": 0.38433518760476604, "learning_rate": 3.1497297591849614e-05, "loss": 0.2629, "loss_nan_ranks": 0, "loss_rank_avg": 0.25629955530166626, "step": 1640, "valid_targets_mean": 5574.8, "valid_targets_min": 858 }, { "epoch": 2.632, "grad_norm": 0.43299417778940696, "learning_rate": 3.143191280660238e-05, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.23174050450325012, "step": 1645, "valid_targets_mean": 3752.2, "valid_targets_min": 1012 }, { "epoch": 2.64, "grad_norm": 0.4042914030109211, "learning_rate": 3.1366346039850424e-05, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.2770325541496277, "step": 1650, "valid_targets_mean": 4572.9, "valid_targets_min": 955 }, { "epoch": 2.648, "grad_norm": 0.4000943004214781, "learning_rate": 3.130059833533323e-05, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.2539942264556885, "step": 1655, "valid_targets_mean": 4367.9, "valid_targets_min": 851 }, { "epoch": 2.656, "grad_norm": 0.5246478390502145, "learning_rate": 3.123467073967059e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.25003015995025635, "step": 1660, "valid_targets_mean": 2662.1, "valid_targets_min": 935 }, { "epoch": 2.664, "grad_norm": 0.48721529047895606, "learning_rate": 3.116856430234594e-05, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.24807119369506836, "step": 1665, "valid_targets_mean": 2776.6, "valid_targets_min": 830 }, { "epoch": 2.672, "grad_norm": 0.4011766685019322, "learning_rate": 3.110228007568963e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.25203073024749756, "step": 1670, "valid_targets_mean": 4795.0, "valid_targets_min": 1091 }, { "epoch": 2.68, "grad_norm": 0.4108384417120924, "learning_rate": 3.103581911486221e-05, "loss": 0.244, "loss_nan_ranks": 0, "loss_rank_avg": 0.2413668930530548, "step": 1675, "valid_targets_mean": 4554.4, "valid_targets_min": 807 }, { "epoch": 2.6879999999999997, "grad_norm": 0.4318489284689886, "learning_rate": 3.0969182477837604e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.2699677348136902, "step": 1680, "valid_targets_mean": 4299.4, "valid_targets_min": 951 }, { "epoch": 2.6959999999999997, "grad_norm": 0.46195534616572037, "learning_rate": 3.090237122538628e-05, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.2878229022026062, "step": 1685, "valid_targets_mean": 3651.4, "valid_targets_min": 882 }, { "epoch": 2.7039999999999997, "grad_norm": 0.4064409277711358, "learning_rate": 3.0835386421058345e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.252693772315979, "step": 1690, "valid_targets_mean": 4166.9, "valid_targets_min": 1026 }, { "epoch": 2.7119999999999997, "grad_norm": 0.3315855719749269, "learning_rate": 3.0768229131166664e-05, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.22979766130447388, "step": 1695, "valid_targets_mean": 6155.2, "valid_targets_min": 971 }, { "epoch": 2.7199999999999998, "grad_norm": 0.46914934540874326, "learning_rate": 3.070090042476983e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.23643366992473602, "step": 1700, "valid_targets_mean": 3444.9, "valid_targets_min": 850 }, { "epoch": 2.7279999999999998, "grad_norm": 0.6284719316531368, "learning_rate": 3.063340137365517e-05, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.2869764566421509, "step": 1705, "valid_targets_mean": 2083.1, "valid_targets_min": 837 }, { "epoch": 2.7359999999999998, "grad_norm": 0.38536559734095, "learning_rate": 3.0565733052321674e-05, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.25470173358917236, "step": 1710, "valid_targets_mean": 5245.9, "valid_targets_min": 1287 }, { "epoch": 2.7439999999999998, "grad_norm": 0.4111284973330911, "learning_rate": 3.0497896537962924e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.2471093237400055, "step": 1715, "valid_targets_mean": 4554.9, "valid_targets_min": 863 }, { "epoch": 2.752, "grad_norm": 0.340479711041136, "learning_rate": 3.042989291044991e-05, "loss": 0.2501, "loss_nan_ranks": 0, "loss_rank_avg": 0.255589097738266, "step": 1720, "valid_targets_mean": 8342.3, "valid_targets_min": 843 }, { "epoch": 2.76, "grad_norm": 0.4997516270386313, "learning_rate": 3.036172325231383e-05, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.26695573329925537, "step": 1725, "valid_targets_mean": 2913.8, "valid_targets_min": 928 }, { "epoch": 2.768, "grad_norm": 0.4160259337644636, "learning_rate": 3.0293388648728908e-05, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.23652175068855286, "step": 1730, "valid_targets_mean": 4476.8, "valid_targets_min": 982 }, { "epoch": 2.776, "grad_norm": 0.39927985153665424, "learning_rate": 3.022489018749508e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.24088355898857117, "step": 1735, "valid_targets_mean": 3952.5, "valid_targets_min": 1032 }, { "epoch": 2.784, "grad_norm": 0.4550887207976117, "learning_rate": 3.015622895902068e-05, "loss": 0.2423, "loss_nan_ranks": 0, "loss_rank_avg": 0.2190483808517456, "step": 1740, "valid_targets_mean": 3110.4, "valid_targets_min": 1039 }, { "epoch": 2.792, "grad_norm": 0.33861046318017596, "learning_rate": 3.008740605630508e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.24156677722930908, "step": 1745, "valid_targets_mean": 6048.4, "valid_targets_min": 748 }, { "epoch": 2.8, "grad_norm": 0.36617432315449255, "learning_rate": 3.0018422574921337e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.24149316549301147, "step": 1750, "valid_targets_mean": 5241.0, "valid_targets_min": 1079 }, { "epoch": 2.808, "grad_norm": 0.3464726951761244, "learning_rate": 2.9949279612998673e-05, "loss": 0.2423, "loss_nan_ranks": 0, "loss_rank_avg": 0.2470303475856781, "step": 1755, "valid_targets_mean": 6875.5, "valid_targets_min": 1210 }, { "epoch": 2.816, "grad_norm": 0.3450155466545645, "learning_rate": 2.9879978271205064e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.2277037501335144, "step": 1760, "valid_targets_mean": 5934.5, "valid_targets_min": 912 }, { "epoch": 2.824, "grad_norm": 0.4016568882747598, "learning_rate": 2.9810519652729692e-05, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.2241845428943634, "step": 1765, "valid_targets_mean": 4558.4, "valid_targets_min": 973 }, { "epoch": 2.832, "grad_norm": 0.41748302286864053, "learning_rate": 2.9740904863265378e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.263439804315567, "step": 1770, "valid_targets_mean": 4341.7, "valid_targets_min": 1283 }, { "epoch": 2.84, "grad_norm": 0.48850050096135555, "learning_rate": 2.967113501099097e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.23303407430648804, "step": 1775, "valid_targets_mean": 2772.5, "valid_targets_min": 787 }, { "epoch": 2.848, "grad_norm": 0.47900204436253896, "learning_rate": 2.9601211206553745e-05, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.32549360394477844, "step": 1780, "valid_targets_mean": 3978.5, "valid_targets_min": 851 }, { "epoch": 2.856, "grad_norm": 0.39202466712624395, "learning_rate": 2.9531134563051686e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.24673870205879211, "step": 1785, "valid_targets_mean": 4397.2, "valid_targets_min": 789 }, { "epoch": 2.864, "grad_norm": 0.454753156477103, "learning_rate": 2.946090619601579e-05, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.2228916883468628, "step": 1790, "valid_targets_mean": 3641.2, "valid_targets_min": 801 }, { "epoch": 2.872, "grad_norm": 0.5239133569031957, "learning_rate": 2.9390527223392292e-05, "loss": 0.2483, "loss_nan_ranks": 0, "loss_rank_avg": 0.26477718353271484, "step": 1795, "valid_targets_mean": 2819.3, "valid_targets_min": 764 }, { "epoch": 2.88, "grad_norm": 0.43565748091817924, "learning_rate": 2.931999876552488e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930182218551636, "step": 1800, "valid_targets_mean": 4048.8, "valid_targets_min": 1123 }, { "epoch": 2.888, "grad_norm": 0.4126016381922162, "learning_rate": 2.9249321945136854e-05, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.26448121666908264, "step": 1805, "valid_targets_mean": 4604.4, "valid_targets_min": 948 }, { "epoch": 2.896, "grad_norm": 0.4216543598725713, "learning_rate": 2.9178497887313257e-05, "loss": 0.2589, "loss_nan_ranks": 0, "loss_rank_avg": 0.27048546075820923, "step": 1810, "valid_targets_mean": 4440.7, "valid_targets_min": 926 }, { "epoch": 2.904, "grad_norm": 0.339972934761611, "learning_rate": 2.9107527719482968e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.24039791524410248, "step": 1815, "valid_targets_mean": 5725.7, "valid_targets_min": 1038 }, { "epoch": 2.912, "grad_norm": 0.4284574874009162, "learning_rate": 2.9036412571400747e-05, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.25202876329421997, "step": 1820, "valid_targets_mean": 3956.6, "valid_targets_min": 841 }, { "epoch": 2.92, "grad_norm": 0.3887923193278144, "learning_rate": 2.8965153575129255e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.26022517681121826, "step": 1825, "valid_targets_mean": 5180.9, "valid_targets_min": 1022 }, { "epoch": 2.928, "grad_norm": 0.42207586149145204, "learning_rate": 2.8893751865021044e-05, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.24122312664985657, "step": 1830, "valid_targets_mean": 3972.8, "valid_targets_min": 946 }, { "epoch": 2.936, "grad_norm": 0.38545070788876795, "learning_rate": 2.8822208577700473e-05, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.2604748606681824, "step": 1835, "valid_targets_mean": 4398.5, "valid_targets_min": 782 }, { "epoch": 2.944, "grad_norm": 0.5068190010044846, "learning_rate": 2.8750524852045642e-05, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.26114439964294434, "step": 1840, "valid_targets_mean": 2930.1, "valid_targets_min": 790 }, { "epoch": 2.952, "grad_norm": 0.38331449055182676, "learning_rate": 2.867870182917024e-05, "loss": 0.244, "loss_nan_ranks": 0, "loss_rank_avg": 0.23407770693302155, "step": 1845, "valid_targets_mean": 4040.6, "valid_targets_min": 758 }, { "epoch": 2.96, "grad_norm": 0.40079080583130816, "learning_rate": 2.8606740652405394e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.2599574327468872, "step": 1850, "valid_targets_mean": 4798.5, "valid_targets_min": 934 }, { "epoch": 2.968, "grad_norm": 0.3479930057967736, "learning_rate": 2.853464246728147e-05, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.23751023411750793, "step": 1855, "valid_targets_mean": 5672.2, "valid_targets_min": 832 }, { "epoch": 2.976, "grad_norm": 0.3369578047927962, "learning_rate": 2.846240842150984e-05, "loss": 0.2385, "loss_nan_ranks": 0, "loss_rank_avg": 0.20889130234718323, "step": 1860, "valid_targets_mean": 5308.2, "valid_targets_min": 788 }, { "epoch": 2.984, "grad_norm": 0.4291039444647585, "learning_rate": 2.839003966496458e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.2270471304655075, "step": 1865, "valid_targets_mean": 3958.4, "valid_targets_min": 897 }, { "epoch": 2.992, "grad_norm": 0.43281841130812354, "learning_rate": 2.8317537349664215e-05, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.2587190866470337, "step": 1870, "valid_targets_mean": 4151.9, "valid_targets_min": 950 }, { "epoch": 3.0, "grad_norm": 0.3978270265787385, "learning_rate": 2.824490262975334e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.2422841191291809, "step": 1875, "valid_targets_mean": 4473.6, "valid_targets_min": 931 }, { "epoch": 3.008, "grad_norm": 0.3686194912968534, "learning_rate": 2.817213666148427e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.20717495679855347, "step": 1880, "valid_targets_mean": 4454.7, "valid_targets_min": 1031 }, { "epoch": 3.016, "grad_norm": 0.4391451892820445, "learning_rate": 2.809924060319862e-05, "loss": 0.2248, "loss_nan_ranks": 0, "loss_rank_avg": 0.2463517189025879, "step": 1885, "valid_targets_mean": 4455.8, "valid_targets_min": 850 }, { "epoch": 3.024, "grad_norm": 0.37945227439492357, "learning_rate": 2.802621561530888e-05, "loss": 0.2377, "loss_nan_ranks": 0, "loss_rank_avg": 0.23665887117385864, "step": 1890, "valid_targets_mean": 4614.1, "valid_targets_min": 801 }, { "epoch": 3.032, "grad_norm": 0.5047817941563999, "learning_rate": 2.7953062860279937e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.24539366364479065, "step": 1895, "valid_targets_mean": 2838.2, "valid_targets_min": 945 }, { "epoch": 3.04, "grad_norm": 0.640395323678212, "learning_rate": 2.7879783502610557e-05, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.33286240696907043, "step": 1900, "valid_targets_mean": 2273.1, "valid_targets_min": 937 }, { "epoch": 3.048, "grad_norm": 0.42850604085756194, "learning_rate": 2.7806378708814875e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.24500463902950287, "step": 1905, "valid_targets_mean": 4063.4, "valid_targets_min": 1026 }, { "epoch": 3.056, "grad_norm": 0.4303493596218602, "learning_rate": 2.773284964740379e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.23514248430728912, "step": 1910, "valid_targets_mean": 3806.9, "valid_targets_min": 1057 }, { "epoch": 3.064, "grad_norm": 0.5376670517442778, "learning_rate": 2.7659197488866403e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.24571284651756287, "step": 1915, "valid_targets_mean": 2978.4, "valid_targets_min": 835 }, { "epoch": 3.072, "grad_norm": 0.4856549540142223, "learning_rate": 2.7585423405651347e-05, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.2590499818325043, "step": 1920, "valid_targets_mean": 3158.0, "valid_targets_min": 817 }, { "epoch": 3.08, "grad_norm": 0.41265678997745975, "learning_rate": 2.7511528572148153e-05, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.24581827223300934, "step": 1925, "valid_targets_mean": 3845.9, "valid_targets_min": 779 }, { "epoch": 3.088, "grad_norm": 0.39148774769841904, "learning_rate": 2.7437514164668536e-05, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.2122671902179718, "step": 1930, "valid_targets_mean": 4021.6, "valid_targets_min": 857 }, { "epoch": 3.096, "grad_norm": 0.42384683209642465, "learning_rate": 2.7363381361427692e-05, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.2753984332084656, "step": 1935, "valid_targets_mean": 4518.8, "valid_targets_min": 996 }, { "epoch": 3.104, "grad_norm": 0.5156696168531341, "learning_rate": 2.72891313425255e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.2671349346637726, "step": 1940, "valid_targets_mean": 3111.5, "valid_targets_min": 856 }, { "epoch": 3.112, "grad_norm": 0.40374314761107644, "learning_rate": 2.7214765289927777e-05, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.22792913019657135, "step": 1945, "valid_targets_mean": 4236.8, "valid_targets_min": 1042 }, { "epoch": 3.12, "grad_norm": 0.41400421213473976, "learning_rate": 2.714028438744746e-05, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.28113529086112976, "step": 1950, "valid_targets_mean": 4941.1, "valid_targets_min": 945 }, { "epoch": 3.128, "grad_norm": 0.3753847058592898, "learning_rate": 2.706568982072573e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.22099116444587708, "step": 1955, "valid_targets_mean": 4709.8, "valid_targets_min": 898 }, { "epoch": 3.136, "grad_norm": 0.4414960074804987, "learning_rate": 2.6990982777213174e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.24348290264606476, "step": 1960, "valid_targets_mean": 4199.9, "valid_targets_min": 833 }, { "epoch": 3.144, "grad_norm": 0.39031860273125923, "learning_rate": 2.691616444615085e-05, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.2442023903131485, "step": 1965, "valid_targets_mean": 4948.6, "valid_targets_min": 662 }, { "epoch": 3.152, "grad_norm": 0.42869791654686545, "learning_rate": 2.6841236018551402e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.24929338693618774, "step": 1970, "valid_targets_mean": 4449.2, "valid_targets_min": 1184 }, { "epoch": 3.16, "grad_norm": 0.3724581951765585, "learning_rate": 2.6766198687180028e-05, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.2496282011270523, "step": 1975, "valid_targets_mean": 5392.3, "valid_targets_min": 909 }, { "epoch": 3.168, "grad_norm": 0.3179361729676042, "learning_rate": 2.6691053646535564e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.20636862516403198, "step": 1980, "valid_targets_mean": 6938.2, "valid_targets_min": 787 }, { "epoch": 3.176, "grad_norm": 0.46664739794355814, "learning_rate": 2.6615802092831446e-05, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.22112616896629333, "step": 1985, "valid_targets_mean": 2945.5, "valid_targets_min": 884 }, { "epoch": 3.184, "grad_norm": 0.4339184924410943, "learning_rate": 2.6540445223976637e-05, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.2532888352870941, "step": 1990, "valid_targets_mean": 4107.5, "valid_targets_min": 1002 }, { "epoch": 3.192, "grad_norm": 0.3729189208408062, "learning_rate": 2.6464984239556602e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.24716854095458984, "step": 1995, "valid_targets_mean": 5853.9, "valid_targets_min": 932 }, { "epoch": 3.2, "grad_norm": 0.3663312807394943, "learning_rate": 2.63894203408142e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.2260250449180603, "step": 2000, "valid_targets_mean": 5386.6, "valid_targets_min": 760 }, { "epoch": 3.208, "grad_norm": 0.43597269696745533, "learning_rate": 2.6313754730630528e-05, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.23965974152088165, "step": 2005, "valid_targets_mean": 3921.7, "valid_targets_min": 1011 }, { "epoch": 3.216, "grad_norm": 0.38031686943560017, "learning_rate": 2.623798861350582e-05, "loss": 0.2377, "loss_nan_ranks": 0, "loss_rank_avg": 0.2457212209701538, "step": 2010, "valid_targets_mean": 5434.2, "valid_targets_min": 793 }, { "epoch": 3.224, "grad_norm": 0.37852046127420746, "learning_rate": 2.6162123195540247e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.24134644865989685, "step": 2015, "valid_targets_mean": 4507.3, "valid_targets_min": 965 }, { "epoch": 3.232, "grad_norm": 0.3774539132405667, "learning_rate": 2.6086159684414726e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.20981399714946747, "step": 2020, "valid_targets_mean": 5689.2, "valid_targets_min": 983 }, { "epoch": 3.24, "grad_norm": 0.5876396358898935, "learning_rate": 2.6010099289371694e-05, "loss": 0.2517, "loss_nan_ranks": 0, "loss_rank_avg": 0.24734702706336975, "step": 2025, "valid_targets_mean": 3616.8, "valid_targets_min": 962 }, { "epoch": 3.248, "grad_norm": 0.41025472682008307, "learning_rate": 2.5933943221195844e-05, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.2263985127210617, "step": 2030, "valid_targets_mean": 4079.0, "valid_targets_min": 976 }, { "epoch": 3.2560000000000002, "grad_norm": 0.3585820544990285, "learning_rate": 2.5857692692194884e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.24530109763145447, "step": 2035, "valid_targets_mean": 5752.3, "valid_targets_min": 902 }, { "epoch": 3.2640000000000002, "grad_norm": 0.4016499873533317, "learning_rate": 2.5781348916180195e-05, "loss": 0.2618, "loss_nan_ranks": 0, "loss_rank_avg": 0.26491880416870117, "step": 2040, "valid_targets_mean": 4694.8, "valid_targets_min": 918 }, { "epoch": 3.2720000000000002, "grad_norm": 0.40307560980296747, "learning_rate": 2.570491310844755e-05, "loss": 0.2409, "loss_nan_ranks": 0, "loss_rank_avg": 0.2063388228416443, "step": 2045, "valid_targets_mean": 3911.2, "valid_targets_min": 688 }, { "epoch": 3.2800000000000002, "grad_norm": 0.44852837331808115, "learning_rate": 2.562838648575774e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.21985195577144623, "step": 2050, "valid_targets_mean": 3346.2, "valid_targets_min": 963 }, { "epoch": 3.288, "grad_norm": 0.4285370827323687, "learning_rate": 2.5551770266317224e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.24515582621097565, "step": 2055, "valid_targets_mean": 4142.2, "valid_targets_min": 830 }, { "epoch": 3.296, "grad_norm": 0.3469454440141706, "learning_rate": 2.5475065669758713e-05, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.2313218116760254, "step": 2060, "valid_targets_mean": 6451.2, "valid_targets_min": 1134 }, { "epoch": 3.304, "grad_norm": 0.4660419550497371, "learning_rate": 2.5398273917121786e-05, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.23948527872562408, "step": 2065, "valid_targets_mean": 3834.3, "valid_targets_min": 840 }, { "epoch": 3.312, "grad_norm": 0.46020726031423426, "learning_rate": 2.532139623083342e-05, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.22267141938209534, "step": 2070, "valid_targets_mean": 3291.5, "valid_targets_min": 709 }, { "epoch": 3.32, "grad_norm": 0.4066475864337174, "learning_rate": 2.5244433834688552e-05, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.24701744318008423, "step": 2075, "valid_targets_mean": 4166.8, "valid_targets_min": 1174 }, { "epoch": 3.328, "grad_norm": 0.3389260313456441, "learning_rate": 2.5167387953830602e-05, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.2435072362422943, "step": 2080, "valid_targets_mean": 6527.8, "valid_targets_min": 881 }, { "epoch": 3.336, "grad_norm": 0.44452524791300885, "learning_rate": 2.5090259814731946e-05, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.23047269880771637, "step": 2085, "valid_targets_mean": 4016.4, "valid_targets_min": 882 }, { "epoch": 3.344, "grad_norm": 0.5236654293524927, "learning_rate": 2.5013050645174414e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.25171908736228943, "step": 2090, "valid_targets_mean": 2928.3, "valid_targets_min": 945 }, { "epoch": 3.352, "grad_norm": 0.46686168548498463, "learning_rate": 2.4935761674229735e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.25355401635169983, "step": 2095, "valid_targets_mean": 3444.8, "valid_targets_min": 788 }, { "epoch": 3.36, "grad_norm": 0.4658436781904886, "learning_rate": 2.4858394132239982e-05, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.24720919132232666, "step": 2100, "valid_targets_mean": 3369.1, "valid_targets_min": 870 }, { "epoch": 3.368, "grad_norm": 0.41610717299525096, "learning_rate": 2.4780949250797964e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.25919485092163086, "step": 2105, "valid_targets_mean": 4384.9, "valid_targets_min": 895 }, { "epoch": 3.376, "grad_norm": 0.3776558528507944, "learning_rate": 2.4703428262727656e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.2172096073627472, "step": 2110, "valid_targets_mean": 4115.6, "valid_targets_min": 758 }, { "epoch": 3.384, "grad_norm": 0.4332689527083962, "learning_rate": 2.4625832402064525e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.24866342544555664, "step": 2115, "valid_targets_mean": 4320.1, "valid_targets_min": 908 }, { "epoch": 3.392, "grad_norm": 0.34298883302266486, "learning_rate": 2.454816290403595e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.2340373992919922, "step": 2120, "valid_targets_mean": 5510.9, "valid_targets_min": 914 }, { "epoch": 3.4, "grad_norm": 0.39746900839974997, "learning_rate": 2.4470421005041492e-05, "loss": 0.2437, "loss_nan_ranks": 0, "loss_rank_avg": 0.27413320541381836, "step": 2125, "valid_targets_mean": 4856.7, "valid_targets_min": 1080 }, { "epoch": 3.408, "grad_norm": 0.3693795848606551, "learning_rate": 2.4392607942633263e-05, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.20374570786952972, "step": 2130, "valid_targets_mean": 4384.4, "valid_targets_min": 682 }, { "epoch": 3.416, "grad_norm": 0.6248740105863385, "learning_rate": 2.43147249554962e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.27008944749832153, "step": 2135, "valid_targets_mean": 2089.4, "valid_targets_min": 819 }, { "epoch": 3.424, "grad_norm": 0.4780329930048178, "learning_rate": 2.423677328342835e-05, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.22337397933006287, "step": 2140, "valid_targets_mean": 3094.6, "valid_targets_min": 780 }, { "epoch": 3.432, "grad_norm": 0.3654477042526744, "learning_rate": 2.415875416732113e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.2606598734855652, "step": 2145, "valid_targets_mean": 5555.8, "valid_targets_min": 774 }, { "epoch": 3.44, "grad_norm": 0.36116589317728864, "learning_rate": 2.4080668849139603e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.23566177487373352, "step": 2150, "valid_targets_mean": 5559.3, "valid_targets_min": 682 }, { "epoch": 3.448, "grad_norm": 0.4284496251086486, "learning_rate": 2.4002518571902665e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.27861011028289795, "step": 2155, "valid_targets_mean": 5020.9, "valid_targets_min": 1002 }, { "epoch": 3.456, "grad_norm": 0.3785079045493894, "learning_rate": 2.392430457966328e-05, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.21359242498874664, "step": 2160, "valid_targets_mean": 4796.9, "valid_targets_min": 778 }, { "epoch": 3.464, "grad_norm": 0.3289768949204519, "learning_rate": 2.3846028117488686e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.23382601141929626, "step": 2165, "valid_targets_mean": 6570.4, "valid_targets_min": 1014 }, { "epoch": 3.472, "grad_norm": 0.3147676115980224, "learning_rate": 2.3767690431440533e-05, "loss": 0.2402, "loss_nan_ranks": 0, "loss_rank_avg": 0.2314678281545639, "step": 2170, "valid_targets_mean": 7406.5, "valid_targets_min": 1083 }, { "epoch": 3.48, "grad_norm": 0.3671848999318846, "learning_rate": 2.368929276855512e-05, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.24486009776592255, "step": 2175, "valid_targets_mean": 4844.6, "valid_targets_min": 952 }, { "epoch": 3.488, "grad_norm": 0.39604902765788624, "learning_rate": 2.361083637682347e-05, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.23706820607185364, "step": 2180, "valid_targets_mean": 4694.9, "valid_targets_min": 744 }, { "epoch": 3.496, "grad_norm": 0.5655798668270807, "learning_rate": 2.3532322505171502e-05, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.27846089005470276, "step": 2185, "valid_targets_mean": 2487.4, "valid_targets_min": 670 }, { "epoch": 3.504, "grad_norm": 0.37720888972750033, "learning_rate": 2.3453752403440147e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.2432319074869156, "step": 2190, "valid_targets_mean": 4674.2, "valid_targets_min": 1020 }, { "epoch": 3.512, "grad_norm": 0.38338363036309026, "learning_rate": 2.337512732236545e-05, "loss": 0.2537, "loss_nan_ranks": 0, "loss_rank_avg": 0.2563523054122925, "step": 2195, "valid_targets_mean": 4757.8, "valid_targets_min": 859 }, { "epoch": 3.52, "grad_norm": 0.3383403543256627, "learning_rate": 2.3296448513558628e-05, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.230048269033432, "step": 2200, "valid_targets_mean": 6312.8, "valid_targets_min": 906 }, { "epoch": 3.528, "grad_norm": 0.42174030998567286, "learning_rate": 2.321771722948622e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.23159737884998322, "step": 2205, "valid_targets_mean": 3522.6, "valid_targets_min": 777 }, { "epoch": 3.536, "grad_norm": 0.3441421244493924, "learning_rate": 2.3138934723450074e-05, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.23105758428573608, "step": 2210, "valid_targets_mean": 5247.6, "valid_targets_min": 639 }, { "epoch": 3.544, "grad_norm": 0.4237690704094179, "learning_rate": 2.306010224956744e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.20057953894138336, "step": 2215, "valid_targets_mean": 3344.2, "valid_targets_min": 777 }, { "epoch": 3.552, "grad_norm": 0.40314828900451494, "learning_rate": 2.2981221062750986e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.23921722173690796, "step": 2220, "valid_targets_mean": 4463.3, "valid_targets_min": 897 }, { "epoch": 3.56, "grad_norm": 0.35913421571712756, "learning_rate": 2.290229241868882e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.22847603261470795, "step": 2225, "valid_targets_mean": 4817.8, "valid_targets_min": 973 }, { "epoch": 3.568, "grad_norm": 0.4300249539977357, "learning_rate": 2.282331757382454e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.2206239104270935, "step": 2230, "valid_targets_mean": 3468.5, "valid_targets_min": 913 }, { "epoch": 3.576, "grad_norm": 0.44969351210373343, "learning_rate": 2.2744297785337155e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.21605494618415833, "step": 2235, "valid_targets_mean": 3286.3, "valid_targets_min": 842 }, { "epoch": 3.584, "grad_norm": 0.42301687473892546, "learning_rate": 2.2665234311121155e-05, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.23820188641548157, "step": 2240, "valid_targets_mean": 3650.9, "valid_targets_min": 587 }, { "epoch": 3.592, "grad_norm": 0.392543464599928, "learning_rate": 2.258612840976645e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.24136680364608765, "step": 2245, "valid_targets_mean": 4852.1, "valid_targets_min": 1183 }, { "epoch": 3.6, "grad_norm": 0.367395547542587, "learning_rate": 2.2506981340538315e-05, "loss": 0.2661, "loss_nan_ranks": 0, "loss_rank_avg": 0.2347022294998169, "step": 2250, "valid_targets_mean": 5126.2, "valid_targets_min": 765 }, { "epoch": 3.608, "grad_norm": 0.3205045384740095, "learning_rate": 2.2427794363357384e-05, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.2343018651008606, "step": 2255, "valid_targets_mean": 6760.8, "valid_targets_min": 957 }, { "epoch": 3.616, "grad_norm": 0.4272334380835925, "learning_rate": 2.2348568738779566e-05, "loss": 0.2501, "loss_nan_ranks": 0, "loss_rank_avg": 0.23038670420646667, "step": 2260, "valid_targets_mean": 4056.7, "valid_targets_min": 877 }, { "epoch": 3.624, "grad_norm": 0.40730070006221614, "learning_rate": 2.2269305727975993e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.26035311818122864, "step": 2265, "valid_targets_mean": 4897.9, "valid_targets_min": 770 }, { "epoch": 3.632, "grad_norm": 0.39008805670033025, "learning_rate": 2.2190006592712927e-05, "loss": 0.2422, "loss_nan_ranks": 0, "loss_rank_avg": 0.2496114820241928, "step": 2270, "valid_targets_mean": 4502.3, "valid_targets_min": 956 }, { "epoch": 3.64, "grad_norm": 0.4098580625905869, "learning_rate": 2.2110672595331698e-05, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.2622841000556946, "step": 2275, "valid_targets_mean": 4436.5, "valid_targets_min": 1137 }, { "epoch": 3.648, "grad_norm": 0.42996882915875295, "learning_rate": 2.2031304998728587e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.2525962293148041, "step": 2280, "valid_targets_mean": 4247.2, "valid_targets_min": 711 }, { "epoch": 3.656, "grad_norm": 0.3824484509543543, "learning_rate": 2.1951905066334737e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.23063942790031433, "step": 2285, "valid_targets_mean": 4258.1, "valid_targets_min": 959 }, { "epoch": 3.664, "grad_norm": 0.40350526206019344, "learning_rate": 2.1872474062096046e-05, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.23316706717014313, "step": 2290, "valid_targets_mean": 4255.7, "valid_targets_min": 698 }, { "epoch": 3.672, "grad_norm": 0.44596553563121094, "learning_rate": 2.179301325045301e-05, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.26697400212287903, "step": 2295, "valid_targets_mean": 3889.1, "valid_targets_min": 764 }, { "epoch": 3.68, "grad_norm": 0.3479970961360567, "learning_rate": 2.1713523896320647e-05, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.21883633732795715, "step": 2300, "valid_targets_mean": 4919.6, "valid_targets_min": 1008 }, { "epoch": 3.6879999999999997, "grad_norm": 0.35571201991914386, "learning_rate": 2.163400726506832e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.23191869258880615, "step": 2305, "valid_targets_mean": 5307.3, "valid_targets_min": 1096 }, { "epoch": 3.6959999999999997, "grad_norm": 0.3604714079928107, "learning_rate": 2.155446462249961e-05, "loss": 0.247, "loss_nan_ranks": 0, "loss_rank_avg": 0.2559710144996643, "step": 2310, "valid_targets_mean": 5540.6, "valid_targets_min": 728 }, { "epoch": 3.7039999999999997, "grad_norm": 0.32612870359060286, "learning_rate": 2.147489723483217e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.2424880862236023, "step": 2315, "valid_targets_mean": 6959.5, "valid_targets_min": 1094 }, { "epoch": 3.7119999999999997, "grad_norm": 0.41493912008225486, "learning_rate": 2.139530636867757e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.24148619174957275, "step": 2320, "valid_targets_mean": 4001.1, "valid_targets_min": 1041 }, { "epoch": 3.7199999999999998, "grad_norm": 0.4110902151701686, "learning_rate": 2.1315693291021114e-05, "loss": 0.2473, "loss_nan_ranks": 0, "loss_rank_avg": 0.22682532668113708, "step": 2325, "valid_targets_mean": 3857.5, "valid_targets_min": 532 }, { "epoch": 3.7279999999999998, "grad_norm": 0.3771443937450319, "learning_rate": 2.1236059269201686e-05, "loss": 0.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.2078881859779358, "step": 2330, "valid_targets_mean": 3960.9, "valid_targets_min": 1015 }, { "epoch": 3.7359999999999998, "grad_norm": 0.4361587523350003, "learning_rate": 2.1156405570891584e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.240316241979599, "step": 2335, "valid_targets_mean": 3572.1, "valid_targets_min": 996 }, { "epoch": 3.7439999999999998, "grad_norm": 0.4089677660324536, "learning_rate": 2.1076733464076322e-05, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.22675375640392303, "step": 2340, "valid_targets_mean": 3776.9, "valid_targets_min": 874 }, { "epoch": 3.752, "grad_norm": 0.42692556018849953, "learning_rate": 2.0997044217034462e-05, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.2749752402305603, "step": 2345, "valid_targets_mean": 4011.2, "valid_targets_min": 1087 }, { "epoch": 3.76, "grad_norm": 0.3607657231192886, "learning_rate": 2.0917339098317405e-05, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.23275761306285858, "step": 2350, "valid_targets_mean": 5583.9, "valid_targets_min": 887 }, { "epoch": 3.768, "grad_norm": 0.53112047115276, "learning_rate": 2.083761937672922e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.23606562614440918, "step": 2355, "valid_targets_mean": 2382.6, "valid_targets_min": 941 }, { "epoch": 3.776, "grad_norm": 0.44795554427006484, "learning_rate": 2.0757886321306433e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.30794838070869446, "step": 2360, "valid_targets_mean": 4058.8, "valid_targets_min": 709 }, { "epoch": 3.784, "grad_norm": 0.38096232285290094, "learning_rate": 2.0678141201297827e-05, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.2388550341129303, "step": 2365, "valid_targets_mean": 4521.2, "valid_targets_min": 976 }, { "epoch": 3.792, "grad_norm": 0.3677287419628772, "learning_rate": 2.059838528614423e-05, "loss": 0.2483, "loss_nan_ranks": 0, "loss_rank_avg": 0.2527107894420624, "step": 2370, "valid_targets_mean": 4927.9, "valid_targets_min": 717 }, { "epoch": 3.8, "grad_norm": 0.4603649045230554, "learning_rate": 2.0518619845458322e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.2524024546146393, "step": 2375, "valid_targets_mean": 3487.9, "valid_targets_min": 900 }, { "epoch": 3.808, "grad_norm": 0.49340867750085365, "learning_rate": 2.0438846149004426e-05, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.2245899885892868, "step": 2380, "valid_targets_mean": 3973.9, "valid_targets_min": 1047 }, { "epoch": 3.816, "grad_norm": 0.3391628456601482, "learning_rate": 2.0359065466678268e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.22324374318122864, "step": 2385, "valid_targets_mean": 5603.8, "valid_targets_min": 1077 }, { "epoch": 3.824, "grad_norm": 0.4064978135894322, "learning_rate": 2.0279279068486795e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.24098357558250427, "step": 2390, "valid_targets_mean": 4030.3, "valid_targets_min": 836 }, { "epoch": 3.832, "grad_norm": 0.45574421310954694, "learning_rate": 2.019948822452794e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.2887115776538849, "step": 2395, "valid_targets_mean": 3871.5, "valid_targets_min": 593 }, { "epoch": 3.84, "grad_norm": 0.42912425327908477, "learning_rate": 2.0119694204970393e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.2643599510192871, "step": 2400, "valid_targets_mean": 3953.9, "valid_targets_min": 752 }, { "epoch": 3.848, "grad_norm": 0.5452664048943783, "learning_rate": 2.0039898280033414e-05, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.25383543968200684, "step": 2405, "valid_targets_mean": 2670.8, "valid_targets_min": 879 }, { "epoch": 3.856, "grad_norm": 0.35547888248847065, "learning_rate": 1.9960101719966592e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.25882688164711, "step": 2410, "valid_targets_mean": 6267.4, "valid_targets_min": 1061 }, { "epoch": 3.864, "grad_norm": 0.4236770102857227, "learning_rate": 1.9880305795029617e-05, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.23290708661079407, "step": 2415, "valid_targets_mean": 3531.1, "valid_targets_min": 830 }, { "epoch": 3.872, "grad_norm": 0.5053989332284283, "learning_rate": 1.980051177547207e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.2855120897293091, "step": 2420, "valid_targets_mean": 3139.5, "valid_targets_min": 883 }, { "epoch": 3.88, "grad_norm": 0.40363417243530514, "learning_rate": 1.9720720931513212e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508298456668854, "step": 2425, "valid_targets_mean": 4059.1, "valid_targets_min": 614 }, { "epoch": 3.888, "grad_norm": 0.43924888297351233, "learning_rate": 1.9640934533321735e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.2625318765640259, "step": 2430, "valid_targets_mean": 3693.1, "valid_targets_min": 948 }, { "epoch": 3.896, "grad_norm": 0.3419350657709466, "learning_rate": 1.9561153850995577e-05, "loss": 0.2407, "loss_nan_ranks": 0, "loss_rank_avg": 0.21997395157814026, "step": 2435, "valid_targets_mean": 5387.0, "valid_targets_min": 979 }, { "epoch": 3.904, "grad_norm": 0.4260255800186257, "learning_rate": 1.948138015454168e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.23484918475151062, "step": 2440, "valid_targets_mean": 3805.9, "valid_targets_min": 1012 }, { "epoch": 3.912, "grad_norm": 0.4706145084246985, "learning_rate": 1.9401614713855775e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.30133742094039917, "step": 2445, "valid_targets_mean": 3473.2, "valid_targets_min": 666 }, { "epoch": 3.92, "grad_norm": 0.42155693267392574, "learning_rate": 1.932185879870218e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.23585715889930725, "step": 2450, "valid_targets_mean": 4632.4, "valid_targets_min": 946 }, { "epoch": 3.928, "grad_norm": 0.42216004508529464, "learning_rate": 1.924211367869357e-05, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.25942063331604004, "step": 2455, "valid_targets_mean": 4232.3, "valid_targets_min": 1077 }, { "epoch": 3.936, "grad_norm": 0.43356255890123696, "learning_rate": 1.9162380623270783e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.24051374197006226, "step": 2460, "valid_targets_mean": 3791.2, "valid_targets_min": 655 }, { "epoch": 3.944, "grad_norm": 0.41613078686108457, "learning_rate": 1.90826609016826e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.2255561798810959, "step": 2465, "valid_targets_mean": 3539.2, "valid_targets_min": 785 }, { "epoch": 3.952, "grad_norm": 0.38294039222353565, "learning_rate": 1.9002955782965548e-05, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.2199365645647049, "step": 2470, "valid_targets_mean": 4334.4, "valid_targets_min": 791 }, { "epoch": 3.96, "grad_norm": 0.45878262976054157, "learning_rate": 1.8923266535923688e-05, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.27829837799072266, "step": 2475, "valid_targets_mean": 3980.3, "valid_targets_min": 1038 }, { "epoch": 3.968, "grad_norm": 0.42297288882981043, "learning_rate": 1.8843594429108426e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.29415255784988403, "step": 2480, "valid_targets_mean": 4948.5, "valid_targets_min": 932 }, { "epoch": 3.976, "grad_norm": 0.4638883460903558, "learning_rate": 1.8763940730798324e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.2466743290424347, "step": 2485, "valid_targets_mean": 3243.7, "valid_targets_min": 712 }, { "epoch": 3.984, "grad_norm": 0.4897364741478554, "learning_rate": 1.8684306708978896e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.25233909487724304, "step": 2490, "valid_targets_mean": 3177.6, "valid_targets_min": 850 }, { "epoch": 3.992, "grad_norm": 0.46252614216792853, "learning_rate": 1.8604693631322433e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.23966452479362488, "step": 2495, "valid_targets_mean": 3006.2, "valid_targets_min": 860 }, { "epoch": 4.0, "grad_norm": 0.31710051876751844, "learning_rate": 1.852510276516783e-05, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.20360557734966278, "step": 2500, "valid_targets_mean": 5554.4, "valid_targets_min": 762 }, { "epoch": 4.008, "grad_norm": 0.4182463285312466, "learning_rate": 1.8445535377500393e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.2686900496482849, "step": 2505, "valid_targets_mean": 4283.1, "valid_targets_min": 780 }, { "epoch": 4.016, "grad_norm": 0.34215268944260163, "learning_rate": 1.8365992734931686e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.24253295361995697, "step": 2510, "valid_targets_mean": 6879.1, "valid_targets_min": 993 }, { "epoch": 4.024, "grad_norm": 0.38956003361720304, "learning_rate": 1.8286476103679356e-05, "loss": 0.2283, "loss_nan_ranks": 0, "loss_rank_avg": 0.21489191055297852, "step": 2515, "valid_targets_mean": 4114.4, "valid_targets_min": 1045 }, { "epoch": 4.032, "grad_norm": 0.3507035259915641, "learning_rate": 1.8206986749546992e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.22584864497184753, "step": 2520, "valid_targets_mean": 5080.9, "valid_targets_min": 841 }, { "epoch": 4.04, "grad_norm": 0.3812064932824899, "learning_rate": 1.8127525937903957e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.23593032360076904, "step": 2525, "valid_targets_mean": 4911.8, "valid_targets_min": 760 }, { "epoch": 4.048, "grad_norm": 0.5267876933020568, "learning_rate": 1.8048094933665262e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.2608511745929718, "step": 2530, "valid_targets_mean": 2954.8, "valid_targets_min": 969 }, { "epoch": 4.056, "grad_norm": 0.3449942876056951, "learning_rate": 1.7968695001271416e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.2336217761039734, "step": 2535, "valid_targets_mean": 6292.1, "valid_targets_min": 790 }, { "epoch": 4.064, "grad_norm": 0.4355115464048802, "learning_rate": 1.7889327404668316e-05, "loss": 0.2195, "loss_nan_ranks": 0, "loss_rank_avg": 0.2266024351119995, "step": 2540, "valid_targets_mean": 3884.9, "valid_targets_min": 879 }, { "epoch": 4.072, "grad_norm": 0.3081848481333973, "learning_rate": 1.7809993407287083e-05, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.22978955507278442, "step": 2545, "valid_targets_mean": 7871.2, "valid_targets_min": 797 }, { "epoch": 4.08, "grad_norm": 0.5481512251233728, "learning_rate": 1.7730694272024018e-05, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.30004870891571045, "step": 2550, "valid_targets_mean": 3161.5, "valid_targets_min": 804 }, { "epoch": 4.088, "grad_norm": 0.48046326523783284, "learning_rate": 1.765143126122044e-05, "loss": 0.2554, "loss_nan_ranks": 0, "loss_rank_avg": 0.2633433938026428, "step": 2555, "valid_targets_mean": 3137.6, "valid_targets_min": 913 }, { "epoch": 4.096, "grad_norm": 0.45306035014956936, "learning_rate": 1.7572205636642622e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.27019399404525757, "step": 2560, "valid_targets_mean": 4373.4, "valid_targets_min": 793 }, { "epoch": 4.104, "grad_norm": 0.3583844187285849, "learning_rate": 1.749301865946169e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.21709087491035461, "step": 2565, "valid_targets_mean": 5196.9, "valid_targets_min": 823 }, { "epoch": 4.112, "grad_norm": 0.4402520016943769, "learning_rate": 1.7413871590233557e-05, "loss": 0.2571, "loss_nan_ranks": 0, "loss_rank_avg": 0.26503556966781616, "step": 2570, "valid_targets_mean": 4493.4, "valid_targets_min": 809 }, { "epoch": 4.12, "grad_norm": 0.3555706054314649, "learning_rate": 1.7334765688878848e-05, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.2207963764667511, "step": 2575, "valid_targets_mean": 5484.2, "valid_targets_min": 690 }, { "epoch": 4.128, "grad_norm": 0.4611646375770736, "learning_rate": 1.7255702214662852e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.24676471948623657, "step": 2580, "valid_targets_mean": 3392.4, "valid_targets_min": 784 }, { "epoch": 4.136, "grad_norm": 0.47243039431807954, "learning_rate": 1.7176682426175468e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.2714911103248596, "step": 2585, "valid_targets_mean": 3790.6, "valid_targets_min": 996 }, { "epoch": 4.144, "grad_norm": 0.3937112234840623, "learning_rate": 1.709770758131118e-05, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.25096097588539124, "step": 2590, "valid_targets_mean": 4663.3, "valid_targets_min": 653 }, { "epoch": 4.152, "grad_norm": 0.4070587446512345, "learning_rate": 1.7018778937249017e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.2075790911912918, "step": 2595, "valid_targets_mean": 3767.4, "valid_targets_min": 858 }, { "epoch": 4.16, "grad_norm": 0.36994325328075317, "learning_rate": 1.6939897750432562e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.22925224900245667, "step": 2600, "valid_targets_mean": 5491.9, "valid_targets_min": 719 }, { "epoch": 4.168, "grad_norm": 0.45041384359435777, "learning_rate": 1.6861065276549933e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.24161088466644287, "step": 2605, "valid_targets_mean": 4071.9, "valid_targets_min": 855 }, { "epoch": 4.176, "grad_norm": 0.4581954398994809, "learning_rate": 1.6782282770513788e-05, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.2478228509426117, "step": 2610, "valid_targets_mean": 3686.6, "valid_targets_min": 709 }, { "epoch": 4.184, "grad_norm": 0.4007037738747935, "learning_rate": 1.6703551486441382e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.2544166147708893, "step": 2615, "valid_targets_mean": 4708.0, "valid_targets_min": 835 }, { "epoch": 4.192, "grad_norm": 0.35558467476339845, "learning_rate": 1.6624872677634565e-05, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.22993795573711395, "step": 2620, "valid_targets_mean": 5626.6, "valid_targets_min": 1024 }, { "epoch": 4.2, "grad_norm": 0.4362176145931464, "learning_rate": 1.654624759655986e-05, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.23500782251358032, "step": 2625, "valid_targets_mean": 4308.1, "valid_targets_min": 908 }, { "epoch": 4.208, "grad_norm": 0.43269722980811254, "learning_rate": 1.64676774948285e-05, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.25792813301086426, "step": 2630, "valid_targets_mean": 4154.8, "valid_targets_min": 1168 }, { "epoch": 4.216, "grad_norm": 0.362438370317793, "learning_rate": 1.6389163623176536e-05, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.23212498426437378, "step": 2635, "valid_targets_mean": 5189.7, "valid_targets_min": 857 }, { "epoch": 4.224, "grad_norm": 0.6495031296425801, "learning_rate": 1.6310707231444884e-05, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.33409446477890015, "step": 2640, "valid_targets_mean": 2262.6, "valid_targets_min": 923 }, { "epoch": 4.232, "grad_norm": 0.3044482725544302, "learning_rate": 1.623230956855947e-05, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.1921289712190628, "step": 2645, "valid_targets_mean": 6717.5, "valid_targets_min": 1050 }, { "epoch": 4.24, "grad_norm": 0.4021251156140196, "learning_rate": 1.6153971882511324e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.23349186778068542, "step": 2650, "valid_targets_mean": 4582.3, "valid_targets_min": 722 }, { "epoch": 4.248, "grad_norm": 0.3445640898802388, "learning_rate": 1.6075695420336724e-05, "loss": 0.2186, "loss_nan_ranks": 0, "loss_rank_avg": 0.24022488296031952, "step": 2655, "valid_targets_mean": 5738.2, "valid_targets_min": 859 }, { "epoch": 4.256, "grad_norm": 0.3634851638301243, "learning_rate": 1.5997481428097338e-05, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.18648147583007812, "step": 2660, "valid_targets_mean": 5074.1, "valid_targets_min": 879 }, { "epoch": 4.264, "grad_norm": 0.4641862374466239, "learning_rate": 1.5919331150860396e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.23830462992191315, "step": 2665, "valid_targets_mean": 3713.1, "valid_targets_min": 823 }, { "epoch": 4.272, "grad_norm": 0.5391929747868811, "learning_rate": 1.5841245832678873e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.2308681607246399, "step": 2670, "valid_targets_mean": 3575.1, "valid_targets_min": 748 }, { "epoch": 4.28, "grad_norm": 0.35324812073512407, "learning_rate": 1.576322671657166e-05, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.22632098197937012, "step": 2675, "valid_targets_mean": 5186.4, "valid_targets_min": 764 }, { "epoch": 4.288, "grad_norm": 0.36772896338506605, "learning_rate": 1.5685275044503804e-05, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.20238947868347168, "step": 2680, "valid_targets_mean": 4375.9, "valid_targets_min": 998 }, { "epoch": 4.296, "grad_norm": 0.5917343917305425, "learning_rate": 1.560739205736674e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.2685689628124237, "step": 2685, "valid_targets_mean": 2465.2, "valid_targets_min": 745 }, { "epoch": 4.304, "grad_norm": 0.38800770329149276, "learning_rate": 1.552957899495851e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.22670996189117432, "step": 2690, "valid_targets_mean": 4851.9, "valid_targets_min": 1051 }, { "epoch": 4.312, "grad_norm": 0.4348192390077996, "learning_rate": 1.5451837095964054e-05, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.23623718321323395, "step": 2695, "valid_targets_mean": 4257.4, "valid_targets_min": 741 }, { "epoch": 4.32, "grad_norm": 0.3150520299968283, "learning_rate": 1.5374167597935478e-05, "loss": 0.2113, "loss_nan_ranks": 0, "loss_rank_avg": 0.18955495953559875, "step": 2700, "valid_targets_mean": 5891.4, "valid_targets_min": 845 }, { "epoch": 4.328, "grad_norm": 0.4228257855789774, "learning_rate": 1.5296571737272354e-05, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.22553138434886932, "step": 2705, "valid_targets_mean": 3918.9, "valid_targets_min": 788 }, { "epoch": 4.336, "grad_norm": 0.4441377948845305, "learning_rate": 1.5219050749202037e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.22206555306911469, "step": 2710, "valid_targets_mean": 3918.2, "valid_targets_min": 916 }, { "epoch": 4.344, "grad_norm": 0.5003922378983456, "learning_rate": 1.5141605867760021e-05, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.2991781234741211, "step": 2715, "valid_targets_mean": 3582.6, "valid_targets_min": 670 }, { "epoch": 4.352, "grad_norm": 0.3967867101584086, "learning_rate": 1.5064238325770267e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.24074117839336395, "step": 2720, "valid_targets_mean": 4480.3, "valid_targets_min": 945 }, { "epoch": 4.36, "grad_norm": 0.40832709295548075, "learning_rate": 1.498694935482559e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.2141822874546051, "step": 2725, "valid_targets_mean": 3890.5, "valid_targets_min": 894 }, { "epoch": 4.368, "grad_norm": 0.5353662529083422, "learning_rate": 1.4909740185268056e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.2768443822860718, "step": 2730, "valid_targets_mean": 3256.1, "valid_targets_min": 732 }, { "epoch": 4.376, "grad_norm": 0.3903407215377192, "learning_rate": 1.4832612046169408e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.25160282850265503, "step": 2735, "valid_targets_mean": 5186.7, "valid_targets_min": 898 }, { "epoch": 4.384, "grad_norm": 0.3610608999407683, "learning_rate": 1.4755566165311455e-05, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.21602243185043335, "step": 2740, "valid_targets_mean": 5826.9, "valid_targets_min": 899 }, { "epoch": 4.392, "grad_norm": 0.3705361464347009, "learning_rate": 1.4678603769166591e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.2093980610370636, "step": 2745, "valid_targets_mean": 4775.3, "valid_targets_min": 685 }, { "epoch": 4.4, "grad_norm": 0.5672264522039926, "learning_rate": 1.4601726082878226e-05, "loss": 0.2265, "loss_nan_ranks": 0, "loss_rank_avg": 0.23798605799674988, "step": 2750, "valid_targets_mean": 2565.5, "valid_targets_min": 851 }, { "epoch": 4.408, "grad_norm": 0.3839516251209785, "learning_rate": 1.4524934330241292e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.20655933022499084, "step": 2755, "valid_targets_mean": 4338.2, "valid_targets_min": 710 }, { "epoch": 4.416, "grad_norm": 0.6594074981447611, "learning_rate": 1.4448229733682784e-05, "loss": 0.235, "loss_nan_ranks": 0, "loss_rank_avg": 0.24626955389976501, "step": 2760, "valid_targets_mean": 2719.0, "valid_targets_min": 717 }, { "epoch": 4.424, "grad_norm": 0.5159254418985769, "learning_rate": 1.4371613514242264e-05, "loss": 0.2307, "loss_nan_ranks": 0, "loss_rank_avg": 0.24901220202445984, "step": 2765, "valid_targets_mean": 3019.8, "valid_targets_min": 881 }, { "epoch": 4.432, "grad_norm": 0.3594039502636306, "learning_rate": 1.4295086891552457e-05, "loss": 0.2197, "loss_nan_ranks": 0, "loss_rank_avg": 0.2654702663421631, "step": 2770, "valid_targets_mean": 6056.7, "valid_targets_min": 1036 }, { "epoch": 4.44, "grad_norm": 0.34691201685012074, "learning_rate": 1.4218651083819811e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.21709834039211273, "step": 2775, "valid_targets_mean": 5528.9, "valid_targets_min": 1091 }, { "epoch": 4.448, "grad_norm": 0.4454510808301901, "learning_rate": 1.4142307307805125e-05, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.2332070767879486, "step": 2780, "valid_targets_mean": 3425.8, "valid_targets_min": 626 }, { "epoch": 4.456, "grad_norm": 0.33114532349140574, "learning_rate": 1.406605677880416e-05, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.216552734375, "step": 2785, "valid_targets_mean": 5557.9, "valid_targets_min": 686 }, { "epoch": 4.464, "grad_norm": 0.36774664936117085, "learning_rate": 1.3989900710628313e-05, "loss": 0.239, "loss_nan_ranks": 0, "loss_rank_avg": 0.21505959331989288, "step": 2790, "valid_targets_mean": 4693.8, "valid_targets_min": 990 }, { "epoch": 4.4719999999999995, "grad_norm": 0.3545900301698533, "learning_rate": 1.3913840315585279e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.21788690984249115, "step": 2795, "valid_targets_mean": 5270.3, "valid_targets_min": 830 }, { "epoch": 4.48, "grad_norm": 0.4302379594475467, "learning_rate": 1.3837876804459765e-05, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.24874816834926605, "step": 2800, "valid_targets_mean": 4287.2, "valid_targets_min": 1103 }, { "epoch": 4.4879999999999995, "grad_norm": 0.367392918189934, "learning_rate": 1.3762011386494191e-05, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.22634848952293396, "step": 2805, "valid_targets_mean": 4934.0, "valid_targets_min": 917 }, { "epoch": 4.496, "grad_norm": 0.3355554630083534, "learning_rate": 1.3686245269369485e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.21311712265014648, "step": 2810, "valid_targets_mean": 5740.8, "valid_targets_min": 991 }, { "epoch": 4.504, "grad_norm": 0.3839903505349243, "learning_rate": 1.3610579659185809e-05, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.22502079606056213, "step": 2815, "valid_targets_mean": 4504.8, "valid_targets_min": 955 }, { "epoch": 4.5120000000000005, "grad_norm": 0.3433561120934192, "learning_rate": 1.35350157604434e-05, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.23318302631378174, "step": 2820, "valid_targets_mean": 6099.9, "valid_targets_min": 830 }, { "epoch": 4.52, "grad_norm": 0.3924173308347554, "learning_rate": 1.345955477602337e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.22661542892456055, "step": 2825, "valid_targets_mean": 4413.6, "valid_targets_min": 1228 }, { "epoch": 4.5280000000000005, "grad_norm": 0.3671450930398099, "learning_rate": 1.3384197907168561e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.2506842613220215, "step": 2830, "valid_targets_mean": 5014.2, "valid_targets_min": 865 }, { "epoch": 4.536, "grad_norm": 0.4471447410885578, "learning_rate": 1.3308946353464438e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.25687381625175476, "step": 2835, "valid_targets_mean": 3734.6, "valid_targets_min": 973 }, { "epoch": 4.5440000000000005, "grad_norm": 0.3665444810496819, "learning_rate": 1.3233801312819979e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.24433283507823944, "step": 2840, "valid_targets_mean": 5373.4, "valid_targets_min": 967 }, { "epoch": 4.552, "grad_norm": 0.38498330932928676, "learning_rate": 1.3158763981448606e-05, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.23016983270645142, "step": 2845, "valid_targets_mean": 4454.9, "valid_targets_min": 1088 }, { "epoch": 4.5600000000000005, "grad_norm": 0.3993486182470705, "learning_rate": 1.3083835553849148e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.24869374930858612, "step": 2850, "valid_targets_mean": 4435.8, "valid_targets_min": 739 }, { "epoch": 4.568, "grad_norm": 0.4530152443374673, "learning_rate": 1.3009017222786828e-05, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.2325194925069809, "step": 2855, "valid_targets_mean": 3650.1, "valid_targets_min": 1149 }, { "epoch": 4.576, "grad_norm": 0.45145189985347955, "learning_rate": 1.2934310179274269e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.24084368348121643, "step": 2860, "valid_targets_mean": 3644.5, "valid_targets_min": 704 }, { "epoch": 4.584, "grad_norm": 0.4475782725112683, "learning_rate": 1.2859715612552541e-05, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.21897542476654053, "step": 2865, "valid_targets_mean": 3397.4, "valid_targets_min": 1067 }, { "epoch": 4.592, "grad_norm": 0.4612371616890256, "learning_rate": 1.278523471007223e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.22148343920707703, "step": 2870, "valid_targets_mean": 2955.4, "valid_targets_min": 777 }, { "epoch": 4.6, "grad_norm": 0.3387602746131469, "learning_rate": 1.271086865747451e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.24698293209075928, "step": 2875, "valid_targets_mean": 6360.4, "valid_targets_min": 1383 }, { "epoch": 4.608, "grad_norm": 0.3839373637303783, "learning_rate": 1.2636618638572316e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.2379951924085617, "step": 2880, "valid_targets_mean": 5022.4, "valid_targets_min": 829 }, { "epoch": 4.616, "grad_norm": 0.3197611013771196, "learning_rate": 1.2562485835331466e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.23118649423122406, "step": 2885, "valid_targets_mean": 7057.1, "valid_targets_min": 1038 }, { "epoch": 4.624, "grad_norm": 0.43290245672745614, "learning_rate": 1.2488471427851852e-05, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.23651964962482452, "step": 2890, "valid_targets_mean": 3611.8, "valid_targets_min": 851 }, { "epoch": 4.632, "grad_norm": 0.4331683426323707, "learning_rate": 1.241457659434866e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.22483578324317932, "step": 2895, "valid_targets_mean": 3447.9, "valid_targets_min": 978 }, { "epoch": 4.64, "grad_norm": 0.3988096882137287, "learning_rate": 1.2340802511133605e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.2243075966835022, "step": 2900, "valid_targets_mean": 4385.4, "valid_targets_min": 863 }, { "epoch": 4.648, "grad_norm": 0.40557367557155005, "learning_rate": 1.2267150352596216e-05, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.22742396593093872, "step": 2905, "valid_targets_mean": 4335.8, "valid_targets_min": 941 }, { "epoch": 4.656, "grad_norm": 0.41903497071079515, "learning_rate": 1.2193621291185132e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.23160028457641602, "step": 2910, "valid_targets_mean": 3808.8, "valid_targets_min": 916 }, { "epoch": 4.664, "grad_norm": 0.3333342358026764, "learning_rate": 1.2120216497389446e-05, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.21926115453243256, "step": 2915, "valid_targets_mean": 5564.4, "valid_targets_min": 898 }, { "epoch": 4.672, "grad_norm": 0.35498213383205174, "learning_rate": 1.2046937139720068e-05, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.23465262353420258, "step": 2920, "valid_targets_mean": 5612.9, "valid_targets_min": 901 }, { "epoch": 4.68, "grad_norm": 0.43676624123660573, "learning_rate": 1.1973784384691121e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.22778140008449554, "step": 2925, "valid_targets_mean": 3652.6, "valid_targets_min": 744 }, { "epoch": 4.688, "grad_norm": 0.43153283817401733, "learning_rate": 1.1900759396801382e-05, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.23726201057434082, "step": 2930, "valid_targets_mean": 3769.8, "valid_targets_min": 1104 }, { "epoch": 4.696, "grad_norm": 0.4041357939241981, "learning_rate": 1.1827863338515741e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.23281404376029968, "step": 2935, "valid_targets_mean": 4432.1, "valid_targets_min": 897 }, { "epoch": 4.704, "grad_norm": 0.3514377881831837, "learning_rate": 1.1755097370246669e-05, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.220592200756073, "step": 2940, "valid_targets_mean": 5495.7, "valid_targets_min": 793 }, { "epoch": 4.712, "grad_norm": 0.4214613254086311, "learning_rate": 1.1682462650335791e-05, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.2115774154663086, "step": 2945, "valid_targets_mean": 3903.4, "valid_targets_min": 785 }, { "epoch": 4.72, "grad_norm": 0.5099284948600926, "learning_rate": 1.1609960335035423e-05, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.22030048072338104, "step": 2950, "valid_targets_mean": 2719.6, "valid_targets_min": 771 }, { "epoch": 4.728, "grad_norm": 0.3655229242181005, "learning_rate": 1.1537591578490165e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.20158278942108154, "step": 2955, "valid_targets_mean": 4298.5, "valid_targets_min": 793 }, { "epoch": 4.736, "grad_norm": 0.46139845446107813, "learning_rate": 1.146535753271853e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.24375522136688232, "step": 2960, "valid_targets_mean": 3361.3, "valid_targets_min": 902 }, { "epoch": 4.744, "grad_norm": 0.4688790022851686, "learning_rate": 1.139325934759461e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.25852593779563904, "step": 2965, "valid_targets_mean": 3596.0, "valid_targets_min": 968 }, { "epoch": 4.752, "grad_norm": 0.5227422410545948, "learning_rate": 1.1321298170829768e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.24697157740592957, "step": 2970, "valid_targets_mean": 2877.5, "valid_targets_min": 887 }, { "epoch": 4.76, "grad_norm": 0.4038881666049419, "learning_rate": 1.1249475147954363e-05, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.21838301420211792, "step": 2975, "valid_targets_mean": 4123.2, "valid_targets_min": 777 }, { "epoch": 4.768, "grad_norm": 0.5184660299912265, "learning_rate": 1.1177791422299528e-05, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.27220386266708374, "step": 2980, "valid_targets_mean": 3015.9, "valid_targets_min": 630 }, { "epoch": 4.776, "grad_norm": 0.3654819987069819, "learning_rate": 1.1106248134978959e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.22408969700336456, "step": 2985, "valid_targets_mean": 5349.6, "valid_targets_min": 1141 }, { "epoch": 4.784, "grad_norm": 0.3660126606227132, "learning_rate": 1.1034846424870744e-05, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.2300996333360672, "step": 2990, "valid_targets_mean": 4971.9, "valid_targets_min": 978 }, { "epoch": 4.792, "grad_norm": 0.3756476057343205, "learning_rate": 1.0963587428599256e-05, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.2119663953781128, "step": 2995, "valid_targets_mean": 4842.7, "valid_targets_min": 732 }, { "epoch": 4.8, "grad_norm": 0.4613837764914878, "learning_rate": 1.089247228051704e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.24079769849777222, "step": 3000, "valid_targets_mean": 3716.3, "valid_targets_min": 759 }, { "epoch": 4.808, "grad_norm": 0.28943767912823337, "learning_rate": 1.0821502112686753e-05, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.19776251912117004, "step": 3005, "valid_targets_mean": 6197.8, "valid_targets_min": 782 }, { "epoch": 4.816, "grad_norm": 0.4161037969654231, "learning_rate": 1.0750678054863158e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.22658786177635193, "step": 3010, "valid_targets_mean": 3665.1, "valid_targets_min": 752 }, { "epoch": 4.824, "grad_norm": 0.31379216309346025, "learning_rate": 1.0680001234475127e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.20140352845191956, "step": 3015, "valid_targets_mean": 6177.3, "valid_targets_min": 887 }, { "epoch": 4.832, "grad_norm": 0.3780126118328765, "learning_rate": 1.0609472776607715e-05, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.24119669198989868, "step": 3020, "valid_targets_mean": 6278.8, "valid_targets_min": 1106 }, { "epoch": 4.84, "grad_norm": 0.3373262706812363, "learning_rate": 1.0539093803984217e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.20110008120536804, "step": 3025, "valid_targets_mean": 5751.3, "valid_targets_min": 1033 }, { "epoch": 4.848, "grad_norm": 0.37649695603656197, "learning_rate": 1.046886543694832e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.2516307532787323, "step": 3030, "valid_targets_mean": 5042.4, "valid_targets_min": 1139 }, { "epoch": 4.856, "grad_norm": 0.38263029301997636, "learning_rate": 1.0398788793446263e-05, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.207616925239563, "step": 3035, "valid_targets_mean": 4312.8, "valid_targets_min": 1036 }, { "epoch": 4.864, "grad_norm": 0.42458541451939813, "learning_rate": 1.0328864989009037e-05, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.22665390372276306, "step": 3040, "valid_targets_mean": 3687.1, "valid_targets_min": 969 }, { "epoch": 4.872, "grad_norm": 0.3892606340058019, "learning_rate": 1.0259095136734634e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.23070894181728363, "step": 3045, "valid_targets_mean": 4354.3, "valid_targets_min": 918 }, { "epoch": 4.88, "grad_norm": 0.40230384154567744, "learning_rate": 1.0189480347270311e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.24141496419906616, "step": 3050, "valid_targets_mean": 4812.8, "valid_targets_min": 942 }, { "epoch": 4.888, "grad_norm": 0.4084264186589575, "learning_rate": 1.0120021728794938e-05, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.21485230326652527, "step": 3055, "valid_targets_mean": 4172.5, "valid_targets_min": 969 }, { "epoch": 4.896, "grad_norm": 0.5082884887305914, "learning_rate": 1.0050720387001334e-05, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.2505829930305481, "step": 3060, "valid_targets_mean": 2977.1, "valid_targets_min": 690 }, { "epoch": 4.904, "grad_norm": 0.38678833449761596, "learning_rate": 9.981577425078672e-06, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.2366374433040619, "step": 3065, "valid_targets_mean": 4762.4, "valid_targets_min": 1002 }, { "epoch": 4.912, "grad_norm": 0.38418961481494723, "learning_rate": 9.912593943694924e-06, "loss": 0.2319, "loss_nan_ranks": 0, "loss_rank_avg": 0.1991523802280426, "step": 3070, "valid_targets_mean": 4543.4, "valid_targets_min": 1056 }, { "epoch": 4.92, "grad_norm": 0.4832708684343786, "learning_rate": 9.843771040979328e-06, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.24161699414253235, "step": 3075, "valid_targets_mean": 3462.6, "valid_targets_min": 763 }, { "epoch": 4.928, "grad_norm": 0.4309087603014352, "learning_rate": 9.775109812504922e-06, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.20923660695552826, "step": 3080, "valid_targets_mean": 3484.4, "valid_targets_min": 664 }, { "epoch": 4.936, "grad_norm": 0.3788722471104869, "learning_rate": 9.706611351271088e-06, "loss": 0.2319, "loss_nan_ranks": 0, "loss_rank_avg": 0.22105582058429718, "step": 3085, "valid_targets_mean": 4319.1, "valid_targets_min": 721 }, { "epoch": 4.944, "grad_norm": 0.4355369088708729, "learning_rate": 9.638276747686169e-06, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.24673102796077728, "step": 3090, "valid_targets_mean": 3661.9, "valid_targets_min": 881 }, { "epoch": 4.952, "grad_norm": 0.40667695740023535, "learning_rate": 9.570107089550091e-06, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.23325340449810028, "step": 3095, "valid_targets_mean": 4411.1, "valid_targets_min": 902 }, { "epoch": 4.96, "grad_norm": 0.3942359450360996, "learning_rate": 9.502103462037074e-06, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.2507432699203491, "step": 3100, "valid_targets_mean": 4678.1, "valid_targets_min": 899 }, { "epoch": 4.968, "grad_norm": 0.395308435273449, "learning_rate": 9.434266947678326e-06, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.22862330079078674, "step": 3105, "valid_targets_mean": 4401.1, "valid_targets_min": 1048 }, { "epoch": 4.976, "grad_norm": 0.35534927093483687, "learning_rate": 9.366598626344836e-06, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.24637477099895477, "step": 3110, "valid_targets_mean": 5403.4, "valid_targets_min": 942 }, { "epoch": 4.984, "grad_norm": 0.3598184673475776, "learning_rate": 9.299099575230172e-06, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.23107300698757172, "step": 3115, "valid_targets_mean": 5155.9, "valid_targets_min": 1085 }, { "epoch": 4.992, "grad_norm": 0.5088527769647312, "learning_rate": 9.231770868833334e-06, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.26669660210609436, "step": 3120, "valid_targets_mean": 3198.4, "valid_targets_min": 982 }, { "epoch": 5.0, "grad_norm": 0.34198183838948926, "learning_rate": 9.164613578941652e-06, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.21536295115947723, "step": 3125, "valid_targets_mean": 5529.9, "valid_targets_min": 896 }, { "epoch": 5.008, "grad_norm": 0.4912006951999863, "learning_rate": 9.097628774613732e-06, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.2081344723701477, "step": 3130, "valid_targets_mean": 2727.4, "valid_targets_min": 743 }, { "epoch": 5.016, "grad_norm": 0.4084241000168698, "learning_rate": 9.030817522162403e-06, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.2399434745311737, "step": 3135, "valid_targets_mean": 4014.1, "valid_targets_min": 664 }, { "epoch": 5.024, "grad_norm": 0.43709779953742833, "learning_rate": 8.964180885137797e-06, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.22896772623062134, "step": 3140, "valid_targets_mean": 4365.4, "valid_targets_min": 1046 }, { "epoch": 5.032, "grad_norm": 0.305518599208397, "learning_rate": 8.897719924310375e-06, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.20471172034740448, "step": 3145, "valid_targets_mean": 6402.6, "valid_targets_min": 931 }, { "epoch": 5.04, "grad_norm": 0.37990073340945496, "learning_rate": 8.831435697654068e-06, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.19448421895503998, "step": 3150, "valid_targets_mean": 4079.8, "valid_targets_min": 902 }, { "epoch": 5.048, "grad_norm": 0.31479459501943424, "learning_rate": 8.765329260329413e-06, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.19626212120056152, "step": 3155, "valid_targets_mean": 6214.5, "valid_targets_min": 951 }, { "epoch": 5.056, "grad_norm": 0.3740116945023727, "learning_rate": 8.699401664666774e-06, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.19557811319828033, "step": 3160, "valid_targets_mean": 4366.0, "valid_targets_min": 788 }, { "epoch": 5.064, "grad_norm": 0.4192074460438228, "learning_rate": 8.633653960149579e-06, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.26347237825393677, "step": 3165, "valid_targets_mean": 4294.9, "valid_targets_min": 869 }, { "epoch": 5.072, "grad_norm": 0.3170004260395546, "learning_rate": 8.56808719339762e-06, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.20620077848434448, "step": 3170, "valid_targets_mean": 6649.5, "valid_targets_min": 888 }, { "epoch": 5.08, "grad_norm": 0.3841314180170002, "learning_rate": 8.502702408150391e-06, "loss": 0.2197, "loss_nan_ranks": 0, "loss_rank_avg": 0.24174794554710388, "step": 3175, "valid_targets_mean": 4925.1, "valid_targets_min": 909 }, { "epoch": 5.088, "grad_norm": 0.34188326135593766, "learning_rate": 8.43750064525047e-06, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.19666939973831177, "step": 3180, "valid_targets_mean": 5542.1, "valid_targets_min": 1072 }, { "epoch": 5.096, "grad_norm": 0.48888208213056195, "learning_rate": 8.372482942626952e-06, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.25927528738975525, "step": 3185, "valid_targets_mean": 3291.2, "valid_targets_min": 950 }, { "epoch": 5.104, "grad_norm": 0.5266810833672644, "learning_rate": 8.307650335278927e-06, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.2526220381259918, "step": 3190, "valid_targets_mean": 3052.0, "valid_targets_min": 842 }, { "epoch": 5.112, "grad_norm": 0.3489078895076499, "learning_rate": 8.243003855259015e-06, "loss": 0.2394, "loss_nan_ranks": 0, "loss_rank_avg": 0.23310494422912598, "step": 3195, "valid_targets_mean": 6052.8, "valid_targets_min": 1104 }, { "epoch": 5.12, "grad_norm": 0.4273931588420199, "learning_rate": 8.178544531656897e-06, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.2163240909576416, "step": 3200, "valid_targets_mean": 4048.2, "valid_targets_min": 747 }, { "epoch": 5.128, "grad_norm": 0.4287189766428896, "learning_rate": 8.11427339058299e-06, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.25983962416648865, "step": 3205, "valid_targets_mean": 4372.1, "valid_targets_min": 1021 }, { "epoch": 5.136, "grad_norm": 0.4697741992206112, "learning_rate": 8.050191455152072e-06, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.23713898658752441, "step": 3210, "valid_targets_mean": 3780.0, "valid_targets_min": 833 }, { "epoch": 5.144, "grad_norm": 0.3426204752362461, "learning_rate": 7.986299745467013e-06, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.2151990830898285, "step": 3215, "valid_targets_mean": 5340.3, "valid_targets_min": 1017 }, { "epoch": 5.152, "grad_norm": 0.3476898053916093, "learning_rate": 7.922599278602524e-06, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.2065230756998062, "step": 3220, "valid_targets_mean": 5802.0, "valid_targets_min": 987 }, { "epoch": 5.16, "grad_norm": 0.34997024370706975, "learning_rate": 7.859091068588987e-06, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.22452686727046967, "step": 3225, "valid_targets_mean": 5912.6, "valid_targets_min": 711 }, { "epoch": 5.168, "grad_norm": 0.5145349413640553, "learning_rate": 7.795776126396284e-06, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.26052239537239075, "step": 3230, "valid_targets_mean": 3026.5, "valid_targets_min": 938 }, { "epoch": 5.176, "grad_norm": 0.44391793492379567, "learning_rate": 7.732655459917726e-06, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.23127031326293945, "step": 3235, "valid_targets_mean": 3623.2, "valid_targets_min": 646 }, { "epoch": 5.184, "grad_norm": 0.3630611195177078, "learning_rate": 7.669730073954005e-06, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.21552309393882751, "step": 3240, "valid_targets_mean": 5270.8, "valid_targets_min": 901 }, { "epoch": 5.192, "grad_norm": 0.4102333340497864, "learning_rate": 7.607000970197194e-06, "loss": 0.2317, "loss_nan_ranks": 0, "loss_rank_avg": 0.24429859220981598, "step": 3245, "valid_targets_mean": 4244.9, "valid_targets_min": 891 }, { "epoch": 5.2, "grad_norm": 0.36913473264732094, "learning_rate": 7.544469147214797e-06, "loss": 0.2254, "loss_nan_ranks": 0, "loss_rank_avg": 0.22578775882720947, "step": 3250, "valid_targets_mean": 5226.1, "valid_targets_min": 973 }, { "epoch": 5.208, "grad_norm": 0.40820878543241174, "learning_rate": 7.482135600433868e-06, "loss": 0.239, "loss_nan_ranks": 0, "loss_rank_avg": 0.25584137439727783, "step": 3255, "valid_targets_mean": 4932.1, "valid_targets_min": 1008 }, { "epoch": 5.216, "grad_norm": 0.4684722429375052, "learning_rate": 7.420001322125156e-06, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.24265044927597046, "step": 3260, "valid_targets_mean": 3623.2, "valid_targets_min": 874 }, { "epoch": 5.224, "grad_norm": 0.44692307822276434, "learning_rate": 7.3580673013872946e-06, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.20505103468894958, "step": 3265, "valid_targets_mean": 3615.4, "valid_targets_min": 750 }, { "epoch": 5.232, "grad_norm": 0.3654288352288813, "learning_rate": 7.2963345241310904e-06, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.19597743451595306, "step": 3270, "valid_targets_mean": 4878.7, "valid_targets_min": 867 }, { "epoch": 5.24, "grad_norm": 0.3915593147251127, "learning_rate": 7.234803973063797e-06, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.2212725579738617, "step": 3275, "valid_targets_mean": 4959.9, "valid_targets_min": 723 }, { "epoch": 5.248, "grad_norm": 0.4748719949243943, "learning_rate": 7.173476627673492e-06, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.2473698854446411, "step": 3280, "valid_targets_mean": 3323.0, "valid_targets_min": 1015 }, { "epoch": 5.256, "grad_norm": 0.3588612065200158, "learning_rate": 7.112353464213477e-06, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.2438439577817917, "step": 3285, "valid_targets_mean": 6511.6, "valid_targets_min": 770 }, { "epoch": 5.264, "grad_norm": 0.4663585945976981, "learning_rate": 7.051435455686735e-06, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.23258927464485168, "step": 3290, "valid_targets_mean": 3390.1, "valid_targets_min": 782 }, { "epoch": 5.272, "grad_norm": 0.4205026890280819, "learning_rate": 6.990723571830438e-06, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.1906987726688385, "step": 3295, "valid_targets_mean": 3564.7, "valid_targets_min": 630 }, { "epoch": 5.28, "grad_norm": 0.426317166162649, "learning_rate": 6.93021877910052e-06, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.20793795585632324, "step": 3300, "valid_targets_mean": 3830.4, "valid_targets_min": 945 }, { "epoch": 5.288, "grad_norm": 0.42620206171289865, "learning_rate": 6.8699220406562985e-06, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.2456003874540329, "step": 3305, "valid_targets_mean": 4204.2, "valid_targets_min": 830 }, { "epoch": 5.296, "grad_norm": 0.3345250802407866, "learning_rate": 6.809834316345117e-06, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.20420578122138977, "step": 3310, "valid_targets_mean": 5562.4, "valid_targets_min": 842 }, { "epoch": 5.304, "grad_norm": 0.43008399094177285, "learning_rate": 6.749956562687083e-06, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.19601237773895264, "step": 3315, "valid_targets_mean": 3619.1, "valid_targets_min": 857 }, { "epoch": 5.312, "grad_norm": 0.44306372764221147, "learning_rate": 6.690289732859841e-06, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.22992250323295593, "step": 3320, "valid_targets_mean": 3904.2, "valid_targets_min": 887 }, { "epoch": 5.32, "grad_norm": 0.349409240727027, "learning_rate": 6.630834776683403e-06, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.20814573764801025, "step": 3325, "valid_targets_mean": 5271.5, "valid_targets_min": 835 }, { "epoch": 5.328, "grad_norm": 0.4377279904884754, "learning_rate": 6.571592640605e-06, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.24027813971042633, "step": 3330, "valid_targets_mean": 4167.5, "valid_targets_min": 1091 }, { "epoch": 5.336, "grad_norm": 0.40618186734048567, "learning_rate": 6.512564267684061e-06, "loss": 0.2156, "loss_nan_ranks": 0, "loss_rank_avg": 0.21228620409965515, "step": 3335, "valid_targets_mean": 4030.2, "valid_targets_min": 951 }, { "epoch": 5.344, "grad_norm": 0.30357992280217233, "learning_rate": 6.453750597577167e-06, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.2015833854675293, "step": 3340, "valid_targets_mean": 6969.1, "valid_targets_min": 971 }, { "epoch": 5.352, "grad_norm": 0.773767098694673, "learning_rate": 6.395152566523106e-06, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.27393215894699097, "step": 3345, "valid_targets_mean": 1623.4, "valid_targets_min": 897 }, { "epoch": 5.36, "grad_norm": 0.33428819684027417, "learning_rate": 6.336771107327966e-06, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.19410398602485657, "step": 3350, "valid_targets_mean": 5683.6, "valid_targets_min": 797 }, { "epoch": 5.368, "grad_norm": 0.45328327875390717, "learning_rate": 6.278607149350289e-06, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.23492465913295746, "step": 3355, "valid_targets_mean": 3600.2, "valid_targets_min": 841 }, { "epoch": 5.376, "grad_norm": 0.42792886228681065, "learning_rate": 6.220661618486268e-06, "loss": 0.2189, "loss_nan_ranks": 0, "loss_rank_avg": 0.21100068092346191, "step": 3360, "valid_targets_mean": 4031.2, "valid_targets_min": 978 }, { "epoch": 5.384, "grad_norm": 0.3557291761519541, "learning_rate": 6.162935437155024e-06, "loss": 0.2156, "loss_nan_ranks": 0, "loss_rank_avg": 0.19593030214309692, "step": 3365, "valid_targets_mean": 5009.3, "valid_targets_min": 932 }, { "epoch": 5.392, "grad_norm": 0.4833225610526371, "learning_rate": 6.105429524283901e-06, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.218770831823349, "step": 3370, "valid_targets_mean": 3252.6, "valid_targets_min": 1030 }, { "epoch": 5.4, "grad_norm": 0.39045313632453454, "learning_rate": 6.04814479529386e-06, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.23024097084999084, "step": 3375, "valid_targets_mean": 5329.8, "valid_targets_min": 898 }, { "epoch": 5.408, "grad_norm": 0.45340949213189335, "learning_rate": 5.991082162084889e-06, "loss": 0.2385, "loss_nan_ranks": 0, "loss_rank_avg": 0.2215794175863266, "step": 3380, "valid_targets_mean": 3607.6, "valid_targets_min": 845 }, { "epoch": 5.416, "grad_norm": 0.4468511461282984, "learning_rate": 5.934242533021499e-06, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.23574653267860413, "step": 3385, "valid_targets_mean": 3929.5, "valid_targets_min": 850 }, { "epoch": 5.424, "grad_norm": 0.45802290494827136, "learning_rate": 5.877626812918258e-06, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.2201964259147644, "step": 3390, "valid_targets_mean": 3413.6, "valid_targets_min": 973 }, { "epoch": 5.432, "grad_norm": 0.3481392608973216, "learning_rate": 5.821235903025378e-06, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.18317848443984985, "step": 3395, "valid_targets_mean": 4914.8, "valid_targets_min": 774 }, { "epoch": 5.44, "grad_norm": 0.46295264230395117, "learning_rate": 5.765070701014391e-06, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.27391642332077026, "step": 3400, "valid_targets_mean": 3862.6, "valid_targets_min": 952 }, { "epoch": 5.448, "grad_norm": 0.44931670150343195, "learning_rate": 5.709132100963841e-06, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.21906086802482605, "step": 3405, "valid_targets_mean": 3500.1, "valid_targets_min": 987 }, { "epoch": 5.456, "grad_norm": 0.34292041400051865, "learning_rate": 5.653420993345062e-06, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.21244516968727112, "step": 3410, "valid_targets_mean": 5683.7, "valid_targets_min": 887 }, { "epoch": 5.464, "grad_norm": 0.5428548488630459, "learning_rate": 5.597938265007994e-06, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.23990648984909058, "step": 3415, "valid_targets_mean": 2892.4, "valid_targets_min": 951 }, { "epoch": 5.4719999999999995, "grad_norm": 0.4706595198308062, "learning_rate": 5.542684799167069e-06, "loss": 0.235, "loss_nan_ranks": 0, "loss_rank_avg": 0.249759703874588, "step": 3420, "valid_targets_mean": 3540.8, "valid_targets_min": 758 }, { "epoch": 5.48, "grad_norm": 0.33282202476267, "learning_rate": 5.487661475387152e-06, "loss": 0.2242, "loss_nan_ranks": 0, "loss_rank_avg": 0.19662153720855713, "step": 3425, "valid_targets_mean": 5487.8, "valid_targets_min": 666 }, { "epoch": 5.4879999999999995, "grad_norm": 0.4006934508283925, "learning_rate": 5.432869169569541e-06, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.20843669772148132, "step": 3430, "valid_targets_mean": 4598.9, "valid_targets_min": 997 }, { "epoch": 5.496, "grad_norm": 0.44192500022237174, "learning_rate": 5.378308753938024e-06, "loss": 0.2173, "loss_nan_ranks": 0, "loss_rank_avg": 0.25620633363723755, "step": 3435, "valid_targets_mean": 3980.2, "valid_targets_min": 815 }, { "epoch": 5.504, "grad_norm": 0.3681471863242707, "learning_rate": 5.323981097024986e-06, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.22333069145679474, "step": 3440, "valid_targets_mean": 4963.6, "valid_targets_min": 879 }, { "epoch": 5.5120000000000005, "grad_norm": 0.356019133477824, "learning_rate": 5.269887063657595e-06, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2231229841709137, "step": 3445, "valid_targets_mean": 5360.4, "valid_targets_min": 810 }, { "epoch": 5.52, "grad_norm": 0.36879369128157946, "learning_rate": 5.216027514944027e-06, "loss": 0.2192, "loss_nan_ranks": 0, "loss_rank_avg": 0.18978220224380493, "step": 3450, "valid_targets_mean": 4393.9, "valid_targets_min": 674 }, { "epoch": 5.5280000000000005, "grad_norm": 0.3875347538251794, "learning_rate": 5.162403308259767e-06, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.289705753326416, "step": 3455, "valid_targets_mean": 5434.2, "valid_targets_min": 1041 }, { "epoch": 5.536, "grad_norm": 0.4285607405336305, "learning_rate": 5.109015297233935e-06, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.21771425008773804, "step": 3460, "valid_targets_mean": 3872.1, "valid_targets_min": 534 }, { "epoch": 5.5440000000000005, "grad_norm": 0.32801945020364764, "learning_rate": 5.055864331735736e-06, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.2591525912284851, "step": 3465, "valid_targets_mean": 6929.5, "valid_targets_min": 1136 }, { "epoch": 5.552, "grad_norm": 0.41166443102851746, "learning_rate": 5.002951257860909e-06, "loss": 0.2319, "loss_nan_ranks": 0, "loss_rank_avg": 0.24956223368644714, "step": 3470, "valid_targets_mean": 4287.4, "valid_targets_min": 888 }, { "epoch": 5.5600000000000005, "grad_norm": 0.4554295252372924, "learning_rate": 4.950276917918256e-06, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.256850004196167, "step": 3475, "valid_targets_mean": 4103.8, "valid_targets_min": 845 }, { "epoch": 5.568, "grad_norm": 0.3506746288784145, "learning_rate": 4.8978421504162385e-06, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.2253202199935913, "step": 3480, "valid_targets_mean": 5456.3, "valid_targets_min": 745 }, { "epoch": 5.576, "grad_norm": 0.33485422936124876, "learning_rate": 4.845647790049634e-06, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.21637138724327087, "step": 3485, "valid_targets_mean": 6199.0, "valid_targets_min": 982 }, { "epoch": 5.584, "grad_norm": 0.35162902696087944, "learning_rate": 4.793694667686244e-06, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.24226173758506775, "step": 3490, "valid_targets_mean": 5727.0, "valid_targets_min": 1047 }, { "epoch": 5.592, "grad_norm": 0.37080133618018396, "learning_rate": 4.741983610353664e-06, "loss": 0.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.1949070692062378, "step": 3495, "valid_targets_mean": 4252.1, "valid_targets_min": 919 }, { "epoch": 5.6, "grad_norm": 0.3999253776520656, "learning_rate": 4.690515441226122e-06, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.1985628753900528, "step": 3500, "valid_targets_mean": 3772.6, "valid_targets_min": 733 }, { "epoch": 5.608, "grad_norm": 0.4528901320681747, "learning_rate": 4.639290979611379e-06, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.23670107126235962, "step": 3505, "valid_targets_mean": 3763.6, "valid_targets_min": 771 }, { "epoch": 5.616, "grad_norm": 0.44302870753176904, "learning_rate": 4.588311040937683e-06, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.24087044596672058, "step": 3510, "valid_targets_mean": 3990.2, "valid_targets_min": 932 }, { "epoch": 5.624, "grad_norm": 0.3201486197160802, "learning_rate": 4.537576436740783e-06, "loss": 0.2246, "loss_nan_ranks": 0, "loss_rank_avg": 0.2149900496006012, "step": 3515, "valid_targets_mean": 6031.9, "valid_targets_min": 817 }, { "epoch": 5.632, "grad_norm": 0.46436580014316425, "learning_rate": 4.487087974651016e-06, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.25911879539489746, "step": 3520, "valid_targets_mean": 4031.8, "valid_targets_min": 809 }, { "epoch": 5.64, "grad_norm": 0.525866298269229, "learning_rate": 4.436846458380455e-06, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.21722733974456787, "step": 3525, "valid_targets_mean": 4505.7, "valid_targets_min": 942 }, { "epoch": 5.648, "grad_norm": 0.43572904873432394, "learning_rate": 4.386852687710104e-06, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.23047277331352234, "step": 3530, "valid_targets_mean": 3991.1, "valid_targets_min": 790 }, { "epoch": 5.656, "grad_norm": 0.44158709967770554, "learning_rate": 4.337107458477177e-06, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.21699798107147217, "step": 3535, "valid_targets_mean": 4153.1, "valid_targets_min": 850 }, { "epoch": 5.664, "grad_norm": 0.3868164489125616, "learning_rate": 4.287611562562422e-06, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.2065228521823883, "step": 3540, "valid_targets_mean": 4349.3, "valid_targets_min": 587 }, { "epoch": 5.672, "grad_norm": 0.3324271889745773, "learning_rate": 4.238365787877516e-06, "loss": 0.2109, "loss_nan_ranks": 0, "loss_rank_avg": 0.2171509563922882, "step": 3545, "valid_targets_mean": 6169.1, "valid_targets_min": 662 }, { "epoch": 5.68, "grad_norm": 0.35264056082201267, "learning_rate": 4.189370918352531e-06, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.2608416676521301, "step": 3550, "valid_targets_mean": 5970.1, "valid_targets_min": 799 }, { "epoch": 5.688, "grad_norm": 0.35571995306346826, "learning_rate": 4.140627733923439e-06, "loss": 0.2235, "loss_nan_ranks": 0, "loss_rank_avg": 0.21136212348937988, "step": 3555, "valid_targets_mean": 5257.9, "valid_targets_min": 1041 }, { "epoch": 5.696, "grad_norm": 0.5361387745629723, "learning_rate": 4.092137010519712e-06, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.27192410826683044, "step": 3560, "valid_targets_mean": 2914.6, "valid_targets_min": 778 }, { "epoch": 5.704, "grad_norm": 0.3505859733083266, "learning_rate": 4.043899520051964e-06, "loss": 0.2171, "loss_nan_ranks": 0, "loss_rank_avg": 0.2221640646457672, "step": 3565, "valid_targets_mean": 5925.2, "valid_targets_min": 1229 }, { "epoch": 5.712, "grad_norm": 0.49758496384659806, "learning_rate": 3.995916030399658e-06, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.27344635128974915, "step": 3570, "valid_targets_mean": 3491.2, "valid_targets_min": 991 }, { "epoch": 5.72, "grad_norm": 0.45141540037088984, "learning_rate": 3.948187305398892e-06, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.21061620116233826, "step": 3575, "valid_targets_mean": 3213.4, "valid_targets_min": 744 }, { "epoch": 5.728, "grad_norm": 0.4562178096296842, "learning_rate": 3.90071410483023e-06, "loss": 0.2238, "loss_nan_ranks": 0, "loss_rank_avg": 0.2696354389190674, "step": 3580, "valid_targets_mean": 4130.9, "valid_targets_min": 898 }, { "epoch": 5.736, "grad_norm": 0.5457573577288195, "learning_rate": 3.853497184406623e-06, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.2726416289806366, "step": 3585, "valid_targets_mean": 2820.8, "valid_targets_min": 960 }, { "epoch": 5.744, "grad_norm": 0.38517110136124666, "learning_rate": 3.80653729576135e-06, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.2264452874660492, "step": 3590, "valid_targets_mean": 4501.1, "valid_targets_min": 704 }, { "epoch": 5.752, "grad_norm": 0.3357747814802782, "learning_rate": 3.7598351864360872e-06, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.23266029357910156, "step": 3595, "valid_targets_mean": 6337.8, "valid_targets_min": 714 }, { "epoch": 5.76, "grad_norm": 0.5020746707062533, "learning_rate": 3.713391599868985e-06, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.2000608742237091, "step": 3600, "valid_targets_mean": 2661.7, "valid_targets_min": 791 }, { "epoch": 5.768, "grad_norm": 0.3763969776767038, "learning_rate": 3.6672072753828424e-06, "loss": 0.2275, "loss_nan_ranks": 0, "loss_rank_avg": 0.21968242526054382, "step": 3605, "valid_targets_mean": 5032.1, "valid_targets_min": 1116 }, { "epoch": 5.776, "grad_norm": 0.41289477559493815, "learning_rate": 3.6212829481733368e-06, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.2321629524230957, "step": 3610, "valid_targets_mean": 4038.8, "valid_targets_min": 805 }, { "epoch": 5.784, "grad_norm": 0.5445568651515015, "learning_rate": 3.575619349297317e-06, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.25765252113342285, "step": 3615, "valid_targets_mean": 2809.0, "valid_targets_min": 739 }, { "epoch": 5.792, "grad_norm": 0.5472578411820961, "learning_rate": 3.5302172056611682e-06, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.25557756423950195, "step": 3620, "valid_targets_mean": 2783.1, "valid_targets_min": 883 }, { "epoch": 5.8, "grad_norm": 0.38982773078778155, "learning_rate": 3.485077240009247e-06, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.22403252124786377, "step": 3625, "valid_targets_mean": 4643.8, "valid_targets_min": 939 }, { "epoch": 5.808, "grad_norm": 0.5233043026636898, "learning_rate": 3.4402001709123643e-06, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.24592408537864685, "step": 3630, "valid_targets_mean": 2974.1, "valid_targets_min": 979 }, { "epoch": 5.816, "grad_norm": 0.45922405516006465, "learning_rate": 3.3955867127563515e-06, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.24016621708869934, "step": 3635, "valid_targets_mean": 3544.6, "valid_targets_min": 832 }, { "epoch": 5.824, "grad_norm": 0.4404664235271227, "learning_rate": 3.351237575730695e-06, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.19508153200149536, "step": 3640, "valid_targets_mean": 3297.2, "valid_targets_min": 922 }, { "epoch": 5.832, "grad_norm": 0.4375315952651967, "learning_rate": 3.307153465817219e-06, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.24130797386169434, "step": 3645, "valid_targets_mean": 4176.2, "valid_targets_min": 1140 }, { "epoch": 5.84, "grad_norm": 0.342391410159785, "learning_rate": 3.263335084778856e-06, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.21955269575119019, "step": 3650, "valid_targets_mean": 5674.6, "valid_targets_min": 916 }, { "epoch": 5.848, "grad_norm": 0.45569732049327233, "learning_rate": 3.2197831301484816e-06, "loss": 0.2237, "loss_nan_ranks": 0, "loss_rank_avg": 0.23995280265808105, "step": 3655, "valid_targets_mean": 3858.6, "valid_targets_min": 1042 }, { "epoch": 5.856, "grad_norm": 0.43878393630957296, "learning_rate": 3.1764982952177805e-06, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.2358689308166504, "step": 3660, "valid_targets_mean": 4056.5, "valid_targets_min": 815 }, { "epoch": 5.864, "grad_norm": 0.4303963408010303, "learning_rate": 3.1334812690262507e-06, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.247379869222641, "step": 3665, "valid_targets_mean": 4625.3, "valid_targets_min": 1003 }, { "epoch": 5.872, "grad_norm": 0.45709638886257675, "learning_rate": 3.0907327363502084e-06, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.21598784625530243, "step": 3670, "valid_targets_mean": 3449.9, "valid_targets_min": 1054 }, { "epoch": 5.88, "grad_norm": 0.4280225439458205, "learning_rate": 3.0482533776918987e-06, "loss": 0.2411, "loss_nan_ranks": 0, "loss_rank_avg": 0.25824448466300964, "step": 3675, "valid_targets_mean": 4414.6, "valid_targets_min": 875 }, { "epoch": 5.888, "grad_norm": 0.3077675965104222, "learning_rate": 3.0060438692686533e-06, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.1975744068622589, "step": 3680, "valid_targets_mean": 5987.2, "valid_targets_min": 793 }, { "epoch": 5.896, "grad_norm": 0.3403603704565209, "learning_rate": 2.964104883002139e-06, "loss": 0.2161, "loss_nan_ranks": 0, "loss_rank_avg": 0.21167896687984467, "step": 3685, "valid_targets_mean": 5536.9, "valid_targets_min": 871 }, { "epoch": 5.904, "grad_norm": 0.4054315157161449, "learning_rate": 2.9224370865076457e-06, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.25502288341522217, "step": 3690, "valid_targets_mean": 4805.2, "valid_targets_min": 822 }, { "epoch": 5.912, "grad_norm": 0.35789980590099835, "learning_rate": 2.8810411430834716e-06, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.19632747769355774, "step": 3695, "valid_targets_mean": 5478.2, "valid_targets_min": 712 }, { "epoch": 5.92, "grad_norm": 0.6164021351090805, "learning_rate": 2.8399177117003595e-06, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.2608773410320282, "step": 3700, "valid_targets_mean": 2676.1, "valid_targets_min": 944 }, { "epoch": 5.928, "grad_norm": 0.45745995980330256, "learning_rate": 2.7990674469910085e-06, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.21105098724365234, "step": 3705, "valid_targets_mean": 3218.9, "valid_targets_min": 639 }, { "epoch": 5.936, "grad_norm": 0.3710919492928431, "learning_rate": 2.7584909992396515e-06, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.25090497732162476, "step": 3710, "valid_targets_mean": 5523.6, "valid_targets_min": 952 }, { "epoch": 5.944, "grad_norm": 0.3323094252823238, "learning_rate": 2.7181890143716995e-06, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.20140644907951355, "step": 3715, "valid_targets_mean": 6081.9, "valid_targets_min": 1116 }, { "epoch": 5.952, "grad_norm": 0.4718363509817398, "learning_rate": 2.6781621339434717e-06, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.20775261521339417, "step": 3720, "valid_targets_mean": 3344.9, "valid_targets_min": 937 }, { "epoch": 5.96, "grad_norm": 0.3964056160212036, "learning_rate": 2.638410995131966e-06, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.2471739947795868, "step": 3725, "valid_targets_mean": 4901.1, "valid_targets_min": 930 }, { "epoch": 5.968, "grad_norm": 0.3725995303239783, "learning_rate": 2.5989362307247313e-06, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.20092034339904785, "step": 3730, "valid_targets_mean": 4411.7, "valid_targets_min": 770 }, { "epoch": 5.976, "grad_norm": 0.38039589975141935, "learning_rate": 2.5597384691097847e-06, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.21905504167079926, "step": 3735, "valid_targets_mean": 4735.8, "valid_targets_min": 717 }, { "epoch": 5.984, "grad_norm": 0.5842176629456968, "learning_rate": 2.520818334265611e-06, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.2322233021259308, "step": 3740, "valid_targets_mean": 2426.8, "valid_targets_min": 762 }, { "epoch": 5.992, "grad_norm": 0.3974036678792113, "learning_rate": 2.482176445751232e-06, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.23819592595100403, "step": 3745, "valid_targets_mean": 5103.4, "valid_targets_min": 806 }, { "epoch": 6.0, "grad_norm": 0.5999847162525445, "learning_rate": 2.4438134186963415e-06, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.26903235912323, "step": 3750, "valid_targets_mean": 5103.5, "valid_targets_min": 786 }, { "epoch": 6.008, "grad_norm": 0.3349477545342433, "learning_rate": 2.4057298637915105e-06, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.21318253874778748, "step": 3755, "valid_targets_mean": 6269.4, "valid_targets_min": 896 }, { "epoch": 6.016, "grad_norm": 0.4317583641741853, "learning_rate": 2.3679263872784717e-06, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.26914650201797485, "step": 3760, "valid_targets_mean": 4306.1, "valid_targets_min": 810 }, { "epoch": 6.024, "grad_norm": 0.41472298145715747, "learning_rate": 2.330403590940471e-06, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.24200578033924103, "step": 3765, "valid_targets_mean": 4969.2, "valid_targets_min": 864 }, { "epoch": 6.032, "grad_norm": 0.40539356972798346, "learning_rate": 2.2931620720926717e-06, "loss": 0.2365, "loss_nan_ranks": 0, "loss_rank_avg": 0.2599494457244873, "step": 3770, "valid_targets_mean": 5092.1, "valid_targets_min": 1093 }, { "epoch": 6.04, "grad_norm": 0.5024307919648837, "learning_rate": 2.256202423572669e-06, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.24911504983901978, "step": 3775, "valid_targets_mean": 3418.2, "valid_targets_min": 819 }, { "epoch": 6.048, "grad_norm": 0.4439148698555944, "learning_rate": 2.219525233731035e-06, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.22976058721542358, "step": 3780, "valid_targets_mean": 3652.3, "valid_targets_min": 878 }, { "epoch": 6.056, "grad_norm": 0.4025990629518132, "learning_rate": 2.183131086421961e-06, "loss": 0.2193, "loss_nan_ranks": 0, "loss_rank_avg": 0.2216932326555252, "step": 3785, "valid_targets_mean": 4467.1, "valid_targets_min": 651 }, { "epoch": 6.064, "grad_norm": 0.34119261650968813, "learning_rate": 2.1470205609939533e-06, "loss": 0.2269, "loss_nan_ranks": 0, "loss_rank_avg": 0.22316013276576996, "step": 3790, "valid_targets_mean": 5872.5, "valid_targets_min": 743 }, { "epoch": 6.072, "grad_norm": 0.44619413022846166, "learning_rate": 2.1111942322806335e-06, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.22817836701869965, "step": 3795, "valid_targets_mean": 3575.1, "valid_targets_min": 782 }, { "epoch": 6.08, "grad_norm": 0.3574078861297622, "learning_rate": 2.0756526705915635e-06, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.24410027265548706, "step": 3800, "valid_targets_mean": 5989.6, "valid_targets_min": 1000 }, { "epoch": 6.088, "grad_norm": 0.6009272336278385, "learning_rate": 2.0403964417031764e-06, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.23332129418849945, "step": 3805, "valid_targets_mean": 2330.4, "valid_targets_min": 616 }, { "epoch": 6.096, "grad_norm": 0.36144075081920424, "learning_rate": 2.0054261068497773e-06, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.20843176543712616, "step": 3810, "valid_targets_mean": 5203.1, "valid_targets_min": 1022 }, { "epoch": 6.104, "grad_norm": 0.38552202621236137, "learning_rate": 1.9707422227145922e-06, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.22240760922431946, "step": 3815, "valid_targets_mean": 4687.2, "valid_targets_min": 1028 }, { "epoch": 6.112, "grad_norm": 0.41879689644483564, "learning_rate": 1.936345341420924e-06, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.2170860469341278, "step": 3820, "valid_targets_mean": 4666.2, "valid_targets_min": 1176 }, { "epoch": 6.12, "grad_norm": 0.6687266732348552, "learning_rate": 1.9022360105233507e-06, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.2556125521659851, "step": 3825, "valid_targets_mean": 2104.1, "valid_targets_min": 1037 }, { "epoch": 6.128, "grad_norm": 0.34492206038582207, "learning_rate": 1.8684147729990188e-06, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.2455054074525833, "step": 3830, "valid_targets_mean": 6336.3, "valid_targets_min": 1050 }, { "epoch": 6.136, "grad_norm": 0.4159150879186752, "learning_rate": 1.8348821672389893e-06, "loss": 0.2252, "loss_nan_ranks": 0, "loss_rank_avg": 0.225693017244339, "step": 3835, "valid_targets_mean": 4592.3, "valid_targets_min": 1017 }, { "epoch": 6.144, "grad_norm": 0.38859249778164073, "learning_rate": 1.8016387270396784e-06, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.23034977912902832, "step": 3840, "valid_targets_mean": 5167.3, "valid_targets_min": 881 }, { "epoch": 6.152, "grad_norm": 0.3203760106705756, "learning_rate": 1.7686849815943486e-06, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.21037934720516205, "step": 3845, "valid_targets_mean": 6393.3, "valid_targets_min": 919 }, { "epoch": 6.16, "grad_norm": 0.3983227918706389, "learning_rate": 1.7360214554847e-06, "loss": 0.2147, "loss_nan_ranks": 0, "loss_rank_avg": 0.2141357660293579, "step": 3850, "valid_targets_mean": 4325.4, "valid_targets_min": 920 }, { "epoch": 6.168, "grad_norm": 0.3289919821089591, "learning_rate": 1.703648668672495e-06, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.21512682735919952, "step": 3855, "valid_targets_mean": 6087.9, "valid_targets_min": 903 }, { "epoch": 6.176, "grad_norm": 0.43853553740948986, "learning_rate": 1.6715671364913077e-06, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.21846427023410797, "step": 3860, "valid_targets_mean": 3917.2, "valid_targets_min": 899 }, { "epoch": 6.184, "grad_norm": 0.38127578812735524, "learning_rate": 1.6397773696383091e-06, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.21105417609214783, "step": 3865, "valid_targets_mean": 4652.4, "valid_targets_min": 787 }, { "epoch": 6.192, "grad_norm": 0.3396436270940679, "learning_rate": 1.6082798741661321e-06, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.20317316055297852, "step": 3870, "valid_targets_mean": 5430.1, "valid_targets_min": 893 }, { "epoch": 6.2, "grad_norm": 0.38228587817606946, "learning_rate": 1.5770751514748273e-06, "loss": 0.2181, "loss_nan_ranks": 0, "loss_rank_avg": 0.21367615461349487, "step": 3875, "valid_targets_mean": 4672.6, "valid_targets_min": 1012 }, { "epoch": 6.208, "grad_norm": 0.47820322237336815, "learning_rate": 1.5461636983038686e-06, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.21911242604255676, "step": 3880, "valid_targets_mean": 3371.2, "valid_targets_min": 997 }, { "epoch": 6.216, "grad_norm": 0.4399583273624092, "learning_rate": 1.5155460067242578e-06, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.23615899682044983, "step": 3885, "valid_targets_mean": 4043.5, "valid_targets_min": 745 }, { "epoch": 6.224, "grad_norm": 0.3398925492873628, "learning_rate": 1.4852225641306816e-06, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.2137679159641266, "step": 3890, "valid_targets_mean": 5939.5, "valid_targets_min": 830 }, { "epoch": 6.232, "grad_norm": 0.4733714407702554, "learning_rate": 1.4551938532337607e-06, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.2328024059534073, "step": 3895, "valid_targets_mean": 3431.8, "valid_targets_min": 972 }, { "epoch": 6.24, "grad_norm": 0.561178279992971, "learning_rate": 1.4254603520523614e-06, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.21961773931980133, "step": 3900, "valid_targets_mean": 2525.5, "valid_targets_min": 969 }, { "epoch": 6.248, "grad_norm": 0.4741052980704381, "learning_rate": 1.3960225339059875e-06, "loss": 0.2233, "loss_nan_ranks": 0, "loss_rank_avg": 0.23817236721515656, "step": 3905, "valid_targets_mean": 4482.2, "valid_targets_min": 693 }, { "epoch": 6.256, "grad_norm": 0.4411532668736603, "learning_rate": 1.3668808674072409e-06, "loss": 0.2242, "loss_nan_ranks": 0, "loss_rank_avg": 0.2441355437040329, "step": 3910, "valid_targets_mean": 3981.3, "valid_targets_min": 984 }, { "epoch": 6.264, "grad_norm": 0.4003229501442681, "learning_rate": 1.338035816454375e-06, "loss": 0.2119, "loss_nan_ranks": 0, "loss_rank_avg": 0.21280062198638916, "step": 3915, "valid_targets_mean": 4549.2, "valid_targets_min": 1135 }, { "epoch": 6.272, "grad_norm": 0.4571069597331237, "learning_rate": 1.3094878402238887e-06, "loss": 0.2265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2197241187095642, "step": 3920, "valid_targets_mean": 3564.8, "valid_targets_min": 762 }, { "epoch": 6.28, "grad_norm": 0.36182902012131324, "learning_rate": 1.2812373931632371e-06, "loss": 0.2133, "loss_nan_ranks": 0, "loss_rank_avg": 0.23633159697055817, "step": 3925, "valid_targets_mean": 5213.5, "valid_targets_min": 938 }, { "epoch": 6.288, "grad_norm": 0.34785431888006046, "learning_rate": 1.2532849249835932e-06, "loss": 0.2183, "loss_nan_ranks": 0, "loss_rank_avg": 0.20579376816749573, "step": 3930, "valid_targets_mean": 5596.8, "valid_targets_min": 776 }, { "epoch": 6.296, "grad_norm": 0.4114868588415092, "learning_rate": 1.2256308806526774e-06, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.22689789533615112, "step": 3935, "valid_targets_mean": 4300.3, "valid_targets_min": 813 }, { "epoch": 6.304, "grad_norm": 0.39604646648569675, "learning_rate": 1.1982757003876855e-06, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.24964919686317444, "step": 3940, "valid_targets_mean": 5153.9, "valid_targets_min": 711 }, { "epoch": 6.312, "grad_norm": 0.3849772647568709, "learning_rate": 1.1712198196482793e-06, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.26009365916252136, "step": 3945, "valid_targets_mean": 5058.6, "valid_targets_min": 980 }, { "epoch": 6.32, "grad_norm": 0.48211470656475425, "learning_rate": 1.1444636691296518e-06, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.21652325987815857, "step": 3950, "valid_targets_mean": 3130.9, "valid_targets_min": 798 }, { "epoch": 6.328, "grad_norm": 0.5644365548848527, "learning_rate": 1.11800767475567e-06, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.27526530623435974, "step": 3955, "valid_targets_mean": 2978.4, "valid_targets_min": 849 }, { "epoch": 6.336, "grad_norm": 0.40333014592575334, "learning_rate": 1.0918522576721014e-06, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.27383342385292053, "step": 3960, "valid_targets_mean": 5273.9, "valid_targets_min": 630 }, { "epoch": 6.344, "grad_norm": 0.4321759599915463, "learning_rate": 1.0659978342399003e-06, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.24329343438148499, "step": 3965, "valid_targets_mean": 4204.4, "valid_targets_min": 827 }, { "epoch": 6.352, "grad_norm": 0.4489831786268062, "learning_rate": 1.0404448160285897e-06, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.20862233638763428, "step": 3970, "valid_targets_mean": 3446.6, "valid_targets_min": 936 }, { "epoch": 6.36, "grad_norm": 0.6568484958919774, "learning_rate": 1.0151936098097015e-06, "loss": 0.2307, "loss_nan_ranks": 0, "loss_rank_avg": 0.2893434762954712, "step": 3975, "valid_targets_mean": 2431.0, "valid_targets_min": 865 }, { "epoch": 6.368, "grad_norm": 0.436806643140305, "learning_rate": 9.902446175503089e-07, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.21049389243125916, "step": 3980, "valid_targets_mean": 3591.6, "valid_targets_min": 558 }, { "epoch": 6.376, "grad_norm": 0.3733718504908191, "learning_rate": 9.655982364066197e-07, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.19698584079742432, "step": 3985, "valid_targets_mean": 4745.1, "valid_targets_min": 1147 }, { "epoch": 6.384, "grad_norm": 0.56021488352525, "learning_rate": 9.412548587176595e-07, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.21981269121170044, "step": 3990, "valid_targets_mean": 2582.5, "valid_targets_min": 679 }, { "epoch": 6.392, "grad_norm": 0.4255541904342452, "learning_rate": 9.172148719990237e-07, "loss": 0.2134, "loss_nan_ranks": 0, "loss_rank_avg": 0.23671914637088776, "step": 3995, "valid_targets_mean": 4313.3, "valid_targets_min": 752 }, { "epoch": 6.4, "grad_norm": 0.4102539193396227, "learning_rate": 8.934786589367106e-07, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.2218114733695984, "step": 4000, "valid_targets_mean": 4082.2, "valid_targets_min": 787 }, { "epoch": 6.408, "grad_norm": 0.34989430636633106, "learning_rate": 8.700465973810246e-07, "loss": 0.2215, "loss_nan_ranks": 0, "loss_rank_avg": 0.1899658888578415, "step": 4005, "valid_targets_mean": 4683.2, "valid_targets_min": 963 }, { "epoch": 6.416, "grad_norm": 0.5084082139951963, "learning_rate": 8.469190603405719e-07, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.22666466236114502, "step": 4010, "valid_targets_mean": 2856.0, "valid_targets_min": 836 }, { "epoch": 6.424, "grad_norm": 0.38334389778158073, "learning_rate": 8.240964159763121e-07, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.20574325323104858, "step": 4015, "valid_targets_mean": 4797.1, "valid_targets_min": 989 }, { "epoch": 6.432, "grad_norm": 0.43778396216540555, "learning_rate": 8.015790275957003e-07, "loss": 0.2379, "loss_nan_ranks": 0, "loss_rank_avg": 0.2721363604068756, "step": 4020, "valid_targets_mean": 4351.1, "valid_targets_min": 1141 }, { "epoch": 6.44, "grad_norm": 0.42691802245050525, "learning_rate": 7.793672536469077e-07, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.236424520611763, "step": 4025, "valid_targets_mean": 3813.6, "valid_targets_min": 820 }, { "epoch": 6.448, "grad_norm": 0.36072477649308493, "learning_rate": 7.574614477131081e-07, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.18866382539272308, "step": 4030, "valid_targets_mean": 4367.6, "valid_targets_min": 843 }, { "epoch": 6.456, "grad_norm": 0.41123091937206413, "learning_rate": 7.358619585068583e-07, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.23328976333141327, "step": 4035, "valid_targets_mean": 4417.2, "valid_targets_min": 939 }, { "epoch": 6.464, "grad_norm": 0.4254203784811884, "learning_rate": 7.145691298645419e-07, "loss": 0.2186, "loss_nan_ranks": 0, "loss_rank_avg": 0.2179802656173706, "step": 4040, "valid_targets_mean": 3939.2, "valid_targets_min": 946 }, { "epoch": 6.4719999999999995, "grad_norm": 0.39330349529070346, "learning_rate": 6.935833007408965e-07, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.22284376621246338, "step": 4045, "valid_targets_mean": 4508.6, "valid_targets_min": 623 }, { "epoch": 6.48, "grad_norm": 0.44865937037871895, "learning_rate": 6.729048052036136e-07, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.21400213241577148, "step": 4050, "valid_targets_mean": 3500.1, "valid_targets_min": 858 }, { "epoch": 6.4879999999999995, "grad_norm": 0.48021795524832595, "learning_rate": 6.52533972428031e-07, "loss": 0.2178, "loss_nan_ranks": 0, "loss_rank_avg": 0.24885594844818115, "step": 4055, "valid_targets_mean": 3483.8, "valid_targets_min": 971 }, { "epoch": 6.496, "grad_norm": 0.34882215560284985, "learning_rate": 6.324711266918826e-07, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.21410886943340302, "step": 4060, "valid_targets_mean": 5634.1, "valid_targets_min": 991 }, { "epoch": 6.504, "grad_norm": 0.5126446488160206, "learning_rate": 6.127165873701457e-07, "loss": 0.2081, "loss_nan_ranks": 0, "loss_rank_avg": 0.21240456402301788, "step": 4065, "valid_targets_mean": 2864.9, "valid_targets_min": 985 }, { "epoch": 6.5120000000000005, "grad_norm": 0.3140688580026172, "learning_rate": 5.932706689299461e-07, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.21024207770824432, "step": 4070, "valid_targets_mean": 6588.2, "valid_targets_min": 1101 }, { "epoch": 6.52, "grad_norm": 0.4986798403758234, "learning_rate": 5.741336809255615e-07, "loss": 0.2246, "loss_nan_ranks": 0, "loss_rank_avg": 0.22286343574523926, "step": 4075, "valid_targets_mean": 3069.7, "valid_targets_min": 1026 }, { "epoch": 6.5280000000000005, "grad_norm": 0.3921933421532105, "learning_rate": 5.553059279934902e-07, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2469090223312378, "step": 4080, "valid_targets_mean": 4846.6, "valid_targets_min": 741 }, { "epoch": 6.536, "grad_norm": 1.4197403594404054, "learning_rate": 5.36787709847597e-07, "loss": 0.218, "loss_nan_ranks": 0, "loss_rank_avg": 0.21249955892562866, "step": 4085, "valid_targets_mean": 3518.8, "valid_targets_min": 947 }, { "epoch": 6.5440000000000005, "grad_norm": 0.39790011129897357, "learning_rate": 5.185793212743529e-07, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.2455723136663437, "step": 4090, "valid_targets_mean": 4974.9, "valid_targets_min": 833 }, { "epoch": 6.552, "grad_norm": 0.506846713782852, "learning_rate": 5.006810521281335e-07, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.22944439947605133, "step": 4095, "valid_targets_mean": 3162.4, "valid_targets_min": 889 }, { "epoch": 6.5600000000000005, "grad_norm": 0.5304911335607064, "learning_rate": 4.830931873266065e-07, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.228239044547081, "step": 4100, "valid_targets_mean": 2786.3, "valid_targets_min": 655 }, { "epoch": 6.568, "grad_norm": 0.42229465032601937, "learning_rate": 4.658160068462025e-07, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.22529050707817078, "step": 4105, "valid_targets_mean": 4120.8, "valid_targets_min": 924 }, { "epoch": 6.576, "grad_norm": 0.32368728463004987, "learning_rate": 4.488497857176466e-07, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.21758395433425903, "step": 4110, "valid_targets_mean": 6052.4, "valid_targets_min": 890 }, { "epoch": 6.584, "grad_norm": 0.3876726339635795, "learning_rate": 4.321947940215898e-07, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.27703386545181274, "step": 4115, "valid_targets_mean": 5807.9, "valid_targets_min": 955 }, { "epoch": 6.592, "grad_norm": 0.5109155715461828, "learning_rate": 4.1585129688430425e-07, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.2829819321632385, "step": 4120, "valid_targets_mean": 3333.1, "valid_targets_min": 867 }, { "epoch": 6.6, "grad_norm": 0.4470302028073575, "learning_rate": 3.998195544734706e-07, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.24119625985622406, "step": 4125, "valid_targets_mean": 4098.7, "valid_targets_min": 1055 }, { "epoch": 6.608, "grad_norm": 0.3879001559853112, "learning_rate": 3.840998219940284e-07, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.23125238716602325, "step": 4130, "valid_targets_mean": 4793.9, "valid_targets_min": 995 }, { "epoch": 6.616, "grad_norm": 0.3390815157643552, "learning_rate": 3.6869234968411214e-07, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.21983827650547028, "step": 4135, "valid_targets_mean": 5686.7, "valid_targets_min": 931 }, { "epoch": 6.624, "grad_norm": 0.48742691434984764, "learning_rate": 3.5359738281107504e-07, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.23688867688179016, "step": 4140, "valid_targets_mean": 3576.5, "valid_targets_min": 877 }, { "epoch": 6.632, "grad_norm": 0.5825891651795995, "learning_rate": 3.38815161667585e-07, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.2347678393125534, "step": 4145, "valid_targets_mean": 2693.6, "valid_targets_min": 857 }, { "epoch": 6.64, "grad_norm": 0.33240965337871686, "learning_rate": 3.24345921567788e-07, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.22942331433296204, "step": 4150, "valid_targets_mean": 6286.4, "valid_targets_min": 1070 }, { "epoch": 6.648, "grad_norm": 0.47442097754914475, "learning_rate": 3.101898928435754e-07, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.2143860161304474, "step": 4155, "valid_targets_mean": 2954.4, "valid_targets_min": 1049 }, { "epoch": 6.656, "grad_norm": 0.47947322659482045, "learning_rate": 2.9634730084091343e-07, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.22327253222465515, "step": 4160, "valid_targets_mean": 3591.6, "valid_targets_min": 942 }, { "epoch": 6.664, "grad_norm": 0.4454312428655186, "learning_rate": 2.8281836591624865e-07, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.22166194021701813, "step": 4165, "valid_targets_mean": 3687.9, "valid_targets_min": 710 }, { "epoch": 6.672, "grad_norm": 0.4171522266163402, "learning_rate": 2.6960330343301033e-07, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.23376452922821045, "step": 4170, "valid_targets_mean": 4033.3, "valid_targets_min": 978 }, { "epoch": 6.68, "grad_norm": 0.4021870631095099, "learning_rate": 2.5670232375817784e-07, "loss": 0.2115, "loss_nan_ranks": 0, "loss_rank_avg": 0.19755598902702332, "step": 4175, "valid_targets_mean": 4376.8, "valid_targets_min": 690 }, { "epoch": 6.688, "grad_norm": 0.4432006157292327, "learning_rate": 2.441156322589322e-07, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.2194088101387024, "step": 4180, "valid_targets_mean": 3696.2, "valid_targets_min": 937 }, { "epoch": 6.696, "grad_norm": 0.3533442609966585, "learning_rate": 2.318434292993832e-07, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.22602006793022156, "step": 4185, "valid_targets_mean": 5390.4, "valid_targets_min": 952 }, { "epoch": 6.704, "grad_norm": 0.5451719228606399, "learning_rate": 2.1988591023738514e-07, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.23980574309825897, "step": 4190, "valid_targets_mean": 2911.3, "valid_targets_min": 756 }, { "epoch": 6.712, "grad_norm": 0.3356047849602916, "learning_rate": 2.0824326542142835e-07, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.18571820855140686, "step": 4195, "valid_targets_mean": 5152.4, "valid_targets_min": 1057 }, { "epoch": 6.72, "grad_norm": 0.5229315558444865, "learning_rate": 1.9691568018759931e-07, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.277045339345932, "step": 4200, "valid_targets_mean": 3369.2, "valid_targets_min": 805 }, { "epoch": 6.728, "grad_norm": 0.3325315865260218, "learning_rate": 1.8590333485664525e-07, "loss": 0.2141, "loss_nan_ranks": 0, "loss_rank_avg": 0.2092788815498352, "step": 4205, "valid_targets_mean": 5736.8, "valid_targets_min": 972 }, { "epoch": 6.736, "grad_norm": 0.467439774714686, "learning_rate": 1.752064047310853e-07, "loss": 0.2197, "loss_nan_ranks": 0, "loss_rank_avg": 0.23705033957958221, "step": 4210, "valid_targets_mean": 3690.5, "valid_targets_min": 852 }, { "epoch": 6.744, "grad_norm": 0.6183840075760885, "learning_rate": 1.6482506009243949e-07, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.22905892133712769, "step": 4215, "valid_targets_mean": 2088.2, "valid_targets_min": 810 }, { "epoch": 6.752, "grad_norm": 0.3342422145961255, "learning_rate": 1.5475946619850192e-07, "loss": 0.2206, "loss_nan_ranks": 0, "loss_rank_avg": 0.20969925820827484, "step": 4220, "valid_targets_mean": 5836.8, "valid_targets_min": 1020 }, { "epoch": 6.76, "grad_norm": 0.34624668633463707, "learning_rate": 1.4500978328071845e-07, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.22905424237251282, "step": 4225, "valid_targets_mean": 5463.2, "valid_targets_min": 732 }, { "epoch": 6.768, "grad_norm": 0.4420870260003288, "learning_rate": 1.3557616654163775e-07, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.223080113530159, "step": 4230, "valid_targets_mean": 3664.9, "valid_targets_min": 826 }, { "epoch": 6.776, "grad_norm": 0.5518275111575168, "learning_rate": 1.264587661524308e-07, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.22578661143779755, "step": 4235, "valid_targets_mean": 2675.6, "valid_targets_min": 966 }, { "epoch": 6.784, "grad_norm": 0.4049368287917327, "learning_rate": 1.1765772725051084e-07, "loss": 0.2131, "loss_nan_ranks": 0, "loss_rank_avg": 0.21148250997066498, "step": 4240, "valid_targets_mean": 4096.6, "valid_targets_min": 877 }, { "epoch": 6.792, "grad_norm": 0.4040442168660199, "learning_rate": 1.0917318993721726e-07, "loss": 0.2192, "loss_nan_ranks": 0, "loss_rank_avg": 0.21757608652114868, "step": 4245, "valid_targets_mean": 4106.6, "valid_targets_min": 657 }, { "epoch": 6.8, "grad_norm": 0.4656238469376599, "learning_rate": 1.0100528927558861e-07, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.20843830704689026, "step": 4250, "valid_targets_mean": 3208.7, "valid_targets_min": 952 }, { "epoch": 6.808, "grad_norm": 0.42442223312996796, "learning_rate": 9.31541552882087e-08, "loss": 0.2299, "loss_nan_ranks": 0, "loss_rank_avg": 0.25054430961608887, "step": 4255, "valid_targets_mean": 4431.4, "valid_targets_min": 932 }, { "epoch": 6.816, "grad_norm": 0.5254292888858535, "learning_rate": 8.561991295514161e-08, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.23713023960590363, "step": 4260, "valid_targets_mean": 3043.6, "valid_targets_min": 793 }, { "epoch": 6.824, "grad_norm": 0.4371339395015146, "learning_rate": 7.840268221193548e-08, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.23466908931732178, "step": 4265, "valid_targets_mean": 3946.0, "valid_targets_min": 874 }, { "epoch": 6.832, "grad_norm": 0.35973979810814993, "learning_rate": 7.150257794772186e-08, "loss": 0.2068, "loss_nan_ranks": 0, "loss_rank_avg": 0.21603873372077942, "step": 4270, "valid_targets_mean": 5114.9, "valid_targets_min": 1057 }, { "epoch": 6.84, "grad_norm": 0.3711213623529721, "learning_rate": 6.491971000337938e-08, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.21824629604816437, "step": 4275, "valid_targets_mean": 4986.2, "valid_targets_min": 934 }, { "epoch": 6.848, "grad_norm": 0.4906868870974589, "learning_rate": 5.8654183169788435e-08, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.23453839123249054, "step": 4280, "valid_targets_mean": 3274.4, "valid_targets_min": 1037 }, { "epoch": 6.856, "grad_norm": 0.5003819660470424, "learning_rate": 5.270609718616593e-08, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.23117989301681519, "step": 4285, "valid_targets_mean": 3046.3, "valid_targets_min": 887 }, { "epoch": 6.864, "grad_norm": 0.5538836489378799, "learning_rate": 4.70755467384687e-08, "loss": 0.2238, "loss_nan_ranks": 0, "loss_rank_avg": 0.22990688681602478, "step": 4290, "valid_targets_mean": 2669.9, "valid_targets_min": 722 }, { "epoch": 6.872, "grad_norm": 0.3339220377327871, "learning_rate": 4.176262145789478e-08, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.19378703832626343, "step": 4295, "valid_targets_mean": 5727.6, "valid_targets_min": 1068 }, { "epoch": 6.88, "grad_norm": 0.36779708232161507, "learning_rate": 3.676740591945782e-08, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.2007201462984085, "step": 4300, "valid_targets_mean": 4660.1, "valid_targets_min": 587 }, { "epoch": 6.888, "grad_norm": 0.416473109709361, "learning_rate": 3.208997964062821e-08, "loss": 0.2258, "loss_nan_ranks": 0, "loss_rank_avg": 0.23714400827884674, "step": 4305, "valid_targets_mean": 4501.4, "valid_targets_min": 1129 }, { "epoch": 6.896, "grad_norm": 0.3816242071018597, "learning_rate": 2.773041708008295e-08, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.2064952254295349, "step": 4310, "valid_targets_mean": 4667.4, "valid_targets_min": 712 }, { "epoch": 6.904, "grad_norm": 0.3988685178845027, "learning_rate": 2.3688787636511057e-08, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.2150478959083557, "step": 4315, "valid_targets_mean": 3976.9, "valid_targets_min": 942 }, { "epoch": 6.912, "grad_norm": 0.4016474848255541, "learning_rate": 1.9965155647507782e-08, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.2176404893398285, "step": 4320, "valid_targets_mean": 4303.1, "valid_targets_min": 921 }, { "epoch": 6.92, "grad_norm": 0.37224492037629603, "learning_rate": 1.655958038855765e-08, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.19105198979377747, "step": 4325, "valid_targets_mean": 4631.8, "valid_targets_min": 1050 }, { "epoch": 6.928, "grad_norm": 0.4229429441256482, "learning_rate": 1.3472116072084096e-08, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.22886265814304352, "step": 4330, "valid_targets_mean": 4466.5, "valid_targets_min": 1187 }, { "epoch": 6.936, "grad_norm": 0.3238044486735016, "learning_rate": 1.0702811846590167e-08, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.20526066422462463, "step": 4335, "valid_targets_mean": 6032.8, "valid_targets_min": 770 }, { "epoch": 6.944, "grad_norm": 0.405352461983432, "learning_rate": 8.251711795876916e-09, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.20454303920269012, "step": 4340, "valid_targets_mean": 4101.2, "valid_targets_min": 1081 }, { "epoch": 6.952, "grad_norm": 0.5254957752257481, "learning_rate": 6.1188549383373044e-09, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.20966967940330505, "step": 4345, "valid_targets_mean": 2603.4, "valid_targets_min": 856 }, { "epoch": 6.96, "grad_norm": 0.4987226166041217, "learning_rate": 4.304275226338916e-09, "loss": 0.2181, "loss_nan_ranks": 0, "loss_rank_avg": 0.20376208424568176, "step": 4350, "valid_targets_mean": 3057.9, "valid_targets_min": 852 }, { "epoch": 6.968, "grad_norm": 0.4147630934098896, "learning_rate": 2.8080015456799503e-09, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.22926411032676697, "step": 4355, "valid_targets_mean": 4151.9, "valid_targets_min": 662 }, { "epoch": 6.976, "grad_norm": 0.4327182545700865, "learning_rate": 1.6300577151340257e-09, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.21291124820709229, "step": 4360, "valid_targets_mean": 3751.6, "valid_targets_min": 860 }, { "epoch": 6.984, "grad_norm": 0.3961055234395137, "learning_rate": 7.70462486070489e-10, "loss": 0.2178, "loss_nan_ranks": 0, "loss_rank_avg": 0.21084696054458618, "step": 4365, "valid_targets_mean": 4619.8, "valid_targets_min": 988 }, { "epoch": 6.992, "grad_norm": 0.4419544854529956, "learning_rate": 2.2922954214799065e-10, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.23672346770763397, "step": 4370, "valid_targets_mean": 3912.4, "valid_targets_min": 955 }, { "epoch": 7.0, "grad_norm": 0.4194586140813968, "learning_rate": 6.367499107984288e-12, "loss": 0.2104, "loss_nan_ranks": 0, "loss_rank_avg": 0.24523112177848816, "step": 4375, "valid_targets_mean": 4153.5, "valid_targets_min": 836 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.24523112177848816, "step": 4375, "total_flos": 785288333426688.0, "train_loss": 0.2574095404761178, "train_runtime": 17825.8409, "train_samples_per_second": 3.926, "train_steps_per_second": 0.245, "valid_targets_mean": 4153.5, "valid_targets_min": 836 } ], "logging_steps": 5, "max_steps": 4375, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 785288333426688.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }