{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 6664, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.005252100840336135, "grad_norm": 14.420694283658325, "learning_rate": 2.39880059970015e-07, "loss": 0.8126, "loss_nan_ranks": 0, "loss_rank_avg": 0.790475606918335, "step": 5, "valid_targets_mean": 1423.4, "valid_targets_min": 715 }, { "epoch": 0.01050420168067227, "grad_norm": 15.311496330131531, "learning_rate": 5.397301349325338e-07, "loss": 0.8157, "loss_nan_ranks": 0, "loss_rank_avg": 0.8297374248504639, "step": 10, "valid_targets_mean": 1407.8, "valid_targets_min": 612 }, { "epoch": 0.015756302521008403, "grad_norm": 13.45958528833613, "learning_rate": 8.395802098950526e-07, "loss": 0.7879, "loss_nan_ranks": 0, "loss_rank_avg": 0.7610906362533569, "step": 15, "valid_targets_mean": 1413.5, "valid_targets_min": 714 }, { "epoch": 0.02100840336134454, "grad_norm": 11.905230272753508, "learning_rate": 1.1394302848575713e-06, "loss": 0.7735, "loss_nan_ranks": 0, "loss_rank_avg": 0.753049373626709, "step": 20, "valid_targets_mean": 1450.1, "valid_targets_min": 754 }, { "epoch": 0.026260504201680673, "grad_norm": 9.744011308309286, "learning_rate": 1.43928035982009e-06, "loss": 0.744, "loss_nan_ranks": 0, "loss_rank_avg": 0.7382731437683105, "step": 25, "valid_targets_mean": 1481.1, "valid_targets_min": 718 }, { "epoch": 0.031512605042016806, "grad_norm": 7.094821641510122, "learning_rate": 1.7391304347826088e-06, "loss": 0.7128, "loss_nan_ranks": 0, "loss_rank_avg": 0.6914137601852417, "step": 30, "valid_targets_mean": 1530.8, "valid_targets_min": 731 }, { "epoch": 0.03676470588235294, "grad_norm": 6.368906220458843, "learning_rate": 2.0389805097451275e-06, "loss": 0.6643, "loss_nan_ranks": 0, "loss_rank_avg": 0.6466853022575378, "step": 35, "valid_targets_mean": 1416.6, "valid_targets_min": 725 }, { "epoch": 0.04201680672268908, "grad_norm": 5.399102696758742, "learning_rate": 2.3388305847076464e-06, "loss": 0.6382, "loss_nan_ranks": 0, "loss_rank_avg": 0.6274276971817017, "step": 40, "valid_targets_mean": 1371.5, "valid_targets_min": 610 }, { "epoch": 0.04726890756302521, "grad_norm": 4.306253658085107, "learning_rate": 2.6386806596701653e-06, "loss": 0.5772, "loss_nan_ranks": 0, "loss_rank_avg": 0.5616586208343506, "step": 45, "valid_targets_mean": 1484.7, "valid_targets_min": 720 }, { "epoch": 0.052521008403361345, "grad_norm": 3.7077951595748515, "learning_rate": 2.9385307346326843e-06, "loss": 0.527, "loss_nan_ranks": 0, "loss_rank_avg": 0.4847095012664795, "step": 50, "valid_targets_mean": 1365.5, "valid_targets_min": 765 }, { "epoch": 0.05777310924369748, "grad_norm": 2.363263225041768, "learning_rate": 3.2383808095952024e-06, "loss": 0.4935, "loss_nan_ranks": 0, "loss_rank_avg": 0.5059503316879272, "step": 55, "valid_targets_mean": 1234.7, "valid_targets_min": 593 }, { "epoch": 0.06302521008403361, "grad_norm": 1.6467637243933408, "learning_rate": 3.5382308845577213e-06, "loss": 0.4679, "loss_nan_ranks": 0, "loss_rank_avg": 0.44630974531173706, "step": 60, "valid_targets_mean": 1540.4, "valid_targets_min": 704 }, { "epoch": 0.06827731092436974, "grad_norm": 1.5411024922038776, "learning_rate": 3.83808095952024e-06, "loss": 0.4446, "loss_nan_ranks": 0, "loss_rank_avg": 0.41912999749183655, "step": 65, "valid_targets_mean": 1329.9, "valid_targets_min": 722 }, { "epoch": 0.07352941176470588, "grad_norm": 1.244534525186305, "learning_rate": 4.137931034482759e-06, "loss": 0.4205, "loss_nan_ranks": 0, "loss_rank_avg": 0.39288026094436646, "step": 70, "valid_targets_mean": 1549.6, "valid_targets_min": 865 }, { "epoch": 0.07878151260504201, "grad_norm": 1.1996703760120404, "learning_rate": 4.437781109445278e-06, "loss": 0.4055, "loss_nan_ranks": 0, "loss_rank_avg": 0.40949755907058716, "step": 75, "valid_targets_mean": 1507.4, "valid_targets_min": 797 }, { "epoch": 0.08403361344537816, "grad_norm": 1.2896717545023444, "learning_rate": 4.737631184407796e-06, "loss": 0.4011, "loss_nan_ranks": 0, "loss_rank_avg": 0.43845802545547485, "step": 80, "valid_targets_mean": 1542.4, "valid_targets_min": 728 }, { "epoch": 0.08928571428571429, "grad_norm": 1.0177436395323942, "learning_rate": 5.037481259370315e-06, "loss": 0.3951, "loss_nan_ranks": 0, "loss_rank_avg": 0.38916561007499695, "step": 85, "valid_targets_mean": 1595.2, "valid_targets_min": 683 }, { "epoch": 0.09453781512605042, "grad_norm": 1.9249372968791647, "learning_rate": 5.337331334332834e-06, "loss": 0.3869, "loss_nan_ranks": 0, "loss_rank_avg": 0.39647072553634644, "step": 90, "valid_targets_mean": 1401.6, "valid_targets_min": 706 }, { "epoch": 0.09978991596638656, "grad_norm": 1.284016705259006, "learning_rate": 5.6371814092953526e-06, "loss": 0.3607, "loss_nan_ranks": 0, "loss_rank_avg": 0.3547477126121521, "step": 95, "valid_targets_mean": 1298.4, "valid_targets_min": 625 }, { "epoch": 0.10504201680672269, "grad_norm": 1.0443779966069502, "learning_rate": 5.937031484257871e-06, "loss": 0.3572, "loss_nan_ranks": 0, "loss_rank_avg": 0.35236796736717224, "step": 100, "valid_targets_mean": 1659.7, "valid_targets_min": 790 }, { "epoch": 0.11029411764705882, "grad_norm": 1.0855951515574154, "learning_rate": 6.2368815592203904e-06, "loss": 0.3587, "loss_nan_ranks": 0, "loss_rank_avg": 0.3708180785179138, "step": 105, "valid_targets_mean": 1600.4, "valid_targets_min": 684 }, { "epoch": 0.11554621848739496, "grad_norm": 1.1032891548957378, "learning_rate": 6.536731634182909e-06, "loss": 0.3475, "loss_nan_ranks": 0, "loss_rank_avg": 0.322293221950531, "step": 110, "valid_targets_mean": 1338.3, "valid_targets_min": 739 }, { "epoch": 0.1207983193277311, "grad_norm": 0.9768878378529005, "learning_rate": 6.8365817091454274e-06, "loss": 0.3369, "loss_nan_ranks": 0, "loss_rank_avg": 0.3234562277793884, "step": 115, "valid_targets_mean": 1456.2, "valid_targets_min": 657 }, { "epoch": 0.12605042016806722, "grad_norm": 1.0487060724275885, "learning_rate": 7.136431784107947e-06, "loss": 0.329, "loss_nan_ranks": 0, "loss_rank_avg": 0.32765859365463257, "step": 120, "valid_targets_mean": 1340.2, "valid_targets_min": 783 }, { "epoch": 0.13130252100840337, "grad_norm": 1.1049013021741143, "learning_rate": 7.436281859070465e-06, "loss": 0.3235, "loss_nan_ranks": 0, "loss_rank_avg": 0.31769877672195435, "step": 125, "valid_targets_mean": 1394.4, "valid_targets_min": 734 }, { "epoch": 0.13655462184873948, "grad_norm": 1.0426803049134692, "learning_rate": 7.736131934032984e-06, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.3211321234703064, "step": 130, "valid_targets_mean": 1501.8, "valid_targets_min": 678 }, { "epoch": 0.14180672268907563, "grad_norm": 1.0513598327816873, "learning_rate": 8.035982008995503e-06, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.31629741191864014, "step": 135, "valid_targets_mean": 1651.7, "valid_targets_min": 843 }, { "epoch": 0.14705882352941177, "grad_norm": 1.0551559578309457, "learning_rate": 8.335832083958023e-06, "loss": 0.3204, "loss_nan_ranks": 0, "loss_rank_avg": 0.3266269564628601, "step": 140, "valid_targets_mean": 1632.1, "valid_targets_min": 782 }, { "epoch": 0.15231092436974789, "grad_norm": 0.9612333107113046, "learning_rate": 8.63568215892054e-06, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.33223849534988403, "step": 145, "valid_targets_mean": 1615.3, "valid_targets_min": 957 }, { "epoch": 0.15756302521008403, "grad_norm": 1.0081404887340868, "learning_rate": 8.93553223388306e-06, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.32516705989837646, "step": 150, "valid_targets_mean": 1482.9, "valid_targets_min": 713 }, { "epoch": 0.16281512605042017, "grad_norm": 1.0468696423891182, "learning_rate": 9.235382308845579e-06, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.3112391531467438, "step": 155, "valid_targets_mean": 1552.8, "valid_targets_min": 726 }, { "epoch": 0.16806722689075632, "grad_norm": 0.9973569578712165, "learning_rate": 9.535232383808097e-06, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.2998279333114624, "step": 160, "valid_targets_mean": 1590.4, "valid_targets_min": 1147 }, { "epoch": 0.17331932773109243, "grad_norm": 1.2443677749688786, "learning_rate": 9.835082458770614e-06, "loss": 0.2954, "loss_nan_ranks": 0, "loss_rank_avg": 0.30380943417549133, "step": 165, "valid_targets_mean": 1417.6, "valid_targets_min": 700 }, { "epoch": 0.17857142857142858, "grad_norm": 1.1254552821617871, "learning_rate": 1.0134932533733135e-05, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.2681633234024048, "step": 170, "valid_targets_mean": 1255.4, "valid_targets_min": 640 }, { "epoch": 0.18382352941176472, "grad_norm": 0.9851494239413889, "learning_rate": 1.0434782608695653e-05, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.2868928611278534, "step": 175, "valid_targets_mean": 1566.6, "valid_targets_min": 817 }, { "epoch": 0.18907563025210083, "grad_norm": 1.098473835442716, "learning_rate": 1.0734632683658172e-05, "loss": 0.286, "loss_nan_ranks": 0, "loss_rank_avg": 0.27357298135757446, "step": 180, "valid_targets_mean": 1440.9, "valid_targets_min": 724 }, { "epoch": 0.19432773109243698, "grad_norm": 1.1557321572729486, "learning_rate": 1.103448275862069e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.29238957166671753, "step": 185, "valid_targets_mean": 1399.1, "valid_targets_min": 657 }, { "epoch": 0.19957983193277312, "grad_norm": 1.1396871077620272, "learning_rate": 1.1334332833583211e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.2987218499183655, "step": 190, "valid_targets_mean": 1334.3, "valid_targets_min": 746 }, { "epoch": 0.20483193277310924, "grad_norm": 1.1178689873643397, "learning_rate": 1.1634182908545729e-05, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.33798643946647644, "step": 195, "valid_targets_mean": 1452.8, "valid_targets_min": 692 }, { "epoch": 0.21008403361344538, "grad_norm": 1.0854720395667985, "learning_rate": 1.1934032983508246e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.25798511505126953, "step": 200, "valid_targets_mean": 1338.4, "valid_targets_min": 682 }, { "epoch": 0.21533613445378152, "grad_norm": 1.1508679180169188, "learning_rate": 1.2233883058470766e-05, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.276319682598114, "step": 205, "valid_targets_mean": 1360.2, "valid_targets_min": 703 }, { "epoch": 0.22058823529411764, "grad_norm": 0.990266456581399, "learning_rate": 1.2533733133433283e-05, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.2741560935974121, "step": 210, "valid_targets_mean": 1520.9, "valid_targets_min": 864 }, { "epoch": 0.22584033613445378, "grad_norm": 0.9411807898115928, "learning_rate": 1.2833583208395803e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.3527371883392334, "step": 215, "valid_targets_mean": 1814.6, "valid_targets_min": 734 }, { "epoch": 0.23109243697478993, "grad_norm": 0.9509244068358998, "learning_rate": 1.313343328335832e-05, "loss": 0.2758, "loss_nan_ranks": 0, "loss_rank_avg": 0.27980518341064453, "step": 220, "valid_targets_mean": 1478.3, "valid_targets_min": 607 }, { "epoch": 0.23634453781512604, "grad_norm": 0.9802646448806872, "learning_rate": 1.3433283358320841e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.2757881283760071, "step": 225, "valid_targets_mean": 1497.9, "valid_targets_min": 551 }, { "epoch": 0.2415966386554622, "grad_norm": 1.1416789358107773, "learning_rate": 1.3733133433283359e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.2863280773162842, "step": 230, "valid_targets_mean": 1550.5, "valid_targets_min": 676 }, { "epoch": 0.24684873949579833, "grad_norm": 1.2243896073517977, "learning_rate": 1.4032983508245878e-05, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.2647148370742798, "step": 235, "valid_targets_mean": 1372.5, "valid_targets_min": 904 }, { "epoch": 0.25210084033613445, "grad_norm": 1.0671177129673626, "learning_rate": 1.4332833583208396e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.2796405553817749, "step": 240, "valid_targets_mean": 1479.0, "valid_targets_min": 859 }, { "epoch": 0.25735294117647056, "grad_norm": 1.1155587555825344, "learning_rate": 1.4632683658170917e-05, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.2673705816268921, "step": 245, "valid_targets_mean": 1234.8, "valid_targets_min": 737 }, { "epoch": 0.26260504201680673, "grad_norm": 1.0111523665697042, "learning_rate": 1.4932533733133435e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.3024107813835144, "step": 250, "valid_targets_mean": 1363.2, "valid_targets_min": 791 }, { "epoch": 0.26785714285714285, "grad_norm": 0.9398095246969382, "learning_rate": 1.5232383808095954e-05, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.28389376401901245, "step": 255, "valid_targets_mean": 1532.1, "valid_targets_min": 786 }, { "epoch": 0.27310924369747897, "grad_norm": 0.9520954006331536, "learning_rate": 1.5532233883058472e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.262344628572464, "step": 260, "valid_targets_mean": 1471.0, "valid_targets_min": 944 }, { "epoch": 0.27836134453781514, "grad_norm": 0.9231810982153198, "learning_rate": 1.5832083958020993e-05, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.25394904613494873, "step": 265, "valid_targets_mean": 1494.1, "valid_targets_min": 1075 }, { "epoch": 0.28361344537815125, "grad_norm": 1.036465235131244, "learning_rate": 1.613193403298351e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.2542717456817627, "step": 270, "valid_targets_mean": 1340.9, "valid_targets_min": 740 }, { "epoch": 0.28886554621848737, "grad_norm": 0.969535346268365, "learning_rate": 1.6431784107946028e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.2644956707954407, "step": 275, "valid_targets_mean": 1530.9, "valid_targets_min": 727 }, { "epoch": 0.29411764705882354, "grad_norm": 1.095458178867704, "learning_rate": 1.6731634182908546e-05, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.2714339792728424, "step": 280, "valid_targets_mean": 1233.0, "valid_targets_min": 636 }, { "epoch": 0.29936974789915966, "grad_norm": 0.989855094627666, "learning_rate": 1.7031484257871064e-05, "loss": 0.2571, "loss_nan_ranks": 0, "loss_rank_avg": 0.2507407069206238, "step": 285, "valid_targets_mean": 1246.8, "valid_targets_min": 684 }, { "epoch": 0.30462184873949577, "grad_norm": 1.0834380820761222, "learning_rate": 1.7331334332833585e-05, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.26474529504776, "step": 290, "valid_targets_mean": 1392.5, "valid_targets_min": 798 }, { "epoch": 0.30987394957983194, "grad_norm": 1.035539563074315, "learning_rate": 1.7631184407796102e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.24842077493667603, "step": 295, "valid_targets_mean": 1319.9, "valid_targets_min": 661 }, { "epoch": 0.31512605042016806, "grad_norm": 1.0392297368060632, "learning_rate": 1.7931034482758623e-05, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.2532370090484619, "step": 300, "valid_targets_mean": 1554.4, "valid_targets_min": 665 }, { "epoch": 0.32037815126050423, "grad_norm": 1.1437803903133303, "learning_rate": 1.823088455772114e-05, "loss": 0.2547, "loss_nan_ranks": 0, "loss_rank_avg": 0.26745492219924927, "step": 305, "valid_targets_mean": 1417.8, "valid_targets_min": 692 }, { "epoch": 0.32563025210084034, "grad_norm": 1.0470695391841682, "learning_rate": 1.853073463268366e-05, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.27369868755340576, "step": 310, "valid_targets_mean": 1223.8, "valid_targets_min": 632 }, { "epoch": 0.33088235294117646, "grad_norm": 0.99682750228871, "learning_rate": 1.8830584707646176e-05, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.2700139284133911, "step": 315, "valid_targets_mean": 1550.6, "valid_targets_min": 922 }, { "epoch": 0.33613445378151263, "grad_norm": 0.9922010090048154, "learning_rate": 1.9130434782608697e-05, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.23878350853919983, "step": 320, "valid_targets_mean": 1542.2, "valid_targets_min": 710 }, { "epoch": 0.34138655462184875, "grad_norm": 0.9969922099846812, "learning_rate": 1.9430284857571215e-05, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.24636775255203247, "step": 325, "valid_targets_mean": 1390.6, "valid_targets_min": 750 }, { "epoch": 0.34663865546218486, "grad_norm": 0.9249347847273258, "learning_rate": 1.9730134932533736e-05, "loss": 0.2576, "loss_nan_ranks": 0, "loss_rank_avg": 0.25145918130874634, "step": 330, "valid_targets_mean": 1515.5, "valid_targets_min": 766 }, { "epoch": 0.35189075630252103, "grad_norm": 0.9954869233754978, "learning_rate": 2.0029985007496254e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.23031079769134521, "step": 335, "valid_targets_mean": 1333.3, "valid_targets_min": 748 }, { "epoch": 0.35714285714285715, "grad_norm": 1.0229626657604847, "learning_rate": 2.0329835082458775e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.2601286470890045, "step": 340, "valid_targets_mean": 1395.2, "valid_targets_min": 682 }, { "epoch": 0.36239495798319327, "grad_norm": 0.9742753314709449, "learning_rate": 2.0629685157421292e-05, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.2516604959964752, "step": 345, "valid_targets_mean": 1515.6, "valid_targets_min": 738 }, { "epoch": 0.36764705882352944, "grad_norm": 1.0984493157523587, "learning_rate": 2.092953523238381e-05, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.26009607315063477, "step": 350, "valid_targets_mean": 1312.8, "valid_targets_min": 731 }, { "epoch": 0.37289915966386555, "grad_norm": 1.0124670927846027, "learning_rate": 2.1229385307346328e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.2756904661655426, "step": 355, "valid_targets_mean": 1492.9, "valid_targets_min": 646 }, { "epoch": 0.37815126050420167, "grad_norm": 0.9303311281634132, "learning_rate": 2.152923538230885e-05, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.23849308490753174, "step": 360, "valid_targets_mean": 1369.1, "valid_targets_min": 780 }, { "epoch": 0.38340336134453784, "grad_norm": 0.938627487391855, "learning_rate": 2.1829085457271363e-05, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.24323752522468567, "step": 365, "valid_targets_mean": 1521.9, "valid_targets_min": 676 }, { "epoch": 0.38865546218487396, "grad_norm": 1.0170934463633303, "learning_rate": 2.2128935532233884e-05, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.23910865187644958, "step": 370, "valid_targets_mean": 1277.9, "valid_targets_min": 687 }, { "epoch": 0.3939075630252101, "grad_norm": 0.9747309964507797, "learning_rate": 2.2428785607196405e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.2347027212381363, "step": 375, "valid_targets_mean": 1336.5, "valid_targets_min": 703 }, { "epoch": 0.39915966386554624, "grad_norm": 1.0544024939800751, "learning_rate": 2.2728635682158923e-05, "loss": 0.2461, "loss_nan_ranks": 0, "loss_rank_avg": 0.22451592981815338, "step": 380, "valid_targets_mean": 1288.1, "valid_targets_min": 522 }, { "epoch": 0.40441176470588236, "grad_norm": 1.0293634003316077, "learning_rate": 2.302848575712144e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.2373955398797989, "step": 385, "valid_targets_mean": 1526.9, "valid_targets_min": 764 }, { "epoch": 0.4096638655462185, "grad_norm": 1.0510698011217983, "learning_rate": 2.3328335832083958e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.272568941116333, "step": 390, "valid_targets_mean": 1372.4, "valid_targets_min": 548 }, { "epoch": 0.41491596638655465, "grad_norm": 1.0256066743434804, "learning_rate": 2.362818590704648e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508437931537628, "step": 395, "valid_targets_mean": 1356.8, "valid_targets_min": 694 }, { "epoch": 0.42016806722689076, "grad_norm": 0.918276243513663, "learning_rate": 2.3928035982009e-05, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.26278817653656006, "step": 400, "valid_targets_mean": 1540.9, "valid_targets_min": 823 }, { "epoch": 0.4254201680672269, "grad_norm": 0.829017462865176, "learning_rate": 2.4227886056971515e-05, "loss": 0.2182, "loss_nan_ranks": 0, "loss_rank_avg": 0.1897987425327301, "step": 405, "valid_targets_mean": 1442.4, "valid_targets_min": 682 }, { "epoch": 0.43067226890756305, "grad_norm": 1.009337402964787, "learning_rate": 2.4527736131934036e-05, "loss": 0.2422, "loss_nan_ranks": 0, "loss_rank_avg": 0.25567498803138733, "step": 410, "valid_targets_mean": 1407.6, "valid_targets_min": 693 }, { "epoch": 0.43592436974789917, "grad_norm": 1.102110069443316, "learning_rate": 2.4827586206896553e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.22340771555900574, "step": 415, "valid_targets_mean": 1197.8, "valid_targets_min": 639 }, { "epoch": 0.4411764705882353, "grad_norm": 0.9439286600674722, "learning_rate": 2.5127436281859074e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.22316749393939972, "step": 420, "valid_targets_mean": 1423.3, "valid_targets_min": 685 }, { "epoch": 0.44642857142857145, "grad_norm": 0.9288887022810997, "learning_rate": 2.542728635682159e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.22205528616905212, "step": 425, "valid_targets_mean": 1331.5, "valid_targets_min": 827 }, { "epoch": 0.45168067226890757, "grad_norm": 0.918938060661647, "learning_rate": 2.572713643178411e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.24578994512557983, "step": 430, "valid_targets_mean": 1381.7, "valid_targets_min": 686 }, { "epoch": 0.4569327731092437, "grad_norm": 0.8450512785959888, "learning_rate": 2.602698650674663e-05, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.25319570302963257, "step": 435, "valid_targets_mean": 1472.2, "valid_targets_min": 713 }, { "epoch": 0.46218487394957986, "grad_norm": 1.3247180796200522, "learning_rate": 2.632683658170915e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.4720996022224426, "step": 440, "valid_targets_mean": 2248.9, "valid_targets_min": 920 }, { "epoch": 0.46743697478991597, "grad_norm": 0.7756817606153216, "learning_rate": 2.6626686656671666e-05, "loss": 0.4381, "loss_nan_ranks": 0, "loss_rank_avg": 0.4191029667854309, "step": 445, "valid_targets_mean": 3664.4, "valid_targets_min": 746 }, { "epoch": 0.4726890756302521, "grad_norm": 0.8141822973818857, "learning_rate": 2.6926536731634184e-05, "loss": 0.4066, "loss_nan_ranks": 0, "loss_rank_avg": 0.42180395126342773, "step": 450, "valid_targets_mean": 3591.1, "valid_targets_min": 1635 }, { "epoch": 0.47794117647058826, "grad_norm": 0.6183205557943057, "learning_rate": 2.7226386806596705e-05, "loss": 0.399, "loss_nan_ranks": 0, "loss_rank_avg": 0.37809157371520996, "step": 455, "valid_targets_mean": 4172.7, "valid_targets_min": 777 }, { "epoch": 0.4831932773109244, "grad_norm": 0.6341645150900163, "learning_rate": 2.752623688155922e-05, "loss": 0.3807, "loss_nan_ranks": 0, "loss_rank_avg": 0.3980065882205963, "step": 460, "valid_targets_mean": 4040.2, "valid_targets_min": 2187 }, { "epoch": 0.4884453781512605, "grad_norm": 0.7232188026091549, "learning_rate": 2.782608695652174e-05, "loss": 0.3993, "loss_nan_ranks": 0, "loss_rank_avg": 0.39658811688423157, "step": 465, "valid_targets_mean": 3156.3, "valid_targets_min": 1432 }, { "epoch": 0.49369747899159666, "grad_norm": 0.5975850484936072, "learning_rate": 2.812593703148426e-05, "loss": 0.377, "loss_nan_ranks": 0, "loss_rank_avg": 0.35548049211502075, "step": 470, "valid_targets_mean": 3529.7, "valid_targets_min": 767 }, { "epoch": 0.4989495798319328, "grad_norm": 0.6544292649550012, "learning_rate": 2.8425787106446782e-05, "loss": 0.3589, "loss_nan_ranks": 0, "loss_rank_avg": 0.36396756768226624, "step": 475, "valid_targets_mean": 3485.6, "valid_targets_min": 1488 }, { "epoch": 0.5042016806722689, "grad_norm": 0.5784234889060588, "learning_rate": 2.8725637181409296e-05, "loss": 0.3769, "loss_nan_ranks": 0, "loss_rank_avg": 0.3580145239830017, "step": 480, "valid_targets_mean": 3707.0, "valid_targets_min": 578 }, { "epoch": 0.509453781512605, "grad_norm": 0.5809204879202081, "learning_rate": 2.9025487256371818e-05, "loss": 0.3991, "loss_nan_ranks": 0, "loss_rank_avg": 0.37097570300102234, "step": 485, "valid_targets_mean": 4252.4, "valid_targets_min": 1241 }, { "epoch": 0.5147058823529411, "grad_norm": 0.6518660166623274, "learning_rate": 2.9325337331334335e-05, "loss": 0.3791, "loss_nan_ranks": 0, "loss_rank_avg": 0.39846816658973694, "step": 490, "valid_targets_mean": 4029.2, "valid_targets_min": 807 }, { "epoch": 0.5199579831932774, "grad_norm": 0.5952710397208067, "learning_rate": 2.9625187406296856e-05, "loss": 0.3793, "loss_nan_ranks": 0, "loss_rank_avg": 0.34132808446884155, "step": 495, "valid_targets_mean": 4507.0, "valid_targets_min": 2011 }, { "epoch": 0.5252100840336135, "grad_norm": 0.5921750584078646, "learning_rate": 2.992503748125937e-05, "loss": 0.3773, "loss_nan_ranks": 0, "loss_rank_avg": 0.3380280137062073, "step": 500, "valid_targets_mean": 4268.2, "valid_targets_min": 1329 }, { "epoch": 0.5304621848739496, "grad_norm": 0.7847684848643338, "learning_rate": 3.022488755622189e-05, "loss": 0.3692, "loss_nan_ranks": 0, "loss_rank_avg": 0.3614731431007385, "step": 505, "valid_targets_mean": 3858.9, "valid_targets_min": 1366 }, { "epoch": 0.5357142857142857, "grad_norm": 0.6674187275757447, "learning_rate": 3.052473763118441e-05, "loss": 0.3796, "loss_nan_ranks": 0, "loss_rank_avg": 0.36018460988998413, "step": 510, "valid_targets_mean": 3169.1, "valid_targets_min": 1334 }, { "epoch": 0.5409663865546218, "grad_norm": 0.5809835935023818, "learning_rate": 3.0824587706146934e-05, "loss": 0.3895, "loss_nan_ranks": 0, "loss_rank_avg": 0.34386080503463745, "step": 515, "valid_targets_mean": 4130.4, "valid_targets_min": 1762 }, { "epoch": 0.5462184873949579, "grad_norm": 0.6856115085091843, "learning_rate": 3.112443778110945e-05, "loss": 0.3807, "loss_nan_ranks": 0, "loss_rank_avg": 0.3728490471839905, "step": 520, "valid_targets_mean": 3285.0, "valid_targets_min": 855 }, { "epoch": 0.5514705882352942, "grad_norm": 0.7152310015109019, "learning_rate": 3.142428785607197e-05, "loss": 0.3934, "loss_nan_ranks": 0, "loss_rank_avg": 0.3993592858314514, "step": 525, "valid_targets_mean": 3298.2, "valid_targets_min": 1269 }, { "epoch": 0.5567226890756303, "grad_norm": 0.7853116245952066, "learning_rate": 3.172413793103448e-05, "loss": 0.3929, "loss_nan_ranks": 0, "loss_rank_avg": 0.3852170705795288, "step": 530, "valid_targets_mean": 2740.4, "valid_targets_min": 1041 }, { "epoch": 0.5619747899159664, "grad_norm": 0.7253886613797418, "learning_rate": 3.2023988005997004e-05, "loss": 0.3777, "loss_nan_ranks": 0, "loss_rank_avg": 0.3952094614505768, "step": 535, "valid_targets_mean": 2995.1, "valid_targets_min": 1291 }, { "epoch": 0.5672268907563025, "grad_norm": 0.7947910205242297, "learning_rate": 3.2323838080959525e-05, "loss": 0.3671, "loss_nan_ranks": 0, "loss_rank_avg": 0.3840707540512085, "step": 540, "valid_targets_mean": 2811.6, "valid_targets_min": 1133 }, { "epoch": 0.5724789915966386, "grad_norm": 0.7101634109805368, "learning_rate": 3.262368815592204e-05, "loss": 0.3656, "loss_nan_ranks": 0, "loss_rank_avg": 0.3580155372619629, "step": 545, "valid_targets_mean": 3709.5, "valid_targets_min": 865 }, { "epoch": 0.5777310924369747, "grad_norm": 0.7401801947692503, "learning_rate": 3.292353823088456e-05, "loss": 0.3732, "loss_nan_ranks": 0, "loss_rank_avg": 0.37310606241226196, "step": 550, "valid_targets_mean": 2960.6, "valid_targets_min": 958 }, { "epoch": 0.582983193277311, "grad_norm": 0.6819266322867479, "learning_rate": 3.3223388305847075e-05, "loss": 0.3727, "loss_nan_ranks": 0, "loss_rank_avg": 0.376257061958313, "step": 555, "valid_targets_mean": 3189.2, "valid_targets_min": 771 }, { "epoch": 0.5882352941176471, "grad_norm": 0.5792785228231021, "learning_rate": 3.3523238380809596e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.3450887203216553, "step": 560, "valid_targets_mean": 3823.1, "valid_targets_min": 1631 }, { "epoch": 0.5934873949579832, "grad_norm": 0.706870647311464, "learning_rate": 3.382308845577212e-05, "loss": 0.3699, "loss_nan_ranks": 0, "loss_rank_avg": 0.33471646904945374, "step": 565, "valid_targets_mean": 2639.4, "valid_targets_min": 908 }, { "epoch": 0.5987394957983193, "grad_norm": 0.8079454260503596, "learning_rate": 3.412293853073464e-05, "loss": 0.3653, "loss_nan_ranks": 0, "loss_rank_avg": 0.39000123739242554, "step": 570, "valid_targets_mean": 2988.3, "valid_targets_min": 1264 }, { "epoch": 0.6039915966386554, "grad_norm": 0.6685925501276144, "learning_rate": 3.442278860569715e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.3652319312095642, "step": 575, "valid_targets_mean": 3563.1, "valid_targets_min": 1889 }, { "epoch": 0.6092436974789915, "grad_norm": 0.6271409370176393, "learning_rate": 3.4722638680659673e-05, "loss": 0.3594, "loss_nan_ranks": 0, "loss_rank_avg": 0.3371011018753052, "step": 580, "valid_targets_mean": 3737.9, "valid_targets_min": 1075 }, { "epoch": 0.6144957983193278, "grad_norm": 0.7635609780961795, "learning_rate": 3.5022488755622194e-05, "loss": 0.3644, "loss_nan_ranks": 0, "loss_rank_avg": 0.3491378426551819, "step": 585, "valid_targets_mean": 2745.8, "valid_targets_min": 1036 }, { "epoch": 0.6197478991596639, "grad_norm": 0.9486847263065615, "learning_rate": 3.5322338830584716e-05, "loss": 0.3682, "loss_nan_ranks": 0, "loss_rank_avg": 0.3554984927177429, "step": 590, "valid_targets_mean": 3516.4, "valid_targets_min": 1162 }, { "epoch": 0.625, "grad_norm": 0.6979971886991938, "learning_rate": 3.562218890554723e-05, "loss": 0.3604, "loss_nan_ranks": 0, "loss_rank_avg": 0.3572150468826294, "step": 595, "valid_targets_mean": 3279.4, "valid_targets_min": 1281 }, { "epoch": 0.6302521008403361, "grad_norm": 0.628571339160864, "learning_rate": 3.592203898050975e-05, "loss": 0.3601, "loss_nan_ranks": 0, "loss_rank_avg": 0.32577332854270935, "step": 600, "valid_targets_mean": 3180.4, "valid_targets_min": 1816 }, { "epoch": 0.6355042016806722, "grad_norm": 0.7162106687544288, "learning_rate": 3.6221889055472265e-05, "loss": 0.3733, "loss_nan_ranks": 0, "loss_rank_avg": 0.36203664541244507, "step": 605, "valid_targets_mean": 2939.2, "valid_targets_min": 1629 }, { "epoch": 0.6407563025210085, "grad_norm": 0.7531458122055458, "learning_rate": 3.6521739130434786e-05, "loss": 0.3618, "loss_nan_ranks": 0, "loss_rank_avg": 0.3718830943107605, "step": 610, "valid_targets_mean": 2755.7, "valid_targets_min": 1254 }, { "epoch": 0.6460084033613446, "grad_norm": 0.7043721880651528, "learning_rate": 3.68215892053973e-05, "loss": 0.3629, "loss_nan_ranks": 0, "loss_rank_avg": 0.3637351989746094, "step": 615, "valid_targets_mean": 3390.2, "valid_targets_min": 1973 }, { "epoch": 0.6512605042016807, "grad_norm": 0.7411003182380056, "learning_rate": 3.712143928035982e-05, "loss": 0.3638, "loss_nan_ranks": 0, "loss_rank_avg": 0.35509952902793884, "step": 620, "valid_targets_mean": 2960.4, "valid_targets_min": 1195 }, { "epoch": 0.6565126050420168, "grad_norm": 0.6916717573319705, "learning_rate": 3.742128935532234e-05, "loss": 0.3592, "loss_nan_ranks": 0, "loss_rank_avg": 0.37266242504119873, "step": 625, "valid_targets_mean": 3181.4, "valid_targets_min": 1244 }, { "epoch": 0.6617647058823529, "grad_norm": 0.6405799101681395, "learning_rate": 3.772113943028486e-05, "loss": 0.3642, "loss_nan_ranks": 0, "loss_rank_avg": 0.351756751537323, "step": 630, "valid_targets_mean": 3464.2, "valid_targets_min": 1421 }, { "epoch": 0.667016806722689, "grad_norm": 0.6665303943258725, "learning_rate": 3.802098950524738e-05, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.34305959939956665, "step": 635, "valid_targets_mean": 3443.1, "valid_targets_min": 1097 }, { "epoch": 0.6722689075630253, "grad_norm": 0.6963251575164391, "learning_rate": 3.83208395802099e-05, "loss": 0.349, "loss_nan_ranks": 0, "loss_rank_avg": 0.36686572432518005, "step": 640, "valid_targets_mean": 3891.4, "valid_targets_min": 1168 }, { "epoch": 0.6775210084033614, "grad_norm": 0.6447119132301098, "learning_rate": 3.862068965517242e-05, "loss": 0.3547, "loss_nan_ranks": 0, "loss_rank_avg": 0.35105079412460327, "step": 645, "valid_targets_mean": 3368.9, "valid_targets_min": 1700 }, { "epoch": 0.6827731092436975, "grad_norm": 0.775468044490351, "learning_rate": 3.8920539730134934e-05, "loss": 0.3561, "loss_nan_ranks": 0, "loss_rank_avg": 0.35495996475219727, "step": 650, "valid_targets_mean": 2497.1, "valid_targets_min": 1261 }, { "epoch": 0.6880252100840336, "grad_norm": 0.6998673088388078, "learning_rate": 3.9220389805097455e-05, "loss": 0.37, "loss_nan_ranks": 0, "loss_rank_avg": 0.373879611492157, "step": 655, "valid_targets_mean": 3391.2, "valid_targets_min": 1124 }, { "epoch": 0.6932773109243697, "grad_norm": 0.6911940333174383, "learning_rate": 3.9520239880059976e-05, "loss": 0.3604, "loss_nan_ranks": 0, "loss_rank_avg": 0.3743062913417816, "step": 660, "valid_targets_mean": 3003.8, "valid_targets_min": 1361 }, { "epoch": 0.6985294117647058, "grad_norm": 0.6312467853415549, "learning_rate": 3.982008995502249e-05, "loss": 0.3406, "loss_nan_ranks": 0, "loss_rank_avg": 0.3238492012023926, "step": 665, "valid_targets_mean": 3239.7, "valid_targets_min": 1679 }, { "epoch": 0.7037815126050421, "grad_norm": 0.6929968801305512, "learning_rate": 3.9999989022799437e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.374039888381958, "step": 670, "valid_targets_mean": 3101.2, "valid_targets_min": 1739 }, { "epoch": 0.7090336134453782, "grad_norm": 0.7069459947278421, "learning_rate": 3.9999865529431466e-05, "loss": 0.3481, "loss_nan_ranks": 0, "loss_rank_avg": 0.3492530584335327, "step": 675, "valid_targets_mean": 2844.4, "valid_targets_min": 1278 }, { "epoch": 0.7142857142857143, "grad_norm": 0.6222986155844251, "learning_rate": 3.9999604822044886e-05, "loss": 0.3406, "loss_nan_ranks": 0, "loss_rank_avg": 0.327778160572052, "step": 680, "valid_targets_mean": 3563.4, "valid_targets_min": 1522 }, { "epoch": 0.7195378151260504, "grad_norm": 0.6470886363287454, "learning_rate": 3.999920690242835e-05, "loss": 0.3288, "loss_nan_ranks": 0, "loss_rank_avg": 0.33931905031204224, "step": 685, "valid_targets_mean": 3589.0, "valid_targets_min": 464 }, { "epoch": 0.7247899159663865, "grad_norm": 0.5841030308921137, "learning_rate": 3.999867177331189e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.3474075198173523, "step": 690, "valid_targets_mean": 3827.1, "valid_targets_min": 1003 }, { "epoch": 0.7300420168067226, "grad_norm": 0.6944347153816217, "learning_rate": 3.9997999438366895e-05, "loss": 0.3424, "loss_nan_ranks": 0, "loss_rank_avg": 0.36091533303260803, "step": 695, "valid_targets_mean": 3042.1, "valid_targets_min": 1446 }, { "epoch": 0.7352941176470589, "grad_norm": 0.6583742822611474, "learning_rate": 3.9997189902206065e-05, "loss": 0.3494, "loss_nan_ranks": 0, "loss_rank_avg": 0.3591790199279785, "step": 700, "valid_targets_mean": 3257.8, "valid_targets_min": 1256 }, { "epoch": 0.740546218487395, "grad_norm": 0.6796220489697876, "learning_rate": 3.999624317038344e-05, "loss": 0.3623, "loss_nan_ranks": 0, "loss_rank_avg": 0.3584475815296173, "step": 705, "valid_targets_mean": 3858.5, "valid_targets_min": 1336 }, { "epoch": 0.7457983193277311, "grad_norm": 0.5779511153503359, "learning_rate": 3.9995159249394303e-05, "loss": 0.3632, "loss_nan_ranks": 0, "loss_rank_avg": 0.3402530550956726, "step": 710, "valid_targets_mean": 3821.1, "valid_targets_min": 1275 }, { "epoch": 0.7510504201680672, "grad_norm": 0.6920943343973615, "learning_rate": 3.999393814667517e-05, "loss": 0.3394, "loss_nan_ranks": 0, "loss_rank_avg": 0.35493505001068115, "step": 715, "valid_targets_mean": 2914.6, "valid_targets_min": 644 }, { "epoch": 0.7563025210084033, "grad_norm": 0.6484863168026516, "learning_rate": 3.9992579870603695e-05, "loss": 0.336, "loss_nan_ranks": 0, "loss_rank_avg": 0.3329768478870392, "step": 720, "valid_targets_mean": 3083.4, "valid_targets_min": 1397 }, { "epoch": 0.7615546218487395, "grad_norm": 0.7459309224625077, "learning_rate": 3.999108443049869e-05, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.35886648297309875, "step": 725, "valid_targets_mean": 2747.4, "valid_targets_min": 1557 }, { "epoch": 0.7668067226890757, "grad_norm": 0.6643965239188359, "learning_rate": 3.998945183661997e-05, "loss": 0.3442, "loss_nan_ranks": 0, "loss_rank_avg": 0.3370826840400696, "step": 730, "valid_targets_mean": 3405.2, "valid_targets_min": 1405 }, { "epoch": 0.7720588235294118, "grad_norm": 0.6311941065520537, "learning_rate": 3.9987682100168376e-05, "loss": 0.3432, "loss_nan_ranks": 0, "loss_rank_avg": 0.32585620880126953, "step": 735, "valid_targets_mean": 3507.1, "valid_targets_min": 1042 }, { "epoch": 0.7773109243697479, "grad_norm": 0.6934056789740213, "learning_rate": 3.99857752332856e-05, "loss": 0.3318, "loss_nan_ranks": 0, "loss_rank_avg": 0.3426210284233093, "step": 740, "valid_targets_mean": 3079.7, "valid_targets_min": 858 }, { "epoch": 0.782563025210084, "grad_norm": 0.6683294329205226, "learning_rate": 3.998373124905418e-05, "loss": 0.3404, "loss_nan_ranks": 0, "loss_rank_avg": 0.3405384421348572, "step": 745, "valid_targets_mean": 2934.3, "valid_targets_min": 1288 }, { "epoch": 0.7878151260504201, "grad_norm": 0.6089870902503931, "learning_rate": 3.9981550161497375e-05, "loss": 0.36, "loss_nan_ranks": 0, "loss_rank_avg": 0.3385617136955261, "step": 750, "valid_targets_mean": 3428.2, "valid_targets_min": 1915 }, { "epoch": 0.7930672268907563, "grad_norm": 0.6028162675947055, "learning_rate": 3.9979231985579074e-05, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.3657104969024658, "step": 755, "valid_targets_mean": 3764.9, "valid_targets_min": 1244 }, { "epoch": 0.7983193277310925, "grad_norm": 0.7017817313652911, "learning_rate": 3.99767767372037e-05, "loss": 0.3304, "loss_nan_ranks": 0, "loss_rank_avg": 0.33708494901657104, "step": 760, "valid_targets_mean": 3006.5, "valid_targets_min": 1255 }, { "epoch": 0.8035714285714286, "grad_norm": 0.6788931537841902, "learning_rate": 3.997418443321609e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.3829076290130615, "step": 765, "valid_targets_mean": 3326.2, "valid_targets_min": 1586 }, { "epoch": 0.8088235294117647, "grad_norm": 0.6396470227937194, "learning_rate": 3.997145509140138e-05, "loss": 0.3451, "loss_nan_ranks": 0, "loss_rank_avg": 0.3249973654747009, "step": 770, "valid_targets_mean": 3205.2, "valid_targets_min": 1181 }, { "epoch": 0.8140756302521008, "grad_norm": 0.6959358945807129, "learning_rate": 3.9968588730484896e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.35094955563545227, "step": 775, "valid_targets_mean": 2735.1, "valid_targets_min": 974 }, { "epoch": 0.819327731092437, "grad_norm": 0.7121078872001974, "learning_rate": 3.9965585370132013e-05, "loss": 0.3355, "loss_nan_ranks": 0, "loss_rank_avg": 0.3337578773498535, "step": 780, "valid_targets_mean": 3735.8, "valid_targets_min": 1681 }, { "epoch": 0.8245798319327731, "grad_norm": 0.731579949310607, "learning_rate": 3.996244503094804e-05, "loss": 0.3497, "loss_nan_ranks": 0, "loss_rank_avg": 0.37752842903137207, "step": 785, "valid_targets_mean": 2883.7, "valid_targets_min": 1171 }, { "epoch": 0.8298319327731093, "grad_norm": 0.6650190290860145, "learning_rate": 3.995916773447804e-05, "loss": 0.3574, "loss_nan_ranks": 0, "loss_rank_avg": 0.3751668930053711, "step": 790, "valid_targets_mean": 3324.1, "valid_targets_min": 1455 }, { "epoch": 0.8350840336134454, "grad_norm": 0.6084187992006697, "learning_rate": 3.995575350320671e-05, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.3428555428981781, "step": 795, "valid_targets_mean": 3948.6, "valid_targets_min": 1529 }, { "epoch": 0.8403361344537815, "grad_norm": 0.6734592462466594, "learning_rate": 3.995220236055824e-05, "loss": 0.3662, "loss_nan_ranks": 0, "loss_rank_avg": 0.36074283719062805, "step": 800, "valid_targets_mean": 3419.9, "valid_targets_min": 1450 }, { "epoch": 0.8455882352941176, "grad_norm": 0.5774931076226504, "learning_rate": 3.99485143308961e-05, "loss": 0.3351, "loss_nan_ranks": 0, "loss_rank_avg": 0.3051412105560303, "step": 805, "valid_targets_mean": 3465.6, "valid_targets_min": 1431 }, { "epoch": 0.8508403361344538, "grad_norm": 0.8400200119736569, "learning_rate": 3.994468943952296e-05, "loss": 0.3546, "loss_nan_ranks": 0, "loss_rank_avg": 0.35333842039108276, "step": 810, "valid_targets_mean": 3085.4, "valid_targets_min": 802 }, { "epoch": 0.8560924369747899, "grad_norm": 0.6336110237839332, "learning_rate": 3.994072771268041e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.347425639629364, "step": 815, "valid_targets_mean": 3230.6, "valid_targets_min": 1433 }, { "epoch": 0.8613445378151261, "grad_norm": 0.6958422384825939, "learning_rate": 3.993662917754885e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.35881751775741577, "step": 820, "valid_targets_mean": 2908.7, "valid_targets_min": 614 }, { "epoch": 0.8665966386554622, "grad_norm": 0.7411583695170622, "learning_rate": 3.993239386224732e-05, "loss": 0.3536, "loss_nan_ranks": 0, "loss_rank_avg": 0.3721003532409668, "step": 825, "valid_targets_mean": 2748.8, "valid_targets_min": 637 }, { "epoch": 0.8718487394957983, "grad_norm": 0.63511436606181, "learning_rate": 3.992802179583322e-05, "loss": 0.3513, "loss_nan_ranks": 0, "loss_rank_avg": 0.3608887195587158, "step": 830, "valid_targets_mean": 3297.7, "valid_targets_min": 1683 }, { "epoch": 0.8771008403361344, "grad_norm": 0.6522816701659483, "learning_rate": 3.9923513008302204e-05, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.32889869809150696, "step": 835, "valid_targets_mean": 3406.1, "valid_targets_min": 1913 }, { "epoch": 0.8823529411764706, "grad_norm": 0.5886512960386365, "learning_rate": 3.991886753058792e-05, "loss": 0.3322, "loss_nan_ranks": 0, "loss_rank_avg": 0.32120782136917114, "step": 840, "valid_targets_mean": 3848.1, "valid_targets_min": 1659 }, { "epoch": 0.8876050420168067, "grad_norm": 0.6037677731592493, "learning_rate": 3.991408539456182e-05, "loss": 0.3476, "loss_nan_ranks": 0, "loss_rank_avg": 0.31538859009742737, "step": 845, "valid_targets_mean": 3390.7, "valid_targets_min": 1390 }, { "epoch": 0.8928571428571429, "grad_norm": 0.7282746261851238, "learning_rate": 3.990916663303293e-05, "loss": 0.351, "loss_nan_ranks": 0, "loss_rank_avg": 0.4035952389240265, "step": 850, "valid_targets_mean": 3338.5, "valid_targets_min": 611 }, { "epoch": 0.898109243697479, "grad_norm": 0.8755920451444243, "learning_rate": 3.990411127974762e-05, "loss": 0.3411, "loss_nan_ranks": 0, "loss_rank_avg": 0.3417074978351593, "step": 855, "valid_targets_mean": 3389.6, "valid_targets_min": 1451 }, { "epoch": 0.9033613445378151, "grad_norm": 0.6595337996347566, "learning_rate": 3.989891936938939e-05, "loss": 0.349, "loss_nan_ranks": 0, "loss_rank_avg": 0.31698334217071533, "step": 860, "valid_targets_mean": 3097.9, "valid_targets_min": 1459 }, { "epoch": 0.9086134453781513, "grad_norm": 0.7205543746187569, "learning_rate": 3.9893590937578634e-05, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.37621456384658813, "step": 865, "valid_targets_mean": 2619.4, "valid_targets_min": 999 }, { "epoch": 0.9138655462184874, "grad_norm": 0.5683063041911645, "learning_rate": 3.9888126020872375e-05, "loss": 0.3317, "loss_nan_ranks": 0, "loss_rank_avg": 0.31596362590789795, "step": 870, "valid_targets_mean": 3791.2, "valid_targets_min": 1564 }, { "epoch": 0.9191176470588235, "grad_norm": 1.070844790253151, "learning_rate": 3.988252465676401e-05, "loss": 0.3364, "loss_nan_ranks": 0, "loss_rank_avg": 0.33733999729156494, "step": 875, "valid_targets_mean": 3223.3, "valid_targets_min": 1233 }, { "epoch": 0.9243697478991597, "grad_norm": 0.637333593228743, "learning_rate": 3.98767868836831e-05, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.3216400146484375, "step": 880, "valid_targets_mean": 3439.2, "valid_targets_min": 1524 }, { "epoch": 0.9296218487394958, "grad_norm": 0.5754820914455384, "learning_rate": 3.987091274099504e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.3149118423461914, "step": 885, "valid_targets_mean": 3744.9, "valid_targets_min": 1375 }, { "epoch": 0.9348739495798319, "grad_norm": 0.6651917315458717, "learning_rate": 3.986490226900084e-05, "loss": 0.3368, "loss_nan_ranks": 0, "loss_rank_avg": 0.3212442398071289, "step": 890, "valid_targets_mean": 3036.2, "valid_targets_min": 906 }, { "epoch": 0.9401260504201681, "grad_norm": 0.6067258438956236, "learning_rate": 3.985875550893684e-05, "loss": 0.3232, "loss_nan_ranks": 0, "loss_rank_avg": 0.30532318353652954, "step": 895, "valid_targets_mean": 3766.5, "valid_targets_min": 1246 }, { "epoch": 0.9453781512605042, "grad_norm": 0.6702408814712129, "learning_rate": 3.9852472502974386e-05, "loss": 0.3288, "loss_nan_ranks": 0, "loss_rank_avg": 0.3562542498111725, "step": 900, "valid_targets_mean": 3225.9, "valid_targets_min": 1333 }, { "epoch": 0.9506302521008403, "grad_norm": 0.5790810375186305, "learning_rate": 3.984605329421961e-05, "loss": 0.3279, "loss_nan_ranks": 0, "loss_rank_avg": 0.32805150747299194, "step": 905, "valid_targets_mean": 3751.3, "valid_targets_min": 2264 }, { "epoch": 0.9558823529411765, "grad_norm": 0.5978703507597435, "learning_rate": 3.983949792671307e-05, "loss": 0.3481, "loss_nan_ranks": 0, "loss_rank_avg": 0.347832053899765, "step": 910, "valid_targets_mean": 3505.2, "valid_targets_min": 1454 }, { "epoch": 0.9611344537815126, "grad_norm": 0.624321623961909, "learning_rate": 3.9832806445429486e-05, "loss": 0.3425, "loss_nan_ranks": 0, "loss_rank_avg": 0.3324778378009796, "step": 915, "valid_targets_mean": 3385.7, "valid_targets_min": 1430 }, { "epoch": 0.9663865546218487, "grad_norm": 0.6245540796780895, "learning_rate": 3.982597889627742e-05, "loss": 0.3348, "loss_nan_ranks": 0, "loss_rank_avg": 0.317277729511261, "step": 920, "valid_targets_mean": 3201.6, "valid_targets_min": 1433 }, { "epoch": 0.9716386554621849, "grad_norm": 0.6175278753890704, "learning_rate": 3.981901532609896e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.32414883375167847, "step": 925, "valid_targets_mean": 3362.1, "valid_targets_min": 1512 }, { "epoch": 0.976890756302521, "grad_norm": 0.6165488317026186, "learning_rate": 3.9811915782669406e-05, "loss": 0.3298, "loss_nan_ranks": 0, "loss_rank_avg": 0.31244921684265137, "step": 930, "valid_targets_mean": 3643.9, "valid_targets_min": 2048 }, { "epoch": 0.9821428571428571, "grad_norm": 0.6227928286121143, "learning_rate": 3.980468031469691e-05, "loss": 0.3463, "loss_nan_ranks": 0, "loss_rank_avg": 0.3477458953857422, "step": 935, "valid_targets_mean": 3107.1, "valid_targets_min": 815 }, { "epoch": 0.9873949579831933, "grad_norm": 0.6175153136159267, "learning_rate": 3.9797308971822206e-05, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.3596673607826233, "step": 940, "valid_targets_mean": 3339.4, "valid_targets_min": 1878 }, { "epoch": 0.9926470588235294, "grad_norm": 0.6173093585223963, "learning_rate": 3.978980180461821e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.33542400598526, "step": 945, "valid_targets_mean": 3394.6, "valid_targets_min": 1727 }, { "epoch": 0.9978991596638656, "grad_norm": 0.6354828168457491, "learning_rate": 3.9782158864589696e-05, "loss": 0.3261, "loss_nan_ranks": 0, "loss_rank_avg": 0.3046625554561615, "step": 950, "valid_targets_mean": 2924.3, "valid_targets_min": 1622 }, { "epoch": 1.0031512605042017, "grad_norm": 1.3016888810382736, "learning_rate": 3.977438020417293e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.2962370216846466, "step": 955, "valid_targets_mean": 1587.9, "valid_targets_min": 788 }, { "epoch": 1.0084033613445378, "grad_norm": 1.178432388446946, "learning_rate": 3.9766465876735354e-05, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.23576419055461884, "step": 960, "valid_targets_mean": 1591.2, "valid_targets_min": 957 }, { "epoch": 1.013655462184874, "grad_norm": 0.9417299138332059, "learning_rate": 3.9758415936575155e-05, "loss": 0.2443, "loss_nan_ranks": 0, "loss_rank_avg": 0.23771171271800995, "step": 965, "valid_targets_mean": 1418.7, "valid_targets_min": 796 }, { "epoch": 1.01890756302521, "grad_norm": 0.9391474883661355, "learning_rate": 3.975023043892094e-05, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.23540674149990082, "step": 970, "valid_targets_mean": 1389.0, "valid_targets_min": 704 }, { "epoch": 1.0241596638655461, "grad_norm": 0.8489834118982603, "learning_rate": 3.974190943993133e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.221901997923851, "step": 975, "valid_targets_mean": 1513.9, "valid_targets_min": 638 }, { "epoch": 1.0294117647058822, "grad_norm": 0.830262362849459, "learning_rate": 3.973345299669461e-05, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.23195049166679382, "step": 980, "valid_targets_mean": 1482.3, "valid_targets_min": 727 }, { "epoch": 1.0346638655462186, "grad_norm": 0.8915461834880904, "learning_rate": 3.972486116722828e-05, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.208994060754776, "step": 985, "valid_targets_mean": 1189.1, "valid_targets_min": 655 }, { "epoch": 1.0399159663865547, "grad_norm": 0.9988345647892146, "learning_rate": 3.971613401047872e-05, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2332269549369812, "step": 990, "valid_targets_mean": 1299.6, "valid_targets_min": 714 }, { "epoch": 1.0451680672268908, "grad_norm": 0.8523206270419763, "learning_rate": 3.970727158632075e-05, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.23563072085380554, "step": 995, "valid_targets_mean": 1407.6, "valid_targets_min": 741 }, { "epoch": 1.050420168067227, "grad_norm": 1.0576241067376564, "learning_rate": 3.969827395555721e-05, "loss": 0.235, "loss_nan_ranks": 0, "loss_rank_avg": 0.2590252757072449, "step": 1000, "valid_targets_mean": 1544.1, "valid_targets_min": 663 }, { "epoch": 1.055672268907563, "grad_norm": 1.1458471492556306, "learning_rate": 3.968914117991857e-05, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.230397567152977, "step": 1005, "valid_targets_mean": 1511.1, "valid_targets_min": 632 }, { "epoch": 1.0609243697478992, "grad_norm": 0.9006777040659446, "learning_rate": 3.967987332206249e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.2451692819595337, "step": 1010, "valid_targets_mean": 1638.0, "valid_targets_min": 933 }, { "epoch": 1.0661764705882353, "grad_norm": 0.7626623690643839, "learning_rate": 3.967047044557341e-05, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.22060266137123108, "step": 1015, "valid_targets_mean": 1526.9, "valid_targets_min": 717 }, { "epoch": 1.0714285714285714, "grad_norm": 0.8215685697177867, "learning_rate": 3.966093261496208e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.2275817096233368, "step": 1020, "valid_targets_mean": 1387.4, "valid_targets_min": 659 }, { "epoch": 1.0766806722689075, "grad_norm": 0.8698242331020952, "learning_rate": 3.9651259895665146e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.2096673548221588, "step": 1025, "valid_targets_mean": 1382.9, "valid_targets_min": 642 }, { "epoch": 1.0819327731092436, "grad_norm": 0.768616027752401, "learning_rate": 3.9641452354044687e-05, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.20485013723373413, "step": 1030, "valid_targets_mean": 1312.1, "valid_targets_min": 765 }, { "epoch": 1.0871848739495797, "grad_norm": 0.8590772693317404, "learning_rate": 3.9631510057387765e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.24823632836341858, "step": 1035, "valid_targets_mean": 1397.6, "valid_targets_min": 631 }, { "epoch": 1.092436974789916, "grad_norm": 0.9234663166300711, "learning_rate": 3.962143307390596e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.2525438666343689, "step": 1040, "valid_targets_mean": 1419.4, "valid_targets_min": 623 }, { "epoch": 1.0976890756302522, "grad_norm": 0.7428187089700554, "learning_rate": 3.961122147273491e-05, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.24657368659973145, "step": 1045, "valid_targets_mean": 1647.7, "valid_targets_min": 818 }, { "epoch": 1.1029411764705883, "grad_norm": 0.7835107757413885, "learning_rate": 3.9600875323933826e-05, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.21424023807048798, "step": 1050, "valid_targets_mean": 1545.5, "valid_targets_min": 776 }, { "epoch": 1.1081932773109244, "grad_norm": 0.8623930769993505, "learning_rate": 3.959039469848502e-05, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.2390882670879364, "step": 1055, "valid_targets_mean": 1411.8, "valid_targets_min": 623 }, { "epoch": 1.1134453781512605, "grad_norm": 0.8342187952076956, "learning_rate": 3.9579779668293416e-05, "loss": 0.2341, "loss_nan_ranks": 0, "loss_rank_avg": 0.24478605389595032, "step": 1060, "valid_targets_mean": 1437.3, "valid_targets_min": 742 }, { "epoch": 1.1186974789915967, "grad_norm": 0.8716802159762432, "learning_rate": 3.956903030618605e-05, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.21243079006671906, "step": 1065, "valid_targets_mean": 1193.6, "valid_targets_min": 611 }, { "epoch": 1.1239495798319328, "grad_norm": 0.8276094439043256, "learning_rate": 3.955814668591156e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2292919009923935, "step": 1070, "valid_targets_mean": 1514.0, "valid_targets_min": 793 }, { "epoch": 1.129201680672269, "grad_norm": 0.8269530258415205, "learning_rate": 3.9547128882139735e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.2063109278678894, "step": 1075, "valid_targets_mean": 1379.1, "valid_targets_min": 886 }, { "epoch": 1.134453781512605, "grad_norm": 0.7349504784818733, "learning_rate": 3.9535976970460925e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.2086534947156906, "step": 1080, "valid_targets_mean": 1455.5, "valid_targets_min": 991 }, { "epoch": 1.1397058823529411, "grad_norm": 0.7910940364262357, "learning_rate": 3.9524691027385585e-05, "loss": 0.2244, "loss_nan_ranks": 0, "loss_rank_avg": 0.22840695083141327, "step": 1085, "valid_targets_mean": 1525.2, "valid_targets_min": 908 }, { "epoch": 1.1449579831932772, "grad_norm": 0.9125068091813882, "learning_rate": 3.95132711303437e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.23359861969947815, "step": 1090, "valid_targets_mean": 1476.6, "valid_targets_min": 680 }, { "epoch": 1.1502100840336134, "grad_norm": 0.7517080972876787, "learning_rate": 3.9501717357684315e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.22301185131072998, "step": 1095, "valid_targets_mean": 1467.1, "valid_targets_min": 803 }, { "epoch": 1.1554621848739495, "grad_norm": 0.8187151581180054, "learning_rate": 3.9490029788674934e-05, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.22149021923542023, "step": 1100, "valid_targets_mean": 1341.3, "valid_targets_min": 765 }, { "epoch": 1.1607142857142858, "grad_norm": 0.7811554150228613, "learning_rate": 3.9478208503501e-05, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.23048382997512817, "step": 1105, "valid_targets_mean": 1556.4, "valid_targets_min": 804 }, { "epoch": 1.165966386554622, "grad_norm": 0.8232786153715305, "learning_rate": 3.946625358326538e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.24594677984714508, "step": 1110, "valid_targets_mean": 1509.7, "valid_targets_min": 675 }, { "epoch": 1.171218487394958, "grad_norm": 0.7583404192175697, "learning_rate": 3.945416510998775e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.229123055934906, "step": 1115, "valid_targets_mean": 1408.4, "valid_targets_min": 882 }, { "epoch": 1.1764705882352942, "grad_norm": 0.7798738937206717, "learning_rate": 3.944194316660406e-05, "loss": 0.216, "loss_nan_ranks": 0, "loss_rank_avg": 0.20927229523658752, "step": 1120, "valid_targets_mean": 1449.8, "valid_targets_min": 660 }, { "epoch": 1.1817226890756303, "grad_norm": 0.7782369720225292, "learning_rate": 3.942958783696598e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.21136952936649323, "step": 1125, "valid_targets_mean": 1489.8, "valid_targets_min": 678 }, { "epoch": 1.1869747899159664, "grad_norm": 0.8389164365291358, "learning_rate": 3.94170992058403e-05, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.2247747778892517, "step": 1130, "valid_targets_mean": 1379.1, "valid_targets_min": 676 }, { "epoch": 1.1922268907563025, "grad_norm": 0.85218432627087, "learning_rate": 3.9404477358908354e-05, "loss": 0.2185, "loss_nan_ranks": 0, "loss_rank_avg": 0.20599870383739471, "step": 1135, "valid_targets_mean": 1347.1, "valid_targets_min": 794 }, { "epoch": 1.1974789915966386, "grad_norm": 0.7736857874589698, "learning_rate": 3.9391722382765445e-05, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.2081984579563141, "step": 1140, "valid_targets_mean": 1372.6, "valid_targets_min": 607 }, { "epoch": 1.2027310924369747, "grad_norm": 0.8143324846381077, "learning_rate": 3.937883436492025e-05, "loss": 0.2181, "loss_nan_ranks": 0, "loss_rank_avg": 0.210773304104805, "step": 1145, "valid_targets_mean": 1323.6, "valid_targets_min": 722 }, { "epoch": 1.2079831932773109, "grad_norm": 0.8168389117740881, "learning_rate": 3.9365813393794186e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.2400819957256317, "step": 1150, "valid_targets_mean": 1597.7, "valid_targets_min": 858 }, { "epoch": 1.213235294117647, "grad_norm": 0.798484953443434, "learning_rate": 3.9352659558720836e-05, "loss": 0.2018, "loss_nan_ranks": 0, "loss_rank_avg": 0.19974064826965332, "step": 1155, "valid_targets_mean": 1270.8, "valid_targets_min": 689 }, { "epoch": 1.2184873949579833, "grad_norm": 0.7597271913919195, "learning_rate": 3.933937294994535e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.22933819890022278, "step": 1160, "valid_targets_mean": 1388.2, "valid_targets_min": 692 }, { "epoch": 1.2237394957983194, "grad_norm": 0.7412896199433119, "learning_rate": 3.932595365862379e-05, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.2073134481906891, "step": 1165, "valid_targets_mean": 1447.2, "valid_targets_min": 828 }, { "epoch": 1.2289915966386555, "grad_norm": 0.8029587259024663, "learning_rate": 3.9312401776822504e-05, "loss": 0.235, "loss_nan_ranks": 0, "loss_rank_avg": 0.22155123949050903, "step": 1170, "valid_targets_mean": 1399.7, "valid_targets_min": 618 }, { "epoch": 1.2342436974789917, "grad_norm": 0.753092266372571, "learning_rate": 3.9298717397517546e-05, "loss": 0.2104, "loss_nan_ranks": 0, "loss_rank_avg": 0.20688486099243164, "step": 1175, "valid_targets_mean": 1454.3, "valid_targets_min": 629 }, { "epoch": 1.2394957983193278, "grad_norm": 0.7552069088401491, "learning_rate": 3.928490061459396e-05, "loss": 0.2193, "loss_nan_ranks": 0, "loss_rank_avg": 0.2513880133628845, "step": 1180, "valid_targets_mean": 1746.1, "valid_targets_min": 1071 }, { "epoch": 1.2447478991596639, "grad_norm": 0.7724105286503384, "learning_rate": 3.927095152284521e-05, "loss": 0.2215, "loss_nan_ranks": 0, "loss_rank_avg": 0.2342674434185028, "step": 1185, "valid_targets_mean": 1282.2, "valid_targets_min": 677 }, { "epoch": 1.25, "grad_norm": 0.8255573649270425, "learning_rate": 3.925687021797249e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.19916367530822754, "step": 1190, "valid_targets_mean": 1227.6, "valid_targets_min": 679 }, { "epoch": 1.2552521008403361, "grad_norm": 0.7348173616246707, "learning_rate": 3.924265679658407e-05, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.20118603110313416, "step": 1195, "valid_targets_mean": 1319.1, "valid_targets_min": 504 }, { "epoch": 1.2605042016806722, "grad_norm": 0.7536987070404887, "learning_rate": 3.922831135619462e-05, "loss": 0.2161, "loss_nan_ranks": 0, "loss_rank_avg": 0.20859253406524658, "step": 1200, "valid_targets_mean": 1616.5, "valid_targets_min": 1023 }, { "epoch": 1.2657563025210083, "grad_norm": 0.7577745081343713, "learning_rate": 3.9213833995224605e-05, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.2004815638065338, "step": 1205, "valid_targets_mean": 1453.0, "valid_targets_min": 661 }, { "epoch": 1.2710084033613445, "grad_norm": 0.7784879343054987, "learning_rate": 3.919922481299952e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.21279674768447876, "step": 1210, "valid_targets_mean": 1442.0, "valid_targets_min": 889 }, { "epoch": 1.2762605042016806, "grad_norm": 0.7318237431101263, "learning_rate": 3.918448390974928e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.20114900171756744, "step": 1215, "valid_targets_mean": 1548.4, "valid_targets_min": 723 }, { "epoch": 1.2815126050420167, "grad_norm": 0.8439347277266402, "learning_rate": 3.9169611386607476e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.20195883512496948, "step": 1220, "valid_targets_mean": 1359.8, "valid_targets_min": 793 }, { "epoch": 1.2867647058823528, "grad_norm": 0.7840655198861911, "learning_rate": 3.9154607345610746e-05, "loss": 0.2145, "loss_nan_ranks": 0, "loss_rank_avg": 0.22591176629066467, "step": 1225, "valid_targets_mean": 1478.6, "valid_targets_min": 861 }, { "epoch": 1.2920168067226891, "grad_norm": 0.7776629349610283, "learning_rate": 3.913947188969801e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.19768911600112915, "step": 1230, "valid_targets_mean": 1332.7, "valid_targets_min": 752 }, { "epoch": 1.2972689075630253, "grad_norm": 0.7729134790563235, "learning_rate": 3.912420512270981e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.2305484265089035, "step": 1235, "valid_targets_mean": 1622.7, "valid_targets_min": 789 }, { "epoch": 1.3025210084033614, "grad_norm": 0.8616431181942282, "learning_rate": 3.910880714938757e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.1932060420513153, "step": 1240, "valid_targets_mean": 1195.4, "valid_targets_min": 567 }, { "epoch": 1.3077731092436975, "grad_norm": 0.7695069319629071, "learning_rate": 3.909327807537288e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.232661634683609, "step": 1245, "valid_targets_mean": 1504.5, "valid_targets_min": 605 }, { "epoch": 1.3130252100840336, "grad_norm": 0.7113969327868939, "learning_rate": 3.90776180072068e-05, "loss": 0.2116, "loss_nan_ranks": 0, "loss_rank_avg": 0.20750564336776733, "step": 1250, "valid_targets_mean": 1580.1, "valid_targets_min": 746 }, { "epoch": 1.3182773109243697, "grad_norm": 0.7945153800878063, "learning_rate": 3.906182705232909e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.20195449888706207, "step": 1255, "valid_targets_mean": 1158.2, "valid_targets_min": 723 }, { "epoch": 1.3235294117647058, "grad_norm": 0.7587646804913716, "learning_rate": 3.904590531907751e-05, "loss": 0.2159, "loss_nan_ranks": 0, "loss_rank_avg": 0.21249453723430634, "step": 1260, "valid_targets_mean": 1430.4, "valid_targets_min": 855 }, { "epoch": 1.328781512605042, "grad_norm": 0.7185755186164045, "learning_rate": 3.9029852916687034e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.2006302922964096, "step": 1265, "valid_targets_mean": 1590.4, "valid_targets_min": 902 }, { "epoch": 1.334033613445378, "grad_norm": 0.7257232800212272, "learning_rate": 3.9013669955289136e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.20573708415031433, "step": 1270, "valid_targets_mean": 1521.5, "valid_targets_min": 803 }, { "epoch": 1.3392857142857144, "grad_norm": 0.7974748283202712, "learning_rate": 3.899735654591101e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.22591374814510345, "step": 1275, "valid_targets_mean": 1455.2, "valid_targets_min": 740 }, { "epoch": 1.3445378151260505, "grad_norm": 0.8433766016494005, "learning_rate": 3.898091280047486e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.20434291660785675, "step": 1280, "valid_targets_mean": 1279.4, "valid_targets_min": 244 }, { "epoch": 1.3497899159663866, "grad_norm": 0.7810238280537369, "learning_rate": 3.896433883179703e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.22051532566547394, "step": 1285, "valid_targets_mean": 1366.9, "valid_targets_min": 714 }, { "epoch": 1.3550420168067228, "grad_norm": 0.9021667080271751, "learning_rate": 3.894763475358736e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.19154158234596252, "step": 1290, "valid_targets_mean": 1220.5, "valid_targets_min": 585 }, { "epoch": 1.3602941176470589, "grad_norm": 0.8197315751887221, "learning_rate": 3.8930800680448275e-05, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.230904221534729, "step": 1295, "valid_targets_mean": 1596.4, "valid_targets_min": 1041 }, { "epoch": 1.365546218487395, "grad_norm": 0.7275089472098615, "learning_rate": 3.891383672787411e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.20911553502082825, "step": 1300, "valid_targets_mean": 1401.3, "valid_targets_min": 777 }, { "epoch": 1.370798319327731, "grad_norm": 0.7376318715306975, "learning_rate": 3.889674301225025e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.19725364446640015, "step": 1305, "valid_targets_mean": 1546.8, "valid_targets_min": 959 }, { "epoch": 1.3760504201680672, "grad_norm": 0.7408476899885955, "learning_rate": 3.8879519650852356e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.18753978610038757, "step": 1310, "valid_targets_mean": 1284.4, "valid_targets_min": 620 }, { "epoch": 1.3813025210084033, "grad_norm": 0.7266684151521309, "learning_rate": 3.886216676184555e-05, "loss": 0.214, "loss_nan_ranks": 0, "loss_rank_avg": 0.20051538944244385, "step": 1315, "valid_targets_mean": 1356.6, "valid_targets_min": 656 }, { "epoch": 1.3865546218487395, "grad_norm": 0.7791953600527686, "learning_rate": 3.8844684464283614e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.23191730678081512, "step": 1320, "valid_targets_mean": 1564.5, "valid_targets_min": 697 }, { "epoch": 1.3918067226890756, "grad_norm": 0.6803022151794903, "learning_rate": 3.882707287810817e-05, "loss": 0.2039, "loss_nan_ranks": 0, "loss_rank_avg": 0.20292726159095764, "step": 1325, "valid_targets_mean": 1604.7, "valid_targets_min": 682 }, { "epoch": 1.3970588235294117, "grad_norm": 0.7109648477839206, "learning_rate": 3.880933212414786e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.19687709212303162, "step": 1330, "valid_targets_mean": 1383.4, "valid_targets_min": 730 }, { "epoch": 1.4023109243697478, "grad_norm": 0.7636435446308724, "learning_rate": 3.87914623241175e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.19838300347328186, "step": 1335, "valid_targets_mean": 1482.5, "valid_targets_min": 747 }, { "epoch": 1.407563025210084, "grad_norm": 0.7790600366170161, "learning_rate": 3.877346360061728e-05, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.20176908373832703, "step": 1340, "valid_targets_mean": 1603.6, "valid_targets_min": 933 }, { "epoch": 1.41281512605042, "grad_norm": 0.7307120382472138, "learning_rate": 3.8755336077131894e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.19978278875350952, "step": 1345, "valid_targets_mean": 1517.9, "valid_targets_min": 799 }, { "epoch": 1.4180672268907564, "grad_norm": 0.7009558460825884, "learning_rate": 3.873707987802967e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.20674484968185425, "step": 1350, "valid_targets_mean": 1516.2, "valid_targets_min": 909 }, { "epoch": 1.4233193277310925, "grad_norm": 0.6935543353633367, "learning_rate": 3.871869512856179e-05, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.19707924127578735, "step": 1355, "valid_targets_mean": 1606.8, "valid_targets_min": 741 }, { "epoch": 1.4285714285714286, "grad_norm": 0.7721082945840706, "learning_rate": 3.870018195486138e-05, "loss": 0.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.20531484484672546, "step": 1360, "valid_targets_mean": 1328.7, "valid_targets_min": 720 }, { "epoch": 1.4338235294117647, "grad_norm": 0.7736104466743927, "learning_rate": 3.868154048394262e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.201510488986969, "step": 1365, "valid_targets_mean": 1396.2, "valid_targets_min": 610 }, { "epoch": 1.4390756302521008, "grad_norm": 0.7550538776229306, "learning_rate": 3.8662770843699944e-05, "loss": 0.204, "loss_nan_ranks": 0, "loss_rank_avg": 0.2158433496952057, "step": 1370, "valid_targets_mean": 1352.9, "valid_targets_min": 684 }, { "epoch": 1.444327731092437, "grad_norm": 0.6820026840811728, "learning_rate": 3.8643873162907086e-05, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.19932374358177185, "step": 1375, "valid_targets_mean": 1479.4, "valid_targets_min": 874 }, { "epoch": 1.449579831932773, "grad_norm": 0.6850687148845401, "learning_rate": 3.862484757121627e-05, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.19579848647117615, "step": 1380, "valid_targets_mean": 1501.2, "valid_targets_min": 765 }, { "epoch": 1.4548319327731092, "grad_norm": 0.6990618001541059, "learning_rate": 3.860569419915727e-05, "loss": 0.2082, "loss_nan_ranks": 0, "loss_rank_avg": 0.20401817560195923, "step": 1385, "valid_targets_mean": 1419.9, "valid_targets_min": 589 }, { "epoch": 1.4600840336134453, "grad_norm": 0.699051470230191, "learning_rate": 3.858641317813653e-05, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.23287919163703918, "step": 1390, "valid_targets_mean": 1587.2, "valid_targets_min": 918 }, { "epoch": 1.4653361344537816, "grad_norm": 0.5943455101511255, "learning_rate": 3.8567004640436234e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.3295353651046753, "step": 1395, "valid_targets_mean": 3546.9, "valid_targets_min": 702 }, { "epoch": 1.4705882352941178, "grad_norm": 0.570252231140088, "learning_rate": 3.8547468719213476e-05, "loss": 0.3267, "loss_nan_ranks": 0, "loss_rank_avg": 0.33764392137527466, "step": 1400, "valid_targets_mean": 4000.6, "valid_targets_min": 1005 }, { "epoch": 1.4758403361344539, "grad_norm": 0.5515303020894601, "learning_rate": 3.852780554849925e-05, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.3034968376159668, "step": 1405, "valid_targets_mean": 4063.9, "valid_targets_min": 1296 }, { "epoch": 1.48109243697479, "grad_norm": 0.5595030961730294, "learning_rate": 3.850801526319761e-05, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.288005530834198, "step": 1410, "valid_targets_mean": 3747.0, "valid_targets_min": 1561 }, { "epoch": 1.486344537815126, "grad_norm": 0.5948008178131649, "learning_rate": 3.84880979990847e-05, "loss": 0.304, "loss_nan_ranks": 0, "loss_rank_avg": 0.32669079303741455, "step": 1415, "valid_targets_mean": 3562.5, "valid_targets_min": 1044 }, { "epoch": 1.4915966386554622, "grad_norm": 0.5216067222057376, "learning_rate": 3.846805389280782e-05, "loss": 0.3154, "loss_nan_ranks": 0, "loss_rank_avg": 0.2934839725494385, "step": 1420, "valid_targets_mean": 3911.4, "valid_targets_min": 920 }, { "epoch": 1.4968487394957983, "grad_norm": 0.4836038411370819, "learning_rate": 3.844788308188452e-05, "loss": 0.2861, "loss_nan_ranks": 0, "loss_rank_avg": 0.3024061918258667, "step": 1425, "valid_targets_mean": 5753.8, "valid_targets_min": 2060 }, { "epoch": 1.5021008403361344, "grad_norm": 0.5556606445880677, "learning_rate": 3.8427585704701634e-05, "loss": 0.3043, "loss_nan_ranks": 0, "loss_rank_avg": 0.31254953145980835, "step": 1430, "valid_targets_mean": 3728.6, "valid_targets_min": 467 }, { "epoch": 1.5073529411764706, "grad_norm": 0.5895498142754928, "learning_rate": 3.840716190051433e-05, "loss": 0.3141, "loss_nan_ranks": 0, "loss_rank_avg": 0.32763177156448364, "step": 1435, "valid_targets_mean": 3554.0, "valid_targets_min": 1689 }, { "epoch": 1.5126050420168067, "grad_norm": 0.54899724482139, "learning_rate": 3.8386611809445155e-05, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.30432096123695374, "step": 1440, "valid_targets_mean": 3708.1, "valid_targets_min": 1697 }, { "epoch": 1.5178571428571428, "grad_norm": 0.6115854171093719, "learning_rate": 3.8365935572483095e-05, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.3384946882724762, "step": 1445, "valid_targets_mean": 3652.6, "valid_targets_min": 1223 }, { "epoch": 1.523109243697479, "grad_norm": 0.5435695015200867, "learning_rate": 3.834513333148258e-05, "loss": 0.3085, "loss_nan_ranks": 0, "loss_rank_avg": 0.3052658438682556, "step": 1450, "valid_targets_mean": 4036.1, "valid_targets_min": 1552 }, { "epoch": 1.528361344537815, "grad_norm": 0.614280577128499, "learning_rate": 3.832420522916252e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.316119909286499, "step": 1455, "valid_targets_mean": 3543.5, "valid_targets_min": 1439 }, { "epoch": 1.5336134453781511, "grad_norm": 0.5885577114747288, "learning_rate": 3.830315140910534e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.30280590057373047, "step": 1460, "valid_targets_mean": 3287.0, "valid_targets_min": 1402 }, { "epoch": 1.5388655462184873, "grad_norm": 0.6135025188561368, "learning_rate": 3.8281972015755965e-05, "loss": 0.3204, "loss_nan_ranks": 0, "loss_rank_avg": 0.3206782341003418, "step": 1465, "valid_targets_mean": 3423.9, "valid_targets_min": 1586 }, { "epoch": 1.5441176470588234, "grad_norm": 0.584621502686007, "learning_rate": 3.826066719442086e-05, "loss": 0.3117, "loss_nan_ranks": 0, "loss_rank_avg": 0.3108097314834595, "step": 1470, "valid_targets_mean": 3406.0, "valid_targets_min": 1538 }, { "epoch": 1.5493697478991597, "grad_norm": 0.6706962593993887, "learning_rate": 3.823923709126701e-05, "loss": 0.3158, "loss_nan_ranks": 0, "loss_rank_avg": 0.31825387477874756, "step": 1475, "valid_targets_mean": 2954.0, "valid_targets_min": 1058 }, { "epoch": 1.5546218487394958, "grad_norm": 0.651116388475916, "learning_rate": 3.821768185332095e-05, "loss": 0.3305, "loss_nan_ranks": 0, "loss_rank_avg": 0.32802870869636536, "step": 1480, "valid_targets_mean": 3051.8, "valid_targets_min": 1362 }, { "epoch": 1.559873949579832, "grad_norm": 0.5745329146566351, "learning_rate": 3.81960016284677e-05, "loss": 0.3145, "loss_nan_ranks": 0, "loss_rank_avg": 0.3129153251647949, "step": 1485, "valid_targets_mean": 3620.5, "valid_targets_min": 1392 }, { "epoch": 1.565126050420168, "grad_norm": 0.6580272364249068, "learning_rate": 3.817419656544979e-05, "loss": 0.3154, "loss_nan_ranks": 0, "loss_rank_avg": 0.3198480010032654, "step": 1490, "valid_targets_mean": 3103.6, "valid_targets_min": 1267 }, { "epoch": 1.5703781512605042, "grad_norm": 0.6033632847231352, "learning_rate": 3.815226681386626e-05, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.3069283664226532, "step": 1495, "valid_targets_mean": 3592.7, "valid_targets_min": 1026 }, { "epoch": 1.5756302521008403, "grad_norm": 0.5732499269923438, "learning_rate": 3.8130212524171576e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.30469539761543274, "step": 1500, "valid_targets_mean": 3632.1, "valid_targets_min": 1785 }, { "epoch": 1.5808823529411766, "grad_norm": 0.5775861462441018, "learning_rate": 3.810803384767465e-05, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.2886812388896942, "step": 1505, "valid_targets_mean": 3557.1, "valid_targets_min": 1957 }, { "epoch": 1.5861344537815127, "grad_norm": 0.5694130410160565, "learning_rate": 3.808573093653777e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.2857256233692169, "step": 1510, "valid_targets_mean": 3230.6, "valid_targets_min": 1570 }, { "epoch": 1.5913865546218489, "grad_norm": 0.6246265430681128, "learning_rate": 3.806330394377556e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.30203184485435486, "step": 1515, "valid_targets_mean": 3023.7, "valid_targets_min": 997 }, { "epoch": 1.596638655462185, "grad_norm": 0.658813587454356, "learning_rate": 3.8040753023253956e-05, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.33436664938926697, "step": 1520, "valid_targets_mean": 3056.6, "valid_targets_min": 1293 }, { "epoch": 1.601890756302521, "grad_norm": 0.6211106779673433, "learning_rate": 3.801807832968912e-05, "loss": 0.3093, "loss_nan_ranks": 0, "loss_rank_avg": 0.29863476753234863, "step": 1525, "valid_targets_mean": 2915.6, "valid_targets_min": 1687 }, { "epoch": 1.6071428571428572, "grad_norm": 0.6368491555844873, "learning_rate": 3.799528001864637e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.33547699451446533, "step": 1530, "valid_targets_mean": 2985.1, "valid_targets_min": 1108 }, { "epoch": 1.6123949579831933, "grad_norm": 0.5840908746370534, "learning_rate": 3.797235824653918e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.3032509684562683, "step": 1535, "valid_targets_mean": 3195.0, "valid_targets_min": 571 }, { "epoch": 1.6176470588235294, "grad_norm": 0.6352859314737174, "learning_rate": 3.7949313170628006e-05, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.3243550956249237, "step": 1540, "valid_targets_mean": 3106.2, "valid_targets_min": 738 }, { "epoch": 1.6228991596638656, "grad_norm": 0.6224156356901303, "learning_rate": 3.79261449490193e-05, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.30039089918136597, "step": 1545, "valid_targets_mean": 3189.5, "valid_targets_min": 1896 }, { "epoch": 1.6281512605042017, "grad_norm": 0.6278005675540494, "learning_rate": 3.7902853740664356e-05, "loss": 0.3128, "loss_nan_ranks": 0, "loss_rank_avg": 0.3083696663379669, "step": 1550, "valid_targets_mean": 3278.9, "valid_targets_min": 1177 }, { "epoch": 1.6334033613445378, "grad_norm": 0.5850412843704133, "learning_rate": 3.7879439705358286e-05, "loss": 0.3043, "loss_nan_ranks": 0, "loss_rank_avg": 0.3127497732639313, "step": 1555, "valid_targets_mean": 3398.8, "valid_targets_min": 1270 }, { "epoch": 1.638655462184874, "grad_norm": 0.5805366053879955, "learning_rate": 3.785590300373884e-05, "loss": 0.3063, "loss_nan_ranks": 0, "loss_rank_avg": 0.29494237899780273, "step": 1560, "valid_targets_mean": 3829.2, "valid_targets_min": 1668 }, { "epoch": 1.64390756302521, "grad_norm": 0.569934576020579, "learning_rate": 3.7832243797285385e-05, "loss": 0.3052, "loss_nan_ranks": 0, "loss_rank_avg": 0.3094933032989502, "step": 1565, "valid_targets_mean": 3426.9, "valid_targets_min": 1184 }, { "epoch": 1.6491596638655461, "grad_norm": 0.6159772681925453, "learning_rate": 3.780846224831775e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.3124518394470215, "step": 1570, "valid_targets_mean": 3523.6, "valid_targets_min": 1858 }, { "epoch": 1.6544117647058822, "grad_norm": 0.5971056987489094, "learning_rate": 3.7784558519995135e-05, "loss": 0.3075, "loss_nan_ranks": 0, "loss_rank_avg": 0.28216129541397095, "step": 1575, "valid_targets_mean": 3161.2, "valid_targets_min": 922 }, { "epoch": 1.6596638655462184, "grad_norm": 0.699651916524887, "learning_rate": 3.776053277631496e-05, "loss": 0.3079, "loss_nan_ranks": 0, "loss_rank_avg": 0.34362688660621643, "step": 1580, "valid_targets_mean": 2948.9, "valid_targets_min": 1812 }, { "epoch": 1.6649159663865545, "grad_norm": 0.7182980448996313, "learning_rate": 3.7736385182111785e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.2877700626850128, "step": 1585, "valid_targets_mean": 3107.7, "valid_targets_min": 977 }, { "epoch": 1.6701680672268906, "grad_norm": 0.5675825049010571, "learning_rate": 3.771211590305614e-05, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.2754617929458618, "step": 1590, "valid_targets_mean": 3372.6, "valid_targets_min": 810 }, { "epoch": 1.675420168067227, "grad_norm": 0.5802055167295502, "learning_rate": 3.768772510565342e-05, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.29426002502441406, "step": 1595, "valid_targets_mean": 3305.2, "valid_targets_min": 1673 }, { "epoch": 1.680672268907563, "grad_norm": 0.5249464047322138, "learning_rate": 3.76632129572427e-05, "loss": 0.2977, "loss_nan_ranks": 0, "loss_rank_avg": 0.2580610513687134, "step": 1600, "valid_targets_mean": 3933.0, "valid_targets_min": 1869 }, { "epoch": 1.6859243697478992, "grad_norm": 1.426921636472864, "learning_rate": 3.763857962599565e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.3049716353416443, "step": 1605, "valid_targets_mean": 3010.2, "valid_targets_min": 1377 }, { "epoch": 1.6911764705882353, "grad_norm": 0.6454799620397031, "learning_rate": 3.761382528091531e-05, "loss": 0.3122, "loss_nan_ranks": 0, "loss_rank_avg": 0.30134791135787964, "step": 1610, "valid_targets_mean": 3055.6, "valid_targets_min": 1219 }, { "epoch": 1.6964285714285714, "grad_norm": 0.5717900298014066, "learning_rate": 3.7588950091834986e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911268174648285, "step": 1615, "valid_targets_mean": 3442.4, "valid_targets_min": 1168 }, { "epoch": 1.7016806722689075, "grad_norm": 0.645609709718482, "learning_rate": 3.756395422941706e-05, "loss": 0.2833, "loss_nan_ranks": 0, "loss_rank_avg": 0.30699074268341064, "step": 1620, "valid_targets_mean": 3041.9, "valid_targets_min": 1955 }, { "epoch": 1.7069327731092439, "grad_norm": 0.5866883370447175, "learning_rate": 3.753883786515181e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.2968907654285431, "step": 1625, "valid_targets_mean": 3640.2, "valid_targets_min": 1628 }, { "epoch": 1.71218487394958, "grad_norm": 0.5743154885711474, "learning_rate": 3.751360117135628e-05, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.2586438059806824, "step": 1630, "valid_targets_mean": 3358.4, "valid_targets_min": 1482 }, { "epoch": 1.717436974789916, "grad_norm": 0.5881142433423517, "learning_rate": 3.7488244321173025e-05, "loss": 0.2883, "loss_nan_ranks": 0, "loss_rank_avg": 0.26784512400627136, "step": 1635, "valid_targets_mean": 3460.4, "valid_targets_min": 904 }, { "epoch": 1.7226890756302522, "grad_norm": 0.6168171706911441, "learning_rate": 3.746276748856898e-05, "loss": 0.2982, "loss_nan_ranks": 0, "loss_rank_avg": 0.3478624224662781, "step": 1640, "valid_targets_mean": 3728.4, "valid_targets_min": 1194 }, { "epoch": 1.7279411764705883, "grad_norm": 0.5755170388250846, "learning_rate": 3.743717084833425e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.30867037177085876, "step": 1645, "valid_targets_mean": 3940.4, "valid_targets_min": 1658 }, { "epoch": 1.7331932773109244, "grad_norm": 0.6224361276979423, "learning_rate": 3.741145457608093e-05, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.31917211413383484, "step": 1650, "valid_targets_mean": 3536.9, "valid_targets_min": 1423 }, { "epoch": 1.7384453781512605, "grad_norm": 0.6144445149004428, "learning_rate": 3.738561884824183e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.3049688935279846, "step": 1655, "valid_targets_mean": 3351.2, "valid_targets_min": 2010 }, { "epoch": 1.7436974789915967, "grad_norm": 0.5954264479652966, "learning_rate": 3.735966384206936e-05, "loss": 0.3155, "loss_nan_ranks": 0, "loss_rank_avg": 0.30082428455352783, "step": 1660, "valid_targets_mean": 3498.6, "valid_targets_min": 1172 }, { "epoch": 1.7489495798319328, "grad_norm": 0.5715440496549611, "learning_rate": 3.733358973563425e-05, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.2998632788658142, "step": 1665, "valid_targets_mean": 3863.8, "valid_targets_min": 1229 }, { "epoch": 1.754201680672269, "grad_norm": 0.6026903585406433, "learning_rate": 3.730739670782435e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.2936575412750244, "step": 1670, "valid_targets_mean": 3600.5, "valid_targets_min": 1523 }, { "epoch": 1.759453781512605, "grad_norm": 0.5960750461839239, "learning_rate": 3.72810849383434e-05, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.286255419254303, "step": 1675, "valid_targets_mean": 3623.9, "valid_targets_min": 997 }, { "epoch": 1.7647058823529411, "grad_norm": 0.5856872929601087, "learning_rate": 3.725465460770978e-05, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.29570281505584717, "step": 1680, "valid_targets_mean": 3535.2, "valid_targets_min": 621 }, { "epoch": 1.7699579831932772, "grad_norm": 0.6652466131769478, "learning_rate": 3.7228105897255324e-05, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.29390841722488403, "step": 1685, "valid_targets_mean": 3071.5, "valid_targets_min": 1282 }, { "epoch": 1.7752100840336134, "grad_norm": 0.5607387594187455, "learning_rate": 3.7201438989124e-05, "loss": 0.2794, "loss_nan_ranks": 0, "loss_rank_avg": 0.25984397530555725, "step": 1690, "valid_targets_mean": 3779.1, "valid_targets_min": 1421 }, { "epoch": 1.7804621848739495, "grad_norm": 0.5923487985204593, "learning_rate": 3.717465406627074e-05, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.27242133021354675, "step": 1695, "valid_targets_mean": 3330.2, "valid_targets_min": 1853 }, { "epoch": 1.7857142857142856, "grad_norm": 0.5899947816496157, "learning_rate": 3.714775131246011e-05, "loss": 0.314, "loss_nan_ranks": 0, "loss_rank_avg": 0.2966066002845764, "step": 1700, "valid_targets_mean": 3327.8, "valid_targets_min": 1410 }, { "epoch": 1.7909663865546217, "grad_norm": 0.66060731387224, "learning_rate": 3.71207309122651e-05, "loss": 0.289, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911011576652527, "step": 1705, "valid_targets_mean": 2920.6, "valid_targets_min": 1305 }, { "epoch": 1.7962184873949578, "grad_norm": 0.5843889526857856, "learning_rate": 3.709359305106585e-05, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.2868155837059021, "step": 1710, "valid_targets_mean": 3539.7, "valid_targets_min": 996 }, { "epoch": 1.8014705882352942, "grad_norm": 0.586228171865445, "learning_rate": 3.7066337915048354e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.27134719491004944, "step": 1715, "valid_targets_mean": 3357.1, "valid_targets_min": 1349 }, { "epoch": 1.8067226890756303, "grad_norm": 0.606158452920606, "learning_rate": 3.7038965691203205e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.31426700949668884, "step": 1720, "valid_targets_mean": 3613.5, "valid_targets_min": 1248 }, { "epoch": 1.8119747899159664, "grad_norm": 0.5526990318942386, "learning_rate": 3.701147656732431e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.24181315302848816, "step": 1725, "valid_targets_mean": 3327.4, "valid_targets_min": 1109 }, { "epoch": 1.8172268907563025, "grad_norm": 0.6528173405719958, "learning_rate": 3.6983870732007596e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.2989552617073059, "step": 1730, "valid_targets_mean": 2790.8, "valid_targets_min": 1649 }, { "epoch": 1.8224789915966386, "grad_norm": 0.6835745034650174, "learning_rate": 3.695614837464972e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.3165176808834076, "step": 1735, "valid_targets_mean": 2811.8, "valid_targets_min": 1197 }, { "epoch": 1.8277310924369747, "grad_norm": 0.6755172073863958, "learning_rate": 3.692830968544675e-05, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.3160332441329956, "step": 1740, "valid_targets_mean": 3420.2, "valid_targets_min": 1720 }, { "epoch": 1.832983193277311, "grad_norm": 0.6087751854436854, "learning_rate": 3.690035485539291e-05, "loss": 0.2993, "loss_nan_ranks": 0, "loss_rank_avg": 0.29514777660369873, "step": 1745, "valid_targets_mean": 3542.7, "valid_targets_min": 1054 }, { "epoch": 1.8382352941176472, "grad_norm": 0.6241785789650026, "learning_rate": 3.6872284076279205e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.2934738099575043, "step": 1750, "valid_targets_mean": 3049.7, "valid_targets_min": 1643 }, { "epoch": 1.8434873949579833, "grad_norm": 0.5825825660256299, "learning_rate": 3.684409754069215e-05, "loss": 0.3039, "loss_nan_ranks": 0, "loss_rank_avg": 0.30002132058143616, "step": 1755, "valid_targets_mean": 3757.8, "valid_targets_min": 1135 }, { "epoch": 1.8487394957983194, "grad_norm": 0.6258913745185652, "learning_rate": 3.681579544201244e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.290172278881073, "step": 1760, "valid_targets_mean": 3715.1, "valid_targets_min": 1174 }, { "epoch": 1.8539915966386555, "grad_norm": 0.6554971879023268, "learning_rate": 3.6787377974413614e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.32472649216651917, "step": 1765, "valid_targets_mean": 3321.9, "valid_targets_min": 992 }, { "epoch": 1.8592436974789917, "grad_norm": 0.6104106962565312, "learning_rate": 3.6758845332860734e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.320326030254364, "step": 1770, "valid_targets_mean": 3713.2, "valid_targets_min": 1133 }, { "epoch": 1.8644957983193278, "grad_norm": 0.6602404199908332, "learning_rate": 3.673019771310903e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.3192262649536133, "step": 1775, "valid_targets_mean": 2961.8, "valid_targets_min": 1195 }, { "epoch": 1.8697478991596639, "grad_norm": 0.9226641425449463, "learning_rate": 3.670143531170258e-05, "loss": 0.3044, "loss_nan_ranks": 0, "loss_rank_avg": 0.30954253673553467, "step": 1780, "valid_targets_mean": 3012.6, "valid_targets_min": 484 }, { "epoch": 1.875, "grad_norm": 0.5947567961611435, "learning_rate": 3.667255832597294e-05, "loss": 0.2982, "loss_nan_ranks": 0, "loss_rank_avg": 0.3080810010433197, "step": 1785, "valid_targets_mean": 3639.9, "valid_targets_min": 1434 }, { "epoch": 1.8802521008403361, "grad_norm": 0.5635109826748741, "learning_rate": 3.664356695403781e-05, "loss": 0.2972, "loss_nan_ranks": 0, "loss_rank_avg": 0.2792786955833435, "step": 1790, "valid_targets_mean": 4017.4, "valid_targets_min": 1349 }, { "epoch": 1.8855042016806722, "grad_norm": 0.7060376087001079, "learning_rate": 3.661446139479965e-05, "loss": 0.2965, "loss_nan_ranks": 0, "loss_rank_avg": 0.31975793838500977, "step": 1795, "valid_targets_mean": 3178.8, "valid_targets_min": 1434 }, { "epoch": 1.8907563025210083, "grad_norm": 0.5936744481364934, "learning_rate": 3.658524184794436e-05, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.2860378324985504, "step": 1800, "valid_targets_mean": 3633.9, "valid_targets_min": 521 }, { "epoch": 1.8960084033613445, "grad_norm": 0.5822754669183862, "learning_rate": 3.655590851393984e-05, "loss": 0.3049, "loss_nan_ranks": 0, "loss_rank_avg": 0.3000732660293579, "step": 1805, "valid_targets_mean": 3981.0, "valid_targets_min": 1464 }, { "epoch": 1.9012605042016806, "grad_norm": 0.6913451388646343, "learning_rate": 3.652646159403468e-05, "loss": 0.3136, "loss_nan_ranks": 0, "loss_rank_avg": 0.3260645866394043, "step": 1810, "valid_targets_mean": 2612.0, "valid_targets_min": 1239 }, { "epoch": 1.9065126050420167, "grad_norm": 0.6287538437173945, "learning_rate": 3.649690129025675e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.29579633474349976, "step": 1815, "valid_targets_mean": 3489.8, "valid_targets_min": 1457 }, { "epoch": 1.9117647058823528, "grad_norm": 0.6767664513173561, "learning_rate": 3.6467227805411824e-05, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.29462265968322754, "step": 1820, "valid_targets_mean": 3059.1, "valid_targets_min": 1460 }, { "epoch": 1.917016806722689, "grad_norm": 0.6395995499615521, "learning_rate": 3.6437441343082174e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.3023369312286377, "step": 1825, "valid_targets_mean": 3259.2, "valid_targets_min": 1084 }, { "epoch": 1.9222689075630253, "grad_norm": 0.5856128524517397, "learning_rate": 3.6407542107625167e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.27946245670318604, "step": 1830, "valid_targets_mean": 3337.9, "valid_targets_min": 1035 }, { "epoch": 1.9275210084033614, "grad_norm": 0.5516337340536542, "learning_rate": 3.637753030417192e-05, "loss": 0.282, "loss_nan_ranks": 0, "loss_rank_avg": 0.2830444574356079, "step": 1835, "valid_targets_mean": 4091.9, "valid_targets_min": 1876 }, { "epoch": 1.9327731092436975, "grad_norm": 0.6188213113954284, "learning_rate": 3.6347406138625805e-05, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.3005865812301636, "step": 1840, "valid_targets_mean": 3705.8, "valid_targets_min": 1062 }, { "epoch": 1.9380252100840336, "grad_norm": 0.6342838492371049, "learning_rate": 3.631716981766111e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.2753984034061432, "step": 1845, "valid_targets_mean": 3030.8, "valid_targets_min": 993 }, { "epoch": 1.9432773109243697, "grad_norm": 0.5880238709579537, "learning_rate": 3.6286821548721594e-05, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.28602135181427, "step": 1850, "valid_targets_mean": 3366.9, "valid_targets_min": 873 }, { "epoch": 1.9485294117647058, "grad_norm": 0.5720082036013604, "learning_rate": 3.625636154001904e-05, "loss": 0.2821, "loss_nan_ranks": 0, "loss_rank_avg": 0.2676365375518799, "step": 1855, "valid_targets_mean": 3651.0, "valid_targets_min": 1295 }, { "epoch": 1.9537815126050422, "grad_norm": 0.585699773613234, "learning_rate": 3.622579000053186e-05, "loss": 0.2902, "loss_nan_ranks": 0, "loss_rank_avg": 0.29407864809036255, "step": 1860, "valid_targets_mean": 3583.6, "valid_targets_min": 1598 }, { "epoch": 1.9590336134453783, "grad_norm": 0.6205691001395918, "learning_rate": 3.619510714000368e-05, "loss": 0.3088, "loss_nan_ranks": 0, "loss_rank_avg": 0.27674800157546997, "step": 1865, "valid_targets_mean": 2903.2, "valid_targets_min": 1123 }, { "epoch": 1.9642857142857144, "grad_norm": 0.7438366690160714, "learning_rate": 3.616431316894181e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.31191760301589966, "step": 1870, "valid_targets_mean": 3116.1, "valid_targets_min": 1621 }, { "epoch": 1.9695378151260505, "grad_norm": 0.6496526680316776, "learning_rate": 3.613340829861592e-05, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.2977924346923828, "step": 1875, "valid_targets_mean": 3081.4, "valid_targets_min": 1858 }, { "epoch": 1.9747899159663866, "grad_norm": 0.5707764114436218, "learning_rate": 3.61023927410565e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.25262773036956787, "step": 1880, "valid_targets_mean": 3470.7, "valid_targets_min": 420 }, { "epoch": 1.9800420168067228, "grad_norm": 0.601493220440057, "learning_rate": 3.607126670905346e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.2920111417770386, "step": 1885, "valid_targets_mean": 3584.2, "valid_targets_min": 757 }, { "epoch": 1.9852941176470589, "grad_norm": 0.6874129379616689, "learning_rate": 3.60400304161546e-05, "loss": 0.3002, "loss_nan_ranks": 0, "loss_rank_avg": 0.2971467673778534, "step": 1890, "valid_targets_mean": 2940.8, "valid_targets_min": 732 }, { "epoch": 1.990546218487395, "grad_norm": 0.6483438175679863, "learning_rate": 3.600868407666426e-05, "loss": 0.2939, "loss_nan_ranks": 0, "loss_rank_avg": 0.29474449157714844, "step": 1895, "valid_targets_mean": 3248.2, "valid_targets_min": 929 }, { "epoch": 1.995798319327731, "grad_norm": 0.5918173246249905, "learning_rate": 3.597722790564172e-05, "loss": 0.2929, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911064624786377, "step": 1900, "valid_targets_mean": 3728.8, "valid_targets_min": 1217 }, { "epoch": 2.0010504201680672, "grad_norm": 1.269479871339695, "learning_rate": 3.5945662118899824e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.21561074256896973, "step": 1905, "valid_targets_mean": 1523.7, "valid_targets_min": 544 }, { "epoch": 2.0063025210084033, "grad_norm": 0.834502760942854, "learning_rate": 3.5913986933003455e-05, "loss": 0.2186, "loss_nan_ranks": 0, "loss_rank_avg": 0.1978900134563446, "step": 1910, "valid_targets_mean": 1311.9, "valid_targets_min": 632 }, { "epoch": 2.0115546218487395, "grad_norm": 0.8472702704612042, "learning_rate": 3.5882202565268046e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.19883087277412415, "step": 1915, "valid_targets_mean": 1391.8, "valid_targets_min": 514 }, { "epoch": 2.0168067226890756, "grad_norm": 0.8558019853903324, "learning_rate": 3.58503092337581e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.2164035588502884, "step": 1920, "valid_targets_mean": 1409.8, "valid_targets_min": 701 }, { "epoch": 2.0220588235294117, "grad_norm": 0.755196603700863, "learning_rate": 3.5818307157285705e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.20270323753356934, "step": 1925, "valid_targets_mean": 1448.8, "valid_targets_min": 742 }, { "epoch": 2.027310924369748, "grad_norm": 0.7296703034732365, "learning_rate": 3.5786196555409006e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.18208900094032288, "step": 1930, "valid_targets_mean": 1219.5, "valid_targets_min": 746 }, { "epoch": 2.032563025210084, "grad_norm": 0.7684329269994562, "learning_rate": 3.575397764843073e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.19005586206912994, "step": 1935, "valid_targets_mean": 1416.7, "valid_targets_min": 774 }, { "epoch": 2.03781512605042, "grad_norm": 0.7346120823737189, "learning_rate": 3.572165065739664e-05, "loss": 0.1847, "loss_nan_ranks": 0, "loss_rank_avg": 0.173833429813385, "step": 1940, "valid_targets_mean": 1294.7, "valid_targets_min": 648 }, { "epoch": 2.043067226890756, "grad_norm": 0.7872472114882302, "learning_rate": 3.5689215804094053e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.19836294651031494, "step": 1945, "valid_targets_mean": 1322.9, "valid_targets_min": 708 }, { "epoch": 2.0483193277310923, "grad_norm": 0.7139156271445127, "learning_rate": 3.5656673311050285e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.166924387216568, "step": 1950, "valid_targets_mean": 1500.9, "valid_targets_min": 788 }, { "epoch": 2.0535714285714284, "grad_norm": 0.7546720109875962, "learning_rate": 3.562402340153115e-05, "loss": 0.1969, "loss_nan_ranks": 0, "loss_rank_avg": 0.1813475340604782, "step": 1955, "valid_targets_mean": 1277.2, "valid_targets_min": 615 }, { "epoch": 2.0588235294117645, "grad_norm": 0.8007930214332662, "learning_rate": 3.559126629953942e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.19298464059829712, "step": 1960, "valid_targets_mean": 1355.1, "valid_targets_min": 627 }, { "epoch": 2.064075630252101, "grad_norm": 1.0715850452767404, "learning_rate": 3.5558402229813287e-05, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.19311118125915527, "step": 1965, "valid_targets_mean": 1323.2, "valid_targets_min": 753 }, { "epoch": 2.069327731092437, "grad_norm": 0.7534257104768941, "learning_rate": 3.552543141782483e-05, "loss": 0.1896, "loss_nan_ranks": 0, "loss_rank_avg": 0.19203367829322815, "step": 1970, "valid_targets_mean": 1427.2, "valid_targets_min": 740 }, { "epoch": 2.0745798319327733, "grad_norm": 0.7434395907521474, "learning_rate": 3.549235408977843e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.19772931933403015, "step": 1975, "valid_targets_mean": 1519.6, "valid_targets_min": 642 }, { "epoch": 2.0798319327731094, "grad_norm": 0.7265121475274179, "learning_rate": 3.545917047260928e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.16659091413021088, "step": 1980, "valid_targets_mean": 1209.2, "valid_targets_min": 518 }, { "epoch": 2.0850840336134455, "grad_norm": 0.7590657870156368, "learning_rate": 3.542588079398179e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.20139284431934357, "step": 1985, "valid_targets_mean": 1439.6, "valid_targets_min": 721 }, { "epoch": 2.0903361344537816, "grad_norm": 0.7606478486879998, "learning_rate": 3.539248528228801e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.1940763294696808, "step": 1990, "valid_targets_mean": 1469.9, "valid_targets_min": 727 }, { "epoch": 2.0955882352941178, "grad_norm": 0.7061929545295577, "learning_rate": 3.535898416664611e-05, "loss": 0.2012, "loss_nan_ranks": 0, "loss_rank_avg": 0.19255903363227844, "step": 1995, "valid_targets_mean": 1412.1, "valid_targets_min": 803 }, { "epoch": 2.100840336134454, "grad_norm": 0.7887719103581653, "learning_rate": 3.5325377676898766e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.2186465561389923, "step": 2000, "valid_targets_mean": 1546.6, "valid_targets_min": 698 }, { "epoch": 2.10609243697479, "grad_norm": 0.8070718344561886, "learning_rate": 3.529166604361161e-05, "loss": 0.1912, "loss_nan_ranks": 0, "loss_rank_avg": 0.2157689332962036, "step": 2005, "valid_targets_mean": 1728.5, "valid_targets_min": 832 }, { "epoch": 2.111344537815126, "grad_norm": 0.6799684604036553, "learning_rate": 3.525784949807162e-05, "loss": 0.1942, "loss_nan_ranks": 0, "loss_rank_avg": 0.18615804612636566, "step": 2010, "valid_targets_mean": 1575.1, "valid_targets_min": 891 }, { "epoch": 2.116596638655462, "grad_norm": 0.7859292131535734, "learning_rate": 3.522392827228557e-05, "loss": 0.194, "loss_nan_ranks": 0, "loss_rank_avg": 0.20224624872207642, "step": 2015, "valid_targets_mean": 1346.5, "valid_targets_min": 621 }, { "epoch": 2.1218487394957983, "grad_norm": 0.7769917237320048, "learning_rate": 3.518990259897841e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.16991014778614044, "step": 2020, "valid_targets_mean": 1285.5, "valid_targets_min": 697 }, { "epoch": 2.1271008403361344, "grad_norm": 0.7202399948858199, "learning_rate": 3.515577271159167e-05, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.1941305696964264, "step": 2025, "valid_targets_mean": 1565.5, "valid_targets_min": 824 }, { "epoch": 2.1323529411764706, "grad_norm": 0.7845226485201681, "learning_rate": 3.512153884428188e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.17622260749340057, "step": 2030, "valid_targets_mean": 1331.2, "valid_targets_min": 584 }, { "epoch": 2.1376050420168067, "grad_norm": 0.7398989600657419, "learning_rate": 3.5087201231918944e-05, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.1894277185201645, "step": 2035, "valid_targets_mean": 1568.8, "valid_targets_min": 1033 }, { "epoch": 2.142857142857143, "grad_norm": 0.7770180042406308, "learning_rate": 3.505276011008454e-05, "loss": 0.1929, "loss_nan_ranks": 0, "loss_rank_avg": 0.2185641974210739, "step": 2040, "valid_targets_mean": 1584.9, "valid_targets_min": 1007 }, { "epoch": 2.148109243697479, "grad_norm": 0.78686344769378, "learning_rate": 3.501821571507048e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.1753498911857605, "step": 2045, "valid_targets_mean": 1267.1, "valid_targets_min": 613 }, { "epoch": 2.153361344537815, "grad_norm": 1.063699580344548, "learning_rate": 3.498356828387714e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.1909262090921402, "step": 2050, "valid_targets_mean": 1532.2, "valid_targets_min": 768 }, { "epoch": 2.158613445378151, "grad_norm": 0.7643365744929539, "learning_rate": 3.494881805421176e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.16610810160636902, "step": 2055, "valid_targets_mean": 1112.7, "valid_targets_min": 643 }, { "epoch": 2.1638655462184873, "grad_norm": 0.7926765771940254, "learning_rate": 3.4913965264486894e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.18852682411670685, "step": 2060, "valid_targets_mean": 1402.3, "valid_targets_min": 841 }, { "epoch": 2.1691176470588234, "grad_norm": 0.729414923035659, "learning_rate": 3.48790101538187e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.18665212392807007, "step": 2065, "valid_targets_mean": 1577.6, "valid_targets_min": 705 }, { "epoch": 2.1743697478991595, "grad_norm": 0.8405323016094074, "learning_rate": 3.484395296202537e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.1933499127626419, "step": 2070, "valid_targets_mean": 1190.7, "valid_targets_min": 716 }, { "epoch": 2.1796218487394956, "grad_norm": 0.7875851862101669, "learning_rate": 3.480879392962541e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.17440925538539886, "step": 2075, "valid_targets_mean": 1209.2, "valid_targets_min": 627 }, { "epoch": 2.184873949579832, "grad_norm": 0.7185518361219825, "learning_rate": 3.477353329783606e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.16545218229293823, "step": 2080, "valid_targets_mean": 1253.7, "valid_targets_min": 619 }, { "epoch": 2.190126050420168, "grad_norm": 0.7600617986037965, "learning_rate": 3.4738171308571595e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.19123047590255737, "step": 2085, "valid_targets_mean": 1403.3, "valid_targets_min": 734 }, { "epoch": 2.1953781512605044, "grad_norm": 0.7730815354374817, "learning_rate": 3.470270820444168e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.18116678297519684, "step": 2090, "valid_targets_mean": 1356.3, "valid_targets_min": 700 }, { "epoch": 2.2006302521008405, "grad_norm": 0.7542365322548513, "learning_rate": 3.4667144228749697e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.18537303805351257, "step": 2095, "valid_targets_mean": 1550.9, "valid_targets_min": 892 }, { "epoch": 2.2058823529411766, "grad_norm": 0.7438888508924026, "learning_rate": 3.463147962549109e-05, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.16940736770629883, "step": 2100, "valid_targets_mean": 1295.9, "valid_targets_min": 711 }, { "epoch": 2.2111344537815127, "grad_norm": 0.7547714805297574, "learning_rate": 3.459571463935168e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.16632413864135742, "step": 2105, "valid_targets_mean": 1380.6, "valid_targets_min": 694 }, { "epoch": 2.216386554621849, "grad_norm": 0.7974469156906152, "learning_rate": 3.455984951570598e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.20498281717300415, "step": 2110, "valid_targets_mean": 1487.6, "valid_targets_min": 818 }, { "epoch": 2.221638655462185, "grad_norm": 0.7460498917875708, "learning_rate": 3.452388450061556e-05, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.1839742511510849, "step": 2115, "valid_targets_mean": 1640.1, "valid_targets_min": 1011 }, { "epoch": 2.226890756302521, "grad_norm": 0.7976082882204165, "learning_rate": 3.448781984082727e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.1880989819765091, "step": 2120, "valid_targets_mean": 1356.1, "valid_targets_min": 748 }, { "epoch": 2.232142857142857, "grad_norm": 0.8198726303330894, "learning_rate": 3.4451655783771625e-05, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.19785097241401672, "step": 2125, "valid_targets_mean": 1494.3, "valid_targets_min": 699 }, { "epoch": 2.2373949579831933, "grad_norm": 0.7959727926112404, "learning_rate": 3.4415392577561064e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.17913001775741577, "step": 2130, "valid_targets_mean": 1201.1, "valid_targets_min": 534 }, { "epoch": 2.2426470588235294, "grad_norm": 0.7163813248237905, "learning_rate": 3.4379030470988285e-05, "loss": 0.1909, "loss_nan_ranks": 0, "loss_rank_avg": 0.1842835247516632, "step": 2135, "valid_targets_mean": 1393.6, "valid_targets_min": 687 }, { "epoch": 2.2478991596638656, "grad_norm": 0.7075959634728527, "learning_rate": 3.4342569713524496e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.18208453059196472, "step": 2140, "valid_targets_mean": 1363.2, "valid_targets_min": 549 }, { "epoch": 2.2531512605042017, "grad_norm": 0.7211274630211372, "learning_rate": 3.4306010555317735e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.18160000443458557, "step": 2145, "valid_targets_mean": 1349.1, "valid_targets_min": 725 }, { "epoch": 2.258403361344538, "grad_norm": 0.7402311941740003, "learning_rate": 3.4269353247191135e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.1999184489250183, "step": 2150, "valid_targets_mean": 1651.7, "valid_targets_min": 852 }, { "epoch": 2.263655462184874, "grad_norm": 0.6795776738854672, "learning_rate": 3.423259804064122e-05, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.18849042057991028, "step": 2155, "valid_targets_mean": 1559.5, "valid_targets_min": 1010 }, { "epoch": 2.26890756302521, "grad_norm": 0.7308651601236005, "learning_rate": 3.419574518783616e-05, "loss": 0.1861, "loss_nan_ranks": 0, "loss_rank_avg": 0.17530426383018494, "step": 2160, "valid_targets_mean": 1387.0, "valid_targets_min": 545 }, { "epoch": 2.274159663865546, "grad_norm": 0.8144354216387479, "learning_rate": 3.4158794941614055e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.19270774722099304, "step": 2165, "valid_targets_mean": 1385.4, "valid_targets_min": 843 }, { "epoch": 2.2794117647058822, "grad_norm": 0.631924641323973, "learning_rate": 3.4121747555481216e-05, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.19547529518604279, "step": 2170, "valid_targets_mean": 1716.2, "valid_targets_min": 802 }, { "epoch": 2.2846638655462184, "grad_norm": 0.7544602510753329, "learning_rate": 3.4084603283610365e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.18898774683475494, "step": 2175, "valid_targets_mean": 1409.9, "valid_targets_min": 612 }, { "epoch": 2.2899159663865545, "grad_norm": 0.7250456296463277, "learning_rate": 3.404736238083897e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.17501644790172577, "step": 2180, "valid_targets_mean": 1415.8, "valid_targets_min": 673 }, { "epoch": 2.2951680672268906, "grad_norm": 0.8001168867925627, "learning_rate": 3.401002510266744e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.18818825483322144, "step": 2185, "valid_targets_mean": 1332.9, "valid_targets_min": 705 }, { "epoch": 2.3004201680672267, "grad_norm": 0.6987572245775185, "learning_rate": 3.397259170525739e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.16560634970664978, "step": 2190, "valid_targets_mean": 1402.1, "valid_targets_min": 822 }, { "epoch": 2.3056722689075633, "grad_norm": 0.7531921047773884, "learning_rate": 3.393506244542991e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.16486376523971558, "step": 2195, "valid_targets_mean": 1272.8, "valid_targets_min": 604 }, { "epoch": 2.310924369747899, "grad_norm": 0.6999344056695282, "learning_rate": 3.389743758066374e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.17392639815807343, "step": 2200, "valid_targets_mean": 1460.0, "valid_targets_min": 647 }, { "epoch": 2.3161764705882355, "grad_norm": 0.7036250917228805, "learning_rate": 3.385971736909357e-05, "loss": 0.1777, "loss_nan_ranks": 0, "loss_rank_avg": 0.1617729663848877, "step": 2205, "valid_targets_mean": 1283.6, "valid_targets_min": 613 }, { "epoch": 2.3214285714285716, "grad_norm": 0.7068382427421205, "learning_rate": 3.382190206950822e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.17291636765003204, "step": 2210, "valid_targets_mean": 1288.4, "valid_targets_min": 713 }, { "epoch": 2.3266806722689077, "grad_norm": 0.663523616107997, "learning_rate": 3.3783991941348916e-05, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.16455985605716705, "step": 2215, "valid_targets_mean": 1533.8, "valid_targets_min": 892 }, { "epoch": 2.331932773109244, "grad_norm": 0.7721343986047551, "learning_rate": 3.374598724470745e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.19193603098392487, "step": 2220, "valid_targets_mean": 1345.8, "valid_targets_min": 772 }, { "epoch": 2.33718487394958, "grad_norm": 0.7240487637559474, "learning_rate": 3.370788824032441e-05, "loss": 0.1777, "loss_nan_ranks": 0, "loss_rank_avg": 0.1901538372039795, "step": 2225, "valid_targets_mean": 1601.2, "valid_targets_min": 636 }, { "epoch": 2.342436974789916, "grad_norm": 0.7718537058087979, "learning_rate": 3.366969518958746e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.1778993457555771, "step": 2230, "valid_targets_mean": 1366.1, "valid_targets_min": 641 }, { "epoch": 2.347689075630252, "grad_norm": 0.7977490601269798, "learning_rate": 3.363140835452945e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.20514068007469177, "step": 2235, "valid_targets_mean": 1482.2, "valid_targets_min": 818 }, { "epoch": 2.3529411764705883, "grad_norm": 0.7668591077227411, "learning_rate": 3.3593027997826654e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.1879502534866333, "step": 2240, "valid_targets_mean": 1420.5, "valid_targets_min": 729 }, { "epoch": 2.3581932773109244, "grad_norm": 0.7855984838086749, "learning_rate": 3.355455438279702e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.21655318140983582, "step": 2245, "valid_targets_mean": 1723.6, "valid_targets_min": 1001 }, { "epoch": 2.3634453781512605, "grad_norm": 0.7364382070700145, "learning_rate": 3.351598777339827e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.1900310218334198, "step": 2250, "valid_targets_mean": 1626.4, "valid_targets_min": 1175 }, { "epoch": 2.3686974789915967, "grad_norm": 0.7437939379036828, "learning_rate": 3.3477328434226164e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.19543638825416565, "step": 2255, "valid_targets_mean": 1434.9, "valid_targets_min": 779 }, { "epoch": 2.3739495798319328, "grad_norm": 0.7246181422661423, "learning_rate": 3.343857663051264e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.1804441660642624, "step": 2260, "valid_targets_mean": 1413.4, "valid_targets_min": 730 }, { "epoch": 2.379201680672269, "grad_norm": 0.73443894447988, "learning_rate": 3.339973262812403e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.17590978741645813, "step": 2265, "valid_targets_mean": 1360.3, "valid_targets_min": 564 }, { "epoch": 2.384453781512605, "grad_norm": 0.8777730335212939, "learning_rate": 3.336079669355921e-05, "loss": 0.1786, "loss_nan_ranks": 0, "loss_rank_avg": 0.18321183323860168, "step": 2270, "valid_targets_mean": 1550.0, "valid_targets_min": 651 }, { "epoch": 2.389705882352941, "grad_norm": 0.7244538791290572, "learning_rate": 3.332176909394777e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.1737801432609558, "step": 2275, "valid_targets_mean": 1342.3, "valid_targets_min": 716 }, { "epoch": 2.3949579831932772, "grad_norm": 0.7245107985964735, "learning_rate": 3.3282650097048206e-05, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.1800583004951477, "step": 2280, "valid_targets_mean": 1339.6, "valid_targets_min": 707 }, { "epoch": 2.4002100840336134, "grad_norm": 0.7235945312664076, "learning_rate": 3.324343997124606e-05, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.15614992380142212, "step": 2285, "valid_targets_mean": 1459.4, "valid_targets_min": 964 }, { "epoch": 2.4054621848739495, "grad_norm": 0.7567614980512993, "learning_rate": 3.3204138985552094e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.20014092326164246, "step": 2290, "valid_targets_mean": 1562.7, "valid_targets_min": 793 }, { "epoch": 2.4107142857142856, "grad_norm": 0.7418561305374557, "learning_rate": 3.316474740960041e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.17074398696422577, "step": 2295, "valid_targets_mean": 1367.2, "valid_targets_min": 727 }, { "epoch": 2.4159663865546217, "grad_norm": 0.7089430053862654, "learning_rate": 3.312526551364667e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.17129768431186676, "step": 2300, "valid_targets_mean": 1451.4, "valid_targets_min": 734 }, { "epoch": 2.421218487394958, "grad_norm": 0.5820555364713835, "learning_rate": 3.308569356856616e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.1320435255765915, "step": 2305, "valid_targets_mean": 2171.5, "valid_targets_min": 978 }, { "epoch": 2.426470588235294, "grad_norm": 0.6553889260546893, "learning_rate": 3.3046031845851993e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.16868937015533447, "step": 2310, "valid_targets_mean": 1519.2, "valid_targets_min": 595 }, { "epoch": 2.43172268907563, "grad_norm": 0.7087358397507307, "learning_rate": 3.3006280617613214e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.17215979099273682, "step": 2315, "valid_targets_mean": 1396.3, "valid_targets_min": 570 }, { "epoch": 2.4369747899159666, "grad_norm": 0.7369066907552546, "learning_rate": 3.296644015657295e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.18438240885734558, "step": 2320, "valid_targets_mean": 1494.4, "valid_targets_min": 914 }, { "epoch": 2.4422268907563023, "grad_norm": 0.69010875765003, "learning_rate": 3.292651073606652e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.16703712940216064, "step": 2325, "valid_targets_mean": 1541.1, "valid_targets_min": 1070 }, { "epoch": 2.447478991596639, "grad_norm": 0.7340635719059896, "learning_rate": 3.288649263003958e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.18820658326148987, "step": 2330, "valid_targets_mean": 1509.0, "valid_targets_min": 626 }, { "epoch": 2.452731092436975, "grad_norm": 0.7197216030974956, "learning_rate": 3.284638611304623e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.17071965336799622, "step": 2335, "valid_targets_mean": 1484.4, "valid_targets_min": 718 }, { "epoch": 2.457983193277311, "grad_norm": 0.7517975842539306, "learning_rate": 3.280619146024714e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.19978466629981995, "step": 2340, "valid_targets_mean": 1505.0, "valid_targets_min": 762 }, { "epoch": 2.463235294117647, "grad_norm": 0.7266865301196809, "learning_rate": 3.2765908947407665e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.2888498306274414, "step": 2345, "valid_targets_mean": 3602.9, "valid_targets_min": 1698 }, { "epoch": 2.4684873949579833, "grad_norm": 0.5649119554586547, "learning_rate": 3.2725538850895933e-05, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.25794461369514465, "step": 2350, "valid_targets_mean": 3718.5, "valid_targets_min": 533 }, { "epoch": 2.4737394957983194, "grad_norm": 0.7045726718503901, "learning_rate": 3.268508144768096e-05, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.2772102653980255, "step": 2355, "valid_targets_mean": 3299.2, "valid_targets_min": 835 }, { "epoch": 2.4789915966386555, "grad_norm": 0.564312940590048, "learning_rate": 3.264453701533075e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.2812797725200653, "step": 2360, "valid_targets_mean": 4040.6, "valid_targets_min": 1201 }, { "epoch": 2.4842436974789917, "grad_norm": 0.6103845308794094, "learning_rate": 3.260390583201041e-05, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.26815706491470337, "step": 2365, "valid_targets_mean": 3995.7, "valid_targets_min": 980 }, { "epoch": 2.4894957983193278, "grad_norm": 0.5643937322946125, "learning_rate": 3.2563188176480217e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.31056275963783264, "step": 2370, "valid_targets_mean": 4070.5, "valid_targets_min": 1744 }, { "epoch": 2.494747899159664, "grad_norm": 0.5232363392589175, "learning_rate": 3.252238432809368e-05, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.22355665266513824, "step": 2375, "valid_targets_mean": 3831.8, "valid_targets_min": 1734 }, { "epoch": 2.5, "grad_norm": 0.666569390983386, "learning_rate": 3.2481494566795716e-05, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.2557009756565094, "step": 2380, "valid_targets_mean": 4593.9, "valid_targets_min": 1381 }, { "epoch": 2.505252100840336, "grad_norm": 0.5634090394701392, "learning_rate": 3.244051917312061e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.2774540185928345, "step": 2385, "valid_targets_mean": 3523.4, "valid_targets_min": 1024 }, { "epoch": 2.5105042016806722, "grad_norm": 0.5827012399453538, "learning_rate": 3.239945842819018e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.27029716968536377, "step": 2390, "valid_targets_mean": 3686.2, "valid_targets_min": 2107 }, { "epoch": 2.5157563025210083, "grad_norm": 0.6119604303971371, "learning_rate": 3.2358312613711804e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.2673264741897583, "step": 2395, "valid_targets_mean": 3195.1, "valid_targets_min": 802 }, { "epoch": 2.5210084033613445, "grad_norm": 0.5309909333341549, "learning_rate": 3.231708201197653e-05, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.27537453174591064, "step": 2400, "valid_targets_mean": 4344.2, "valid_targets_min": 1597 }, { "epoch": 2.5262605042016806, "grad_norm": 0.6196309832297628, "learning_rate": 3.227576690585706e-05, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.27964839339256287, "step": 2405, "valid_targets_mean": 3039.4, "valid_targets_min": 1535 }, { "epoch": 2.5315126050420167, "grad_norm": 0.6105328048520959, "learning_rate": 3.223436757880591e-05, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.2900930643081665, "step": 2410, "valid_targets_mean": 3732.8, "valid_targets_min": 1385 }, { "epoch": 2.536764705882353, "grad_norm": 0.6121657286750687, "learning_rate": 3.219288431485337e-05, "loss": 0.271, "loss_nan_ranks": 0, "loss_rank_avg": 0.296478807926178, "step": 2415, "valid_targets_mean": 3802.3, "valid_targets_min": 1451 }, { "epoch": 2.542016806722689, "grad_norm": 0.6645007327168074, "learning_rate": 3.2151317398605646e-05, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.29341888427734375, "step": 2420, "valid_targets_mean": 2909.6, "valid_targets_min": 1269 }, { "epoch": 2.5472689075630255, "grad_norm": 0.6452736492861937, "learning_rate": 3.2109667115242815e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.2756231725215912, "step": 2425, "valid_targets_mean": 2893.6, "valid_targets_min": 935 }, { "epoch": 2.552521008403361, "grad_norm": 0.6459381577493258, "learning_rate": 3.206793375051694e-05, "loss": 0.2821, "loss_nan_ranks": 0, "loss_rank_avg": 0.2834113836288452, "step": 2430, "valid_targets_mean": 3271.2, "valid_targets_min": 1695 }, { "epoch": 2.5577731092436977, "grad_norm": 0.6599512718640789, "learning_rate": 3.2026117590750086e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.2733537554740906, "step": 2435, "valid_targets_mean": 3117.0, "valid_targets_min": 671 }, { "epoch": 2.5630252100840334, "grad_norm": 0.567668736976835, "learning_rate": 3.198421892283235e-05, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.2664722502231598, "step": 2440, "valid_targets_mean": 3738.3, "valid_targets_min": 1020 }, { "epoch": 2.56827731092437, "grad_norm": 0.6231370164675432, "learning_rate": 3.1942238034219885e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.28766465187072754, "step": 2445, "valid_targets_mean": 3198.6, "valid_targets_min": 1889 }, { "epoch": 2.5735294117647056, "grad_norm": 0.6316291488754031, "learning_rate": 3.190017521293296e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.2555858790874481, "step": 2450, "valid_targets_mean": 3085.4, "valid_targets_min": 1385 }, { "epoch": 2.578781512605042, "grad_norm": 0.6263309654818119, "learning_rate": 3.185803074755395e-05, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.2710253596305847, "step": 2455, "valid_targets_mean": 3538.3, "valid_targets_min": 1548 }, { "epoch": 2.5840336134453783, "grad_norm": 0.6117849557050007, "learning_rate": 3.1815804927225363e-05, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.26848098635673523, "step": 2460, "valid_targets_mean": 3289.2, "valid_targets_min": 699 }, { "epoch": 2.5892857142857144, "grad_norm": 0.6124680799238794, "learning_rate": 3.1773498041647876e-05, "loss": 0.2706, "loss_nan_ranks": 0, "loss_rank_avg": 0.27038100361824036, "step": 2465, "valid_targets_mean": 3072.8, "valid_targets_min": 648 }, { "epoch": 2.5945378151260505, "grad_norm": 0.5501431568044479, "learning_rate": 3.173111038107834e-05, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.2502066195011139, "step": 2470, "valid_targets_mean": 4004.5, "valid_targets_min": 1851 }, { "epoch": 2.5997899159663866, "grad_norm": 0.5757740316879347, "learning_rate": 3.168864223632776e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.26100954413414, "step": 2475, "valid_targets_mean": 3751.6, "valid_targets_min": 1540 }, { "epoch": 2.6050420168067228, "grad_norm": 0.623122866098537, "learning_rate": 3.1646093898759334e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.269726425409317, "step": 2480, "valid_targets_mean": 3402.6, "valid_targets_min": 1410 }, { "epoch": 2.610294117647059, "grad_norm": 0.6140867953660799, "learning_rate": 3.160346566028645e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.28402426838874817, "step": 2485, "valid_targets_mean": 3822.9, "valid_targets_min": 2040 }, { "epoch": 2.615546218487395, "grad_norm": 0.6458360451166494, "learning_rate": 3.156075781337068e-05, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.2804952561855316, "step": 2490, "valid_targets_mean": 2824.4, "valid_targets_min": 1458 }, { "epoch": 2.620798319327731, "grad_norm": 0.614578628604973, "learning_rate": 3.1517970651019735e-05, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.267007976770401, "step": 2495, "valid_targets_mean": 3497.6, "valid_targets_min": 1589 }, { "epoch": 2.6260504201680672, "grad_norm": 0.6550756431874655, "learning_rate": 3.1475104466785536e-05, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.2752663195133209, "step": 2500, "valid_targets_mean": 2745.1, "valid_targets_min": 513 }, { "epoch": 2.6313025210084033, "grad_norm": 0.7285449233093796, "learning_rate": 3.143215955476211e-05, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.30785495042800903, "step": 2505, "valid_targets_mean": 3143.5, "valid_targets_min": 1636 }, { "epoch": 2.6365546218487395, "grad_norm": 0.5763401907930161, "learning_rate": 3.138913620958365e-05, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.26492440700531006, "step": 2510, "valid_targets_mean": 3906.8, "valid_targets_min": 2383 }, { "epoch": 2.6418067226890756, "grad_norm": 0.5946439618794739, "learning_rate": 3.134603472642244e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.25987619161605835, "step": 2515, "valid_targets_mean": 3180.3, "valid_targets_min": 1372 }, { "epoch": 2.6470588235294117, "grad_norm": 0.7017146713713763, "learning_rate": 3.1302855400986866e-05, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.25516122579574585, "step": 2520, "valid_targets_mean": 2634.1, "valid_targets_min": 1401 }, { "epoch": 2.652310924369748, "grad_norm": 0.7063131822296524, "learning_rate": 3.1259598529519336e-05, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.2827465236186981, "step": 2525, "valid_targets_mean": 2937.3, "valid_targets_min": 1504 }, { "epoch": 2.657563025210084, "grad_norm": 0.6322826497339568, "learning_rate": 3.121626440879432e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.24802082777023315, "step": 2530, "valid_targets_mean": 3097.8, "valid_targets_min": 1648 }, { "epoch": 2.66281512605042, "grad_norm": 0.6405774977690727, "learning_rate": 3.117285333611625e-05, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.247537761926651, "step": 2535, "valid_targets_mean": 3982.1, "valid_targets_min": 959 }, { "epoch": 2.668067226890756, "grad_norm": 0.5925204140545449, "learning_rate": 3.112936560931752e-05, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.24100324511528015, "step": 2540, "valid_targets_mean": 3329.1, "valid_targets_min": 1261 }, { "epoch": 2.6733193277310923, "grad_norm": 0.6277943771927688, "learning_rate": 3.108580152675642e-05, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.2357967495918274, "step": 2545, "valid_targets_mean": 3185.8, "valid_targets_min": 1294 }, { "epoch": 2.678571428571429, "grad_norm": 0.6292055198908869, "learning_rate": 3.104216138731511e-05, "loss": 0.2676, "loss_nan_ranks": 0, "loss_rank_avg": 0.2757669687271118, "step": 2550, "valid_targets_mean": 3340.1, "valid_targets_min": 1432 }, { "epoch": 2.6838235294117645, "grad_norm": 0.6031199057951037, "learning_rate": 3.0998445490397546e-05, "loss": 0.2601, "loss_nan_ranks": 0, "loss_rank_avg": 0.26977115869522095, "step": 2555, "valid_targets_mean": 3379.6, "valid_targets_min": 742 }, { "epoch": 2.689075630252101, "grad_norm": 0.6624342295310539, "learning_rate": 3.095465413592743e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.27833864092826843, "step": 2560, "valid_targets_mean": 2969.1, "valid_targets_min": 988 }, { "epoch": 2.6943277310924367, "grad_norm": 0.6361231679633825, "learning_rate": 3.091078762434616e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2749124765396118, "step": 2565, "valid_targets_mean": 3232.6, "valid_targets_min": 654 }, { "epoch": 2.6995798319327733, "grad_norm": 0.616757107135465, "learning_rate": 3.086684625661081e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.2631353735923767, "step": 2570, "valid_targets_mean": 3125.7, "valid_targets_min": 1328 }, { "epoch": 2.7048319327731094, "grad_norm": 0.6893720258364816, "learning_rate": 3.082283033419197e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.2686452567577362, "step": 2575, "valid_targets_mean": 3166.4, "valid_targets_min": 1302 }, { "epoch": 2.7100840336134455, "grad_norm": 0.6092903528556366, "learning_rate": 3.077874015907174e-05, "loss": 0.2529, "loss_nan_ranks": 0, "loss_rank_avg": 0.2558513283729553, "step": 2580, "valid_targets_mean": 4101.6, "valid_targets_min": 1701 }, { "epoch": 2.7153361344537816, "grad_norm": 0.5889526951400187, "learning_rate": 3.073457603374167e-05, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.25581663846969604, "step": 2585, "valid_targets_mean": 3677.3, "valid_targets_min": 1319 }, { "epoch": 2.7205882352941178, "grad_norm": 0.642935413766165, "learning_rate": 3.069033826120066e-05, "loss": 0.2416, "loss_nan_ranks": 0, "loss_rank_avg": 0.255086213350296, "step": 2590, "valid_targets_mean": 3259.8, "valid_targets_min": 1194 }, { "epoch": 2.725840336134454, "grad_norm": 0.6235865519519191, "learning_rate": 3.064602714495286e-05, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.25447195768356323, "step": 2595, "valid_targets_mean": 2886.7, "valid_targets_min": 1220 }, { "epoch": 2.73109243697479, "grad_norm": 0.5840881578880576, "learning_rate": 3.060164298900565e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.25606703758239746, "step": 2600, "valid_targets_mean": 3948.4, "valid_targets_min": 1742 }, { "epoch": 2.736344537815126, "grad_norm": 0.70617682044821, "learning_rate": 3.055718609786749e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.2716052234172821, "step": 2605, "valid_targets_mean": 2877.3, "valid_targets_min": 1234 }, { "epoch": 2.741596638655462, "grad_norm": 0.6377305035799299, "learning_rate": 3.051265677654585e-05, "loss": 0.2687, "loss_nan_ranks": 0, "loss_rank_avg": 0.2713176906108856, "step": 2610, "valid_targets_mean": 3126.6, "valid_targets_min": 1686 }, { "epoch": 2.7468487394957983, "grad_norm": 0.5626998875518994, "learning_rate": 3.0468055330545162e-05, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.23960676789283752, "step": 2615, "valid_targets_mean": 3957.4, "valid_targets_min": 618 }, { "epoch": 2.7521008403361344, "grad_norm": 0.6556128296668272, "learning_rate": 3.0423382065864653e-05, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.25945764780044556, "step": 2620, "valid_targets_mean": 2844.3, "valid_targets_min": 1364 }, { "epoch": 2.7573529411764706, "grad_norm": 0.6666237064634677, "learning_rate": 3.0378637288996304e-05, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.26987403631210327, "step": 2625, "valid_targets_mean": 3537.1, "valid_targets_min": 1514 }, { "epoch": 2.7626050420168067, "grad_norm": 0.6590248047133942, "learning_rate": 3.033382130692269e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.26807478070259094, "step": 2630, "valid_targets_mean": 2863.1, "valid_targets_min": 1073 }, { "epoch": 2.767857142857143, "grad_norm": 0.6761466657105407, "learning_rate": 3.0288934427114955e-05, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.27322080731391907, "step": 2635, "valid_targets_mean": 2907.8, "valid_targets_min": 1026 }, { "epoch": 2.773109243697479, "grad_norm": 0.6353889677418061, "learning_rate": 3.0243976957530602e-05, "loss": 0.2463, "loss_nan_ranks": 0, "loss_rank_avg": 0.23086395859718323, "step": 2640, "valid_targets_mean": 2695.9, "valid_targets_min": 1254 }, { "epoch": 2.778361344537815, "grad_norm": 0.7083565681570431, "learning_rate": 3.0198949206611475e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.27140820026397705, "step": 2645, "valid_targets_mean": 3112.3, "valid_targets_min": 720 }, { "epoch": 2.783613445378151, "grad_norm": 0.6445873412413864, "learning_rate": 3.0153851483281582e-05, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.29137080907821655, "step": 2650, "valid_targets_mean": 3687.8, "valid_targets_min": 1817 }, { "epoch": 2.7888655462184873, "grad_norm": 0.6275537197106373, "learning_rate": 3.010868409694499e-05, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.2466498464345932, "step": 2655, "valid_targets_mean": 3197.7, "valid_targets_min": 1411 }, { "epoch": 2.7941176470588234, "grad_norm": 0.5902973797283267, "learning_rate": 3.0063447357483712e-05, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.2413676530122757, "step": 2660, "valid_targets_mean": 3804.1, "valid_targets_min": 2253 }, { "epoch": 2.79936974789916, "grad_norm": 0.6686261268710058, "learning_rate": 3.0018141575255587e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.2801203727722168, "step": 2665, "valid_targets_mean": 3269.8, "valid_targets_min": 1860 }, { "epoch": 2.8046218487394956, "grad_norm": 0.5958481124800947, "learning_rate": 2.9972767061092107e-05, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.24206840991973877, "step": 2670, "valid_targets_mean": 3550.5, "valid_targets_min": 1805 }, { "epoch": 2.809873949579832, "grad_norm": 0.5964898157229672, "learning_rate": 2.9927324126296352e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.24410061538219452, "step": 2675, "valid_targets_mean": 3646.2, "valid_targets_min": 1145 }, { "epoch": 2.815126050420168, "grad_norm": 0.6446057186222791, "learning_rate": 2.98818130826408e-05, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.2676333785057068, "step": 2680, "valid_targets_mean": 3167.9, "valid_targets_min": 1722 }, { "epoch": 2.8203781512605044, "grad_norm": 0.7582205523508831, "learning_rate": 2.9836234242365204e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.25383812189102173, "step": 2685, "valid_targets_mean": 2996.0, "valid_targets_min": 1423 }, { "epoch": 2.82563025210084, "grad_norm": 0.6301709788550426, "learning_rate": 2.979058791817447e-05, "loss": 0.2661, "loss_nan_ranks": 0, "loss_rank_avg": 0.2749696969985962, "step": 2690, "valid_targets_mean": 3538.0, "valid_targets_min": 1426 }, { "epoch": 2.8308823529411766, "grad_norm": 0.6480505666026394, "learning_rate": 2.974487442323647e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.2599114179611206, "step": 2695, "valid_targets_mean": 3115.1, "valid_targets_min": 538 }, { "epoch": 2.8361344537815127, "grad_norm": 0.6882139342020044, "learning_rate": 2.9699094071179938e-05, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.2708072364330292, "step": 2700, "valid_targets_mean": 2551.9, "valid_targets_min": 537 }, { "epoch": 2.841386554621849, "grad_norm": 0.6582888441321656, "learning_rate": 2.9653247176092286e-05, "loss": 0.2684, "loss_nan_ranks": 0, "loss_rank_avg": 0.2539324164390564, "step": 2705, "valid_targets_mean": 3079.0, "valid_targets_min": 845 }, { "epoch": 2.846638655462185, "grad_norm": 0.638833559343612, "learning_rate": 2.9607334052517466e-05, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.28745412826538086, "step": 2710, "valid_targets_mean": 3822.1, "valid_targets_min": 1625 }, { "epoch": 2.851890756302521, "grad_norm": 0.7422015502102081, "learning_rate": 2.9561355015453803e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.29670873284339905, "step": 2715, "valid_targets_mean": 2883.9, "valid_targets_min": 1400 }, { "epoch": 2.857142857142857, "grad_norm": 0.6490748235477826, "learning_rate": 2.9515310380351847e-05, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.24093633890151978, "step": 2720, "valid_targets_mean": 3222.6, "valid_targets_min": 1868 }, { "epoch": 2.8623949579831933, "grad_norm": 0.7372791077034592, "learning_rate": 2.9469200463112186e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.25444963574409485, "step": 2725, "valid_targets_mean": 2862.1, "valid_targets_min": 648 }, { "epoch": 2.8676470588235294, "grad_norm": 0.7192710572965154, "learning_rate": 2.9423025580083298e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.245719313621521, "step": 2730, "valid_targets_mean": 3024.6, "valid_targets_min": 1404 }, { "epoch": 2.8728991596638656, "grad_norm": 0.6647970803562331, "learning_rate": 2.937678604805938e-05, "loss": 0.268, "loss_nan_ranks": 0, "loss_rank_avg": 0.2540484070777893, "step": 2735, "valid_targets_mean": 3429.3, "valid_targets_min": 814 }, { "epoch": 2.8781512605042017, "grad_norm": 0.612522922361621, "learning_rate": 2.9330482184278168e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.2477385699748993, "step": 2740, "valid_targets_mean": 3270.8, "valid_targets_min": 953 }, { "epoch": 2.883403361344538, "grad_norm": 0.7016630866988153, "learning_rate": 2.9284114306418758e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.2649661898612976, "step": 2745, "valid_targets_mean": 3123.0, "valid_targets_min": 1410 }, { "epoch": 2.888655462184874, "grad_norm": 0.6661752773535051, "learning_rate": 2.923768273259942e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.263710081577301, "step": 2750, "valid_targets_mean": 3085.5, "valid_targets_min": 530 }, { "epoch": 2.89390756302521, "grad_norm": 0.6197849509680783, "learning_rate": 2.919118778137546e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.25989899039268494, "step": 2755, "valid_targets_mean": 3491.7, "valid_targets_min": 1066 }, { "epoch": 2.899159663865546, "grad_norm": 0.594389488012544, "learning_rate": 2.9144629771736954e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.2792191207408905, "step": 2760, "valid_targets_mean": 3904.9, "valid_targets_min": 1613 }, { "epoch": 2.9044117647058822, "grad_norm": 0.5752638283362668, "learning_rate": 2.9098009023106645e-05, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.23264659941196442, "step": 2765, "valid_targets_mean": 3731.6, "valid_targets_min": 952 }, { "epoch": 2.9096638655462184, "grad_norm": 0.6490696888490648, "learning_rate": 2.9051325855337684e-05, "loss": 0.2605, "loss_nan_ranks": 0, "loss_rank_avg": 0.26240965723991394, "step": 2770, "valid_targets_mean": 2823.0, "valid_targets_min": 1025 }, { "epoch": 2.9149159663865545, "grad_norm": 0.6126363252048349, "learning_rate": 2.90045805887115e-05, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.27359646558761597, "step": 2775, "valid_targets_mean": 4032.0, "valid_targets_min": 1397 }, { "epoch": 2.9201680672268906, "grad_norm": 0.6068839428847373, "learning_rate": 2.8957773543935518e-05, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.2474924623966217, "step": 2780, "valid_targets_mean": 3534.0, "valid_targets_min": 1920 }, { "epoch": 2.9254201680672267, "grad_norm": 0.6329791757885024, "learning_rate": 2.8910905042141046e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.25704294443130493, "step": 2785, "valid_targets_mean": 3527.5, "valid_targets_min": 1687 }, { "epoch": 2.9306722689075633, "grad_norm": 0.6948103907388832, "learning_rate": 2.8863975404881022e-05, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.30331847071647644, "step": 2790, "valid_targets_mean": 3213.0, "valid_targets_min": 1564 }, { "epoch": 2.935924369747899, "grad_norm": 0.6352221742702212, "learning_rate": 2.881698495412781e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.2414446771144867, "step": 2795, "valid_targets_mean": 3689.7, "valid_targets_min": 1947 }, { "epoch": 2.9411764705882355, "grad_norm": 0.6629581821365779, "learning_rate": 2.8769934012271004e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.25725820660591125, "step": 2800, "valid_targets_mean": 2978.2, "valid_targets_min": 1447 }, { "epoch": 2.946428571428571, "grad_norm": 0.6673202572073865, "learning_rate": 2.8722822902115228e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.25360405445098877, "step": 2805, "valid_targets_mean": 3016.5, "valid_targets_min": 1243 }, { "epoch": 2.9516806722689077, "grad_norm": 0.7063504788496237, "learning_rate": 2.8675651946877884e-05, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.27201586961746216, "step": 2810, "valid_targets_mean": 3199.0, "valid_targets_min": 1679 }, { "epoch": 2.956932773109244, "grad_norm": 0.6749918994768315, "learning_rate": 2.862842147018696e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.2709447741508484, "step": 2815, "valid_targets_mean": 3001.2, "valid_targets_min": 1695 }, { "epoch": 2.96218487394958, "grad_norm": 0.6389022545015189, "learning_rate": 2.858113179607881e-05, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.24959295988082886, "step": 2820, "valid_targets_mean": 3370.9, "valid_targets_min": 1469 }, { "epoch": 2.967436974789916, "grad_norm": 0.7014173062929902, "learning_rate": 2.8533783248995938e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.24700427055358887, "step": 2825, "valid_targets_mean": 3245.9, "valid_targets_min": 1593 }, { "epoch": 2.972689075630252, "grad_norm": 0.6469956378099957, "learning_rate": 2.848637615378475e-05, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.27041953802108765, "step": 2830, "valid_targets_mean": 3130.5, "valid_targets_min": 1664 }, { "epoch": 2.9779411764705883, "grad_norm": 0.6169242449395833, "learning_rate": 2.8438910835693314e-05, "loss": 0.2443, "loss_nan_ranks": 0, "loss_rank_avg": 0.22996433079242706, "step": 2835, "valid_targets_mean": 3460.2, "valid_targets_min": 1605 }, { "epoch": 2.9831932773109244, "grad_norm": 0.6394181377322952, "learning_rate": 2.8391387620369192e-05, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.2803104519844055, "step": 2840, "valid_targets_mean": 3288.6, "valid_targets_min": 842 }, { "epoch": 2.9884453781512605, "grad_norm": 0.6854150282623844, "learning_rate": 2.834380683385714e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2902924418449402, "step": 2845, "valid_targets_mean": 3601.4, "valid_targets_min": 809 }, { "epoch": 2.9936974789915967, "grad_norm": 0.6051689785920974, "learning_rate": 2.8296168802596892e-05, "loss": 0.2543, "loss_nan_ranks": 0, "loss_rank_avg": 0.2509153187274933, "step": 2850, "valid_targets_mean": 3752.4, "valid_targets_min": 2026 }, { "epoch": 2.9989495798319328, "grad_norm": 0.6083481456927304, "learning_rate": 2.8248473853420933e-05, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.2585148811340332, "step": 2855, "valid_targets_mean": 3430.5, "valid_targets_min": 1214 }, { "epoch": 3.004201680672269, "grad_norm": 0.7319423401810515, "learning_rate": 2.8200722313552247e-05, "loss": 0.2164, "loss_nan_ranks": 0, "loss_rank_avg": 0.2003440260887146, "step": 2860, "valid_targets_mean": 1489.3, "valid_targets_min": 722 }, { "epoch": 3.009453781512605, "grad_norm": 0.717771718263267, "learning_rate": 2.8152914510602073e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.17707990109920502, "step": 2865, "valid_targets_mean": 1515.6, "valid_targets_min": 725 }, { "epoch": 3.014705882352941, "grad_norm": 0.8226879595885981, "learning_rate": 2.810505077256765e-05, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.18063870072364807, "step": 2870, "valid_targets_mean": 1443.1, "valid_targets_min": 874 }, { "epoch": 3.0199579831932772, "grad_norm": 0.8338357187658497, "learning_rate": 2.8057131427829983e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.17110946774482727, "step": 2875, "valid_targets_mean": 1316.8, "valid_targets_min": 615 }, { "epoch": 3.0252100840336134, "grad_norm": 0.7376091557217379, "learning_rate": 2.800915680515157e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.17430976033210754, "step": 2880, "valid_targets_mean": 1540.8, "valid_targets_min": 715 }, { "epoch": 3.0304621848739495, "grad_norm": 0.7831042239119287, "learning_rate": 2.7961127233674167e-05, "loss": 0.1816, "loss_nan_ranks": 0, "loss_rank_avg": 0.2140425145626068, "step": 2885, "valid_targets_mean": 1648.9, "valid_targets_min": 625 }, { "epoch": 3.0357142857142856, "grad_norm": 0.7415542108375209, "learning_rate": 2.7913043042916513e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.1582803726196289, "step": 2890, "valid_targets_mean": 1354.9, "valid_targets_min": 761 }, { "epoch": 3.0409663865546217, "grad_norm": 0.715142653421594, "learning_rate": 2.786490456277208e-05, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.25299903750419617, "step": 2895, "valid_targets_mean": 1589.9, "valid_targets_min": 703 }, { "epoch": 3.046218487394958, "grad_norm": 0.7873361806067022, "learning_rate": 2.7816712123506796e-05, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.1710663139820099, "step": 2900, "valid_targets_mean": 1485.4, "valid_targets_min": 733 }, { "epoch": 3.051470588235294, "grad_norm": 0.7770722242990561, "learning_rate": 2.776846605575681e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.1824086308479309, "step": 2905, "valid_targets_mean": 1712.8, "valid_targets_min": 964 }, { "epoch": 3.05672268907563, "grad_norm": 0.7616729738480414, "learning_rate": 2.772016669052618e-05, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.1748737096786499, "step": 2910, "valid_targets_mean": 1498.4, "valid_targets_min": 815 }, { "epoch": 3.0619747899159666, "grad_norm": 0.7583507582473836, "learning_rate": 2.767181435918464e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.1768401861190796, "step": 2915, "valid_targets_mean": 1677.5, "valid_targets_min": 1027 }, { "epoch": 3.0672268907563027, "grad_norm": 0.7278307085282013, "learning_rate": 2.7623409393465298e-05, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.1581869125366211, "step": 2920, "valid_targets_mean": 1325.3, "valid_targets_min": 570 }, { "epoch": 3.072478991596639, "grad_norm": 0.7617121869975262, "learning_rate": 2.7574952125462386e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.16011205315589905, "step": 2925, "valid_targets_mean": 1324.7, "valid_targets_min": 548 }, { "epoch": 3.077731092436975, "grad_norm": 0.7554042058432768, "learning_rate": 2.7526442887628962e-05, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.15193405747413635, "step": 2930, "valid_targets_mean": 1288.1, "valid_targets_min": 682 }, { "epoch": 3.082983193277311, "grad_norm": 0.737075733110425, "learning_rate": 2.7477882012774633e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.16672229766845703, "step": 2935, "valid_targets_mean": 1563.0, "valid_targets_min": 911 }, { "epoch": 3.088235294117647, "grad_norm": 0.8359898452206559, "learning_rate": 2.742926983406328e-05, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.16956086456775665, "step": 2940, "valid_targets_mean": 1278.3, "valid_targets_min": 597 }, { "epoch": 3.0934873949579833, "grad_norm": 0.7553756145118757, "learning_rate": 2.7380606685010767e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.17766933143138885, "step": 2945, "valid_targets_mean": 1552.1, "valid_targets_min": 772 }, { "epoch": 3.0987394957983194, "grad_norm": 0.7472526084646638, "learning_rate": 2.7331892899482654e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.1692330241203308, "step": 2950, "valid_targets_mean": 1548.2, "valid_targets_min": 940 }, { "epoch": 3.1039915966386555, "grad_norm": 0.6799508713485111, "learning_rate": 2.7283128811691893e-05, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.146545872092247, "step": 2955, "valid_targets_mean": 1334.6, "valid_targets_min": 785 }, { "epoch": 3.1092436974789917, "grad_norm": 0.7171813544493029, "learning_rate": 2.7234314756196564e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.15770323574543, "step": 2960, "valid_targets_mean": 1404.9, "valid_targets_min": 617 }, { "epoch": 3.1144957983193278, "grad_norm": 0.8566587780828107, "learning_rate": 2.718545106789755e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.17677560448646545, "step": 2965, "valid_targets_mean": 1266.8, "valid_targets_min": 648 }, { "epoch": 3.119747899159664, "grad_norm": 0.8193397073508751, "learning_rate": 2.713653808203626e-05, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.15627950429916382, "step": 2970, "valid_targets_mean": 1427.1, "valid_targets_min": 634 }, { "epoch": 3.125, "grad_norm": 0.8274451736674825, "learning_rate": 2.7087576134192305e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.16775844991207123, "step": 2975, "valid_targets_mean": 1421.0, "valid_targets_min": 774 }, { "epoch": 3.130252100840336, "grad_norm": 0.6953309030381479, "learning_rate": 2.7038565560281252e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.16650184988975525, "step": 2980, "valid_targets_mean": 1685.9, "valid_targets_min": 563 }, { "epoch": 3.1355042016806722, "grad_norm": 0.8099890208928163, "learning_rate": 2.6989506696552224e-05, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.16752278804779053, "step": 2985, "valid_targets_mean": 1378.0, "valid_targets_min": 837 }, { "epoch": 3.1407563025210083, "grad_norm": 0.7795749997325356, "learning_rate": 2.6940399879585685e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.16560722887516022, "step": 2990, "valid_targets_mean": 1599.2, "valid_targets_min": 803 }, { "epoch": 3.1460084033613445, "grad_norm": 0.7336389778027822, "learning_rate": 2.6891245446291093e-05, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.14416930079460144, "step": 2995, "valid_targets_mean": 1380.4, "valid_targets_min": 797 }, { "epoch": 3.1512605042016806, "grad_norm": 0.7490034715901619, "learning_rate": 2.6842043733904578e-05, "loss": 0.1593, "loss_nan_ranks": 0, "loss_rank_avg": 0.15650300681591034, "step": 3000, "valid_targets_mean": 1571.5, "valid_targets_min": 646 }, { "epoch": 3.1565126050420167, "grad_norm": 0.8401911427116212, "learning_rate": 2.6792795079986634e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.17290136218070984, "step": 3005, "valid_targets_mean": 1447.8, "valid_targets_min": 591 }, { "epoch": 3.161764705882353, "grad_norm": 0.8101203980462212, "learning_rate": 2.6743499822419833e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.18794336915016174, "step": 3010, "valid_targets_mean": 1512.7, "valid_targets_min": 796 }, { "epoch": 3.167016806722689, "grad_norm": 0.7549079816000475, "learning_rate": 2.669415829940646e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.148887038230896, "step": 3015, "valid_targets_mean": 1333.1, "valid_targets_min": 848 }, { "epoch": 3.172268907563025, "grad_norm": 0.8655198786602623, "learning_rate": 2.6644770849466226e-05, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.14870238304138184, "step": 3020, "valid_targets_mean": 1233.6, "valid_targets_min": 665 }, { "epoch": 3.177521008403361, "grad_norm": 0.6869481556598374, "learning_rate": 2.6595337811433925e-05, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.1471511870622635, "step": 3025, "valid_targets_mean": 1408.1, "valid_targets_min": 652 }, { "epoch": 3.1827731092436973, "grad_norm": 0.8476070443290739, "learning_rate": 2.654585952445714e-05, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.17854884266853333, "step": 3030, "valid_targets_mean": 1573.8, "valid_targets_min": 662 }, { "epoch": 3.1880252100840334, "grad_norm": 0.759943747176002, "learning_rate": 2.6496336327993882e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.17004242539405823, "step": 3035, "valid_targets_mean": 1410.9, "valid_targets_min": 770 }, { "epoch": 3.19327731092437, "grad_norm": 0.7914392244697611, "learning_rate": 2.6446768561810264e-05, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.16128523647785187, "step": 3040, "valid_targets_mean": 1338.0, "valid_targets_min": 842 }, { "epoch": 3.198529411764706, "grad_norm": 0.7573632096372179, "learning_rate": 2.6397156565978198e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.16719350218772888, "step": 3045, "valid_targets_mean": 1522.6, "valid_targets_min": 773 }, { "epoch": 3.203781512605042, "grad_norm": 0.7823159419268372, "learning_rate": 2.6347500680873043e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.170121967792511, "step": 3050, "valid_targets_mean": 1530.2, "valid_targets_min": 807 }, { "epoch": 3.2090336134453783, "grad_norm": 0.7715992991548748, "learning_rate": 2.6297801247171258e-05, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.14779695868492126, "step": 3055, "valid_targets_mean": 1266.6, "valid_targets_min": 782 }, { "epoch": 3.2142857142857144, "grad_norm": 0.7213196908664066, "learning_rate": 2.6248058605848097e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.17193026840686798, "step": 3060, "valid_targets_mean": 1624.2, "valid_targets_min": 634 }, { "epoch": 3.2195378151260505, "grad_norm": 0.7460107195452109, "learning_rate": 2.6198273098175234e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.1723858267068863, "step": 3065, "valid_targets_mean": 1508.1, "valid_targets_min": 573 }, { "epoch": 3.2247899159663866, "grad_norm": 0.7033456921737298, "learning_rate": 2.614844506571844e-05, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.16065514087677002, "step": 3070, "valid_targets_mean": 1645.1, "valid_targets_min": 718 }, { "epoch": 3.2300420168067228, "grad_norm": 0.700948054604266, "learning_rate": 2.609857485033525e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.13682524859905243, "step": 3075, "valid_targets_mean": 1385.9, "valid_targets_min": 685 }, { "epoch": 3.235294117647059, "grad_norm": 0.8365081550151657, "learning_rate": 2.6048662794172595e-05, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1537787914276123, "step": 3080, "valid_targets_mean": 1489.9, "valid_targets_min": 744 }, { "epoch": 3.240546218487395, "grad_norm": 0.9620567262629217, "learning_rate": 2.599870923966447e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.15811693668365479, "step": 3085, "valid_targets_mean": 1253.3, "valid_targets_min": 650 }, { "epoch": 3.245798319327731, "grad_norm": 0.7129512442205985, "learning_rate": 2.5948714529529565e-05, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.16663914918899536, "step": 3090, "valid_targets_mean": 1337.3, "valid_targets_min": 780 }, { "epoch": 3.2510504201680672, "grad_norm": 0.728601631393252, "learning_rate": 2.5898679006768958e-05, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.14995308220386505, "step": 3095, "valid_targets_mean": 1344.5, "valid_targets_min": 677 }, { "epoch": 3.2563025210084033, "grad_norm": 0.7807161695418345, "learning_rate": 2.5848603014663702e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.15245237946510315, "step": 3100, "valid_targets_mean": 1302.3, "valid_targets_min": 727 }, { "epoch": 3.2615546218487395, "grad_norm": 0.7833067221288974, "learning_rate": 2.579848689677252e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.164436474442482, "step": 3105, "valid_targets_mean": 1489.2, "valid_targets_min": 726 }, { "epoch": 3.2668067226890756, "grad_norm": 0.7582720046388419, "learning_rate": 2.5748330996929414e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.17622435092926025, "step": 3110, "valid_targets_mean": 1497.3, "valid_targets_min": 669 }, { "epoch": 3.2720588235294117, "grad_norm": 0.6761627015093946, "learning_rate": 2.5698135659241334e-05, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.14206218719482422, "step": 3115, "valid_targets_mean": 1376.9, "valid_targets_min": 750 }, { "epoch": 3.277310924369748, "grad_norm": 0.7569519780492563, "learning_rate": 2.564790122808579e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.15797209739685059, "step": 3120, "valid_targets_mean": 1475.9, "valid_targets_min": 736 }, { "epoch": 3.282563025210084, "grad_norm": 0.7724507253369616, "learning_rate": 2.5597628048108504e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.1651463806629181, "step": 3125, "valid_targets_mean": 1426.2, "valid_targets_min": 694 }, { "epoch": 3.28781512605042, "grad_norm": 0.7583229755048851, "learning_rate": 2.5547316464221058e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.1635044515132904, "step": 3130, "valid_targets_mean": 1547.6, "valid_targets_min": 753 }, { "epoch": 3.293067226890756, "grad_norm": 0.7492941228082307, "learning_rate": 2.5496966821598493e-05, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.14868690073490143, "step": 3135, "valid_targets_mean": 1277.1, "valid_targets_min": 809 }, { "epoch": 3.2983193277310923, "grad_norm": 0.7918115514025105, "learning_rate": 2.5446579465676977e-05, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.14087459444999695, "step": 3140, "valid_targets_mean": 1292.3, "valid_targets_min": 698 }, { "epoch": 3.3035714285714284, "grad_norm": 0.7674670047525459, "learning_rate": 2.5396154742151407e-05, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.15545767545700073, "step": 3145, "valid_targets_mean": 1448.1, "valid_targets_min": 750 }, { "epoch": 3.3088235294117645, "grad_norm": 0.8361476210011558, "learning_rate": 2.5345692996973075e-05, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.17045646905899048, "step": 3150, "valid_targets_mean": 1472.6, "valid_targets_min": 733 }, { "epoch": 3.314075630252101, "grad_norm": 0.7425956748582699, "learning_rate": 2.5295194576347233e-05, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.15749000012874603, "step": 3155, "valid_targets_mean": 1597.3, "valid_targets_min": 907 }, { "epoch": 3.3193277310924367, "grad_norm": 0.778056511779034, "learning_rate": 2.5244659826730774e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.17436806857585907, "step": 3160, "valid_targets_mean": 1564.9, "valid_targets_min": 898 }, { "epoch": 3.3245798319327733, "grad_norm": 0.7457317148773122, "learning_rate": 2.519408909482984e-05, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.16804683208465576, "step": 3165, "valid_targets_mean": 1660.6, "valid_targets_min": 1119 }, { "epoch": 3.3298319327731094, "grad_norm": 0.8015187816073955, "learning_rate": 2.5143482727597427e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.16357378661632538, "step": 3170, "valid_targets_mean": 1392.3, "valid_targets_min": 700 }, { "epoch": 3.3350840336134455, "grad_norm": 0.7927587699859597, "learning_rate": 2.509284107223102e-05, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.15347766876220703, "step": 3175, "valid_targets_mean": 1407.8, "valid_targets_min": 798 }, { "epoch": 3.3403361344537816, "grad_norm": 0.8291776111318878, "learning_rate": 2.50421644761702e-05, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.14594411849975586, "step": 3180, "valid_targets_mean": 1237.5, "valid_targets_min": 589 }, { "epoch": 3.3455882352941178, "grad_norm": 0.786383044943235, "learning_rate": 2.499145328709429e-05, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1620325744152069, "step": 3185, "valid_targets_mean": 1363.2, "valid_targets_min": 673 }, { "epoch": 3.350840336134454, "grad_norm": 0.8314225202905355, "learning_rate": 2.4940707852919924e-05, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.1637428104877472, "step": 3190, "valid_targets_mean": 1297.5, "valid_targets_min": 641 }, { "epoch": 3.35609243697479, "grad_norm": 0.8247848576495689, "learning_rate": 2.488992852179868e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.1613052636384964, "step": 3195, "valid_targets_mean": 1466.3, "valid_targets_min": 701 }, { "epoch": 3.361344537815126, "grad_norm": 0.7169780960903507, "learning_rate": 2.483911564211472e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.1574411392211914, "step": 3200, "valid_targets_mean": 1801.2, "valid_targets_min": 1202 }, { "epoch": 3.366596638655462, "grad_norm": 0.6906945355495036, "learning_rate": 2.4788269562482355e-05, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.15213462710380554, "step": 3205, "valid_targets_mean": 1441.4, "valid_targets_min": 657 }, { "epoch": 3.3718487394957983, "grad_norm": 0.7855731357671363, "learning_rate": 2.4737390631743675e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.15283282101154327, "step": 3210, "valid_targets_mean": 1442.9, "valid_targets_min": 672 }, { "epoch": 3.3771008403361344, "grad_norm": 0.7999940593483418, "learning_rate": 2.4686479198966146e-05, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.16701379418373108, "step": 3215, "valid_targets_mean": 1305.1, "valid_targets_min": 723 }, { "epoch": 3.3823529411764706, "grad_norm": 0.7802222544911187, "learning_rate": 2.463553561344024e-05, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.1388361155986786, "step": 3220, "valid_targets_mean": 1236.6, "valid_targets_min": 732 }, { "epoch": 3.3876050420168067, "grad_norm": 0.7997658424367834, "learning_rate": 2.4584560224677013e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.14376091957092285, "step": 3225, "valid_targets_mean": 1261.1, "valid_targets_min": 634 }, { "epoch": 3.392857142857143, "grad_norm": 0.7589895889200633, "learning_rate": 2.4533553382405702e-05, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.16269132494926453, "step": 3230, "valid_targets_mean": 1451.1, "valid_targets_min": 905 }, { "epoch": 3.398109243697479, "grad_norm": 0.9088457131074477, "learning_rate": 2.4482515436571365e-05, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.1583980917930603, "step": 3235, "valid_targets_mean": 1466.4, "valid_targets_min": 596 }, { "epoch": 3.403361344537815, "grad_norm": 0.8253891514753098, "learning_rate": 2.4431446737332437e-05, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.16583885252475739, "step": 3240, "valid_targets_mean": 1435.1, "valid_targets_min": 756 }, { "epoch": 3.408613445378151, "grad_norm": 0.7126823695261846, "learning_rate": 2.438034763505833e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.14703774452209473, "step": 3245, "valid_targets_mean": 1411.8, "valid_targets_min": 567 }, { "epoch": 3.4138655462184873, "grad_norm": 0.7389656217215542, "learning_rate": 2.432921848032707e-05, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.14308568835258484, "step": 3250, "valid_targets_mean": 1495.9, "valid_targets_min": 810 }, { "epoch": 3.4191176470588234, "grad_norm": 0.7063481251451478, "learning_rate": 2.427805962392286e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.15941093862056732, "step": 3255, "valid_targets_mean": 1643.2, "valid_targets_min": 868 }, { "epoch": 3.4243697478991595, "grad_norm": 0.7292997254366875, "learning_rate": 2.4226871416833683e-05, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.146925687789917, "step": 3260, "valid_targets_mean": 1451.4, "valid_targets_min": 824 }, { "epoch": 3.4296218487394956, "grad_norm": 0.7542406085374198, "learning_rate": 2.4175654210248848e-05, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.161025732755661, "step": 3265, "valid_targets_mean": 1615.9, "valid_targets_min": 797 }, { "epoch": 3.434873949579832, "grad_norm": 0.6966112598828675, "learning_rate": 2.4124408355556677e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.1535557061433792, "step": 3270, "valid_targets_mean": 1596.5, "valid_targets_min": 1043 }, { "epoch": 3.440126050420168, "grad_norm": 0.7555059854029672, "learning_rate": 2.4073134204342014e-05, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.16238391399383545, "step": 3275, "valid_targets_mean": 1445.5, "valid_targets_min": 920 }, { "epoch": 3.4453781512605044, "grad_norm": 0.8208149984721342, "learning_rate": 2.4021832108383837e-05, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.15757635235786438, "step": 3280, "valid_targets_mean": 1437.9, "valid_targets_min": 847 }, { "epoch": 3.4506302521008405, "grad_norm": 0.7056998799882124, "learning_rate": 2.3970502419652854e-05, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.15004190802574158, "step": 3285, "valid_targets_mean": 1559.1, "valid_targets_min": 557 }, { "epoch": 3.4558823529411766, "grad_norm": 0.7958553721684484, "learning_rate": 2.3919145490309076e-05, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.15160951018333435, "step": 3290, "valid_targets_mean": 1341.6, "valid_targets_min": 594 }, { "epoch": 3.4611344537815127, "grad_norm": 0.703390230979893, "learning_rate": 2.38677616726994e-05, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.1494627594947815, "step": 3295, "valid_targets_mean": 1747.5, "valid_targets_min": 760 }, { "epoch": 3.466386554621849, "grad_norm": 0.6829115937221362, "learning_rate": 2.381635131935521e-05, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.27713343501091003, "step": 3300, "valid_targets_mean": 3387.2, "valid_targets_min": 770 }, { "epoch": 3.471638655462185, "grad_norm": 0.5039365129794023, "learning_rate": 2.3764914782989926e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.21012486517429352, "step": 3305, "valid_targets_mean": 4538.6, "valid_targets_min": 1799 }, { "epoch": 3.476890756302521, "grad_norm": 0.5334008441824496, "learning_rate": 2.3713452416496625e-05, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.2371271550655365, "step": 3310, "valid_targets_mean": 4182.4, "valid_targets_min": 1560 }, { "epoch": 3.482142857142857, "grad_norm": 0.5252301039129134, "learning_rate": 2.366196457294558e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.20833566784858704, "step": 3315, "valid_targets_mean": 4361.0, "valid_targets_min": 1681 }, { "epoch": 3.4873949579831933, "grad_norm": 0.617549050257743, "learning_rate": 2.3610451605581858e-05, "loss": 0.2411, "loss_nan_ranks": 0, "loss_rank_avg": 0.2543012499809265, "step": 3320, "valid_targets_mean": 3627.6, "valid_targets_min": 1374 }, { "epoch": 3.4926470588235294, "grad_norm": 0.6304506600012845, "learning_rate": 2.3558913867822905e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.22949200868606567, "step": 3325, "valid_targets_mean": 3204.2, "valid_targets_min": 1089 }, { "epoch": 3.4978991596638656, "grad_norm": 0.5586583847778026, "learning_rate": 2.3507351713256105e-05, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.23757925629615784, "step": 3330, "valid_targets_mean": 4203.4, "valid_targets_min": 627 }, { "epoch": 3.5031512605042017, "grad_norm": 0.5579364042848073, "learning_rate": 2.3455765495636353e-05, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.23478400707244873, "step": 3335, "valid_targets_mean": 3778.9, "valid_targets_min": 1574 }, { "epoch": 3.508403361344538, "grad_norm": 0.6191817742700788, "learning_rate": 2.3404155568883643e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.25709354877471924, "step": 3340, "valid_targets_mean": 3704.9, "valid_targets_min": 1921 }, { "epoch": 3.513655462184874, "grad_norm": 0.587021701284441, "learning_rate": 2.3352522287080625e-05, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.23616047203540802, "step": 3345, "valid_targets_mean": 3960.9, "valid_targets_min": 1477 }, { "epoch": 3.51890756302521, "grad_norm": 0.6254607818726631, "learning_rate": 2.3300866004470182e-05, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.24480389058589935, "step": 3350, "valid_targets_mean": 3504.5, "valid_targets_min": 1499 }, { "epoch": 3.524159663865546, "grad_norm": 0.5925836663255958, "learning_rate": 2.324918707545302e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.26201432943344116, "step": 3355, "valid_targets_mean": 3803.8, "valid_targets_min": 1013 }, { "epoch": 3.5294117647058822, "grad_norm": 0.5642203624546177, "learning_rate": 2.3197485854585183e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.2236984670162201, "step": 3360, "valid_targets_mean": 4146.8, "valid_targets_min": 1543 }, { "epoch": 3.5346638655462184, "grad_norm": 0.6221598960605759, "learning_rate": 2.3145762696575675e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.24771781265735626, "step": 3365, "valid_targets_mean": 3705.0, "valid_targets_min": 2050 }, { "epoch": 3.5399159663865545, "grad_norm": 0.667308661071586, "learning_rate": 2.3094017956283995e-05, "loss": 0.2444, "loss_nan_ranks": 0, "loss_rank_avg": 0.2562797963619232, "step": 3370, "valid_targets_mean": 3287.6, "valid_targets_min": 746 }, { "epoch": 3.5451680672268906, "grad_norm": 0.6591430962273881, "learning_rate": 2.3042251988717728e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.24168621003627777, "step": 3375, "valid_targets_mean": 3219.6, "valid_targets_min": 1210 }, { "epoch": 3.5504201680672267, "grad_norm": 0.5861565049376661, "learning_rate": 2.2990465149030077e-05, "loss": 0.2408, "loss_nan_ranks": 0, "loss_rank_avg": 0.2576037347316742, "step": 3380, "valid_targets_mean": 3420.2, "valid_targets_min": 1064 }, { "epoch": 3.5556722689075633, "grad_norm": 0.676375370367313, "learning_rate": 2.2938657792517446e-05, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.24123093485832214, "step": 3385, "valid_targets_mean": 2978.2, "valid_targets_min": 1173 }, { "epoch": 3.560924369747899, "grad_norm": 0.7090066415466851, "learning_rate": 2.2886830274617017e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.2423102855682373, "step": 3390, "valid_targets_mean": 3106.8, "valid_targets_min": 1165 }, { "epoch": 3.5661764705882355, "grad_norm": 0.6215177878656555, "learning_rate": 2.2834982950904267e-05, "loss": 0.2309, "loss_nan_ranks": 0, "loss_rank_avg": 0.20194599032402039, "step": 3395, "valid_targets_mean": 3800.3, "valid_targets_min": 1365 }, { "epoch": 3.571428571428571, "grad_norm": 0.6568484423092628, "learning_rate": 2.2783116177090573e-05, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.2180924117565155, "step": 3400, "valid_targets_mean": 3020.4, "valid_targets_min": 1051 }, { "epoch": 3.5766806722689077, "grad_norm": 0.72432526478877, "learning_rate": 2.2731230309020762e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.2589854300022125, "step": 3405, "valid_targets_mean": 2882.1, "valid_targets_min": 1345 }, { "epoch": 3.581932773109244, "grad_norm": 0.647347676568134, "learning_rate": 2.2679325702670642e-05, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.23592257499694824, "step": 3410, "valid_targets_mean": 3123.4, "valid_targets_min": 1747 }, { "epoch": 3.58718487394958, "grad_norm": 0.6321313310777158, "learning_rate": 2.2627402714144586e-05, "loss": 0.2422, "loss_nan_ranks": 0, "loss_rank_avg": 0.23397618532180786, "step": 3415, "valid_targets_mean": 3041.9, "valid_targets_min": 1166 }, { "epoch": 3.592436974789916, "grad_norm": 0.6163425879015834, "learning_rate": 2.2575461699673085e-05, "loss": 0.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.24911564588546753, "step": 3420, "valid_targets_mean": 3629.4, "valid_targets_min": 1511 }, { "epoch": 3.597689075630252, "grad_norm": 0.8662060186406194, "learning_rate": 2.2523503015610303e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.219038188457489, "step": 3425, "valid_targets_mean": 3007.8, "valid_targets_min": 869 }, { "epoch": 3.6029411764705883, "grad_norm": 0.6505678950823406, "learning_rate": 2.2471527018431637e-05, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.2250857800245285, "step": 3430, "valid_targets_mean": 3147.4, "valid_targets_min": 926 }, { "epoch": 3.6081932773109244, "grad_norm": 0.6624584977841851, "learning_rate": 2.2419534064731238e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.22663256525993347, "step": 3435, "valid_targets_mean": 3047.1, "valid_targets_min": 1016 }, { "epoch": 3.6134453781512605, "grad_norm": 0.68180528409829, "learning_rate": 2.236752451121963e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.2614358067512512, "step": 3440, "valid_targets_mean": 3288.3, "valid_targets_min": 1367 }, { "epoch": 3.6186974789915967, "grad_norm": 0.5943225731704131, "learning_rate": 2.2315498714721198e-05, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.2073296308517456, "step": 3445, "valid_targets_mean": 3621.2, "valid_targets_min": 761 }, { "epoch": 3.6239495798319328, "grad_norm": 0.7143384166342921, "learning_rate": 2.2263457032171762e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.22933131456375122, "step": 3450, "valid_targets_mean": 2664.7, "valid_targets_min": 1480 }, { "epoch": 3.629201680672269, "grad_norm": 0.6637253904207627, "learning_rate": 2.2211399820616154e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.21584278345108032, "step": 3455, "valid_targets_mean": 3043.8, "valid_targets_min": 1229 }, { "epoch": 3.634453781512605, "grad_norm": 0.6381313624483769, "learning_rate": 2.2159327437205733e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.23317265510559082, "step": 3460, "valid_targets_mean": 3533.5, "valid_targets_min": 1727 }, { "epoch": 3.639705882352941, "grad_norm": 0.6079366483063177, "learning_rate": 2.210724023919595e-05, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.23725667595863342, "step": 3465, "valid_targets_mean": 3763.2, "valid_targets_min": 1860 }, { "epoch": 3.6449579831932772, "grad_norm": 0.6617853538852045, "learning_rate": 2.205513858394389e-05, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.23891595005989075, "step": 3470, "valid_targets_mean": 3145.0, "valid_targets_min": 1145 }, { "epoch": 3.6502100840336134, "grad_norm": 0.6931454910102819, "learning_rate": 2.2003022828905832e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.24554722011089325, "step": 3475, "valid_targets_mean": 3148.6, "valid_targets_min": 1363 }, { "epoch": 3.6554621848739495, "grad_norm": 0.6830097683535337, "learning_rate": 2.19508933316348e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.2083757519721985, "step": 3480, "valid_targets_mean": 3347.4, "valid_targets_min": 1087 }, { "epoch": 3.6607142857142856, "grad_norm": 0.6284986422875785, "learning_rate": 2.189875044977808e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.22864796221256256, "step": 3485, "valid_targets_mean": 4141.5, "valid_targets_min": 730 }, { "epoch": 3.6659663865546217, "grad_norm": 0.6424551917347495, "learning_rate": 2.1846594541074796e-05, "loss": 0.2283, "loss_nan_ranks": 0, "loss_rank_avg": 0.21687257289886475, "step": 3490, "valid_targets_mean": 3053.2, "valid_targets_min": 1406 }, { "epoch": 3.671218487394958, "grad_norm": 0.6118476480500536, "learning_rate": 2.179442596335345e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.21437662839889526, "step": 3495, "valid_targets_mean": 3413.8, "valid_targets_min": 1833 }, { "epoch": 3.6764705882352944, "grad_norm": 0.6834904631426817, "learning_rate": 2.174224507452945e-05, "loss": 0.2307, "loss_nan_ranks": 0, "loss_rank_avg": 0.23827575147151947, "step": 3500, "valid_targets_mean": 3292.0, "valid_targets_min": 1182 }, { "epoch": 3.68172268907563, "grad_norm": 0.6540573235032019, "learning_rate": 2.1690052232602677e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.2561336159706116, "step": 3505, "valid_targets_mean": 3815.1, "valid_targets_min": 1607 }, { "epoch": 3.6869747899159666, "grad_norm": 0.7038556545538145, "learning_rate": 2.1637847795655022e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.23643259704113007, "step": 3510, "valid_targets_mean": 2850.3, "valid_targets_min": 1358 }, { "epoch": 3.6922268907563023, "grad_norm": 0.6142418362337423, "learning_rate": 2.1585632121847925e-05, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.2268371880054474, "step": 3515, "valid_targets_mean": 3897.3, "valid_targets_min": 1757 }, { "epoch": 3.697478991596639, "grad_norm": 0.6018277229359115, "learning_rate": 2.153340556941991e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.19471925497055054, "step": 3520, "valid_targets_mean": 3365.7, "valid_targets_min": 1170 }, { "epoch": 3.7027310924369745, "grad_norm": 0.7817444103413864, "learning_rate": 2.1481168496684145e-05, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.24332907795906067, "step": 3525, "valid_targets_mean": 2908.3, "valid_targets_min": 474 }, { "epoch": 3.707983193277311, "grad_norm": 0.6733856863461328, "learning_rate": 2.142892126202597e-05, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.22530926764011383, "step": 3530, "valid_targets_mean": 3249.9, "valid_targets_min": 1140 }, { "epoch": 3.713235294117647, "grad_norm": 0.6772781803626257, "learning_rate": 2.137666422390045e-05, "loss": 0.2233, "loss_nan_ranks": 0, "loss_rank_avg": 0.2468833178281784, "step": 3535, "valid_targets_mean": 3621.2, "valid_targets_min": 2266 }, { "epoch": 3.7184873949579833, "grad_norm": 0.596320718539212, "learning_rate": 2.132439774082991e-05, "loss": 0.2084, "loss_nan_ranks": 0, "loss_rank_avg": 0.19030636548995972, "step": 3540, "valid_targets_mean": 3192.4, "valid_targets_min": 809 }, { "epoch": 3.7237394957983194, "grad_norm": 0.6683616408438122, "learning_rate": 2.1272122171401467e-05, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.2368716150522232, "step": 3545, "valid_targets_mean": 3176.4, "valid_targets_min": 1059 }, { "epoch": 3.7289915966386555, "grad_norm": 0.5993575332277289, "learning_rate": 2.1219837874264573e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.19735181331634521, "step": 3550, "valid_targets_mean": 3426.4, "valid_targets_min": 964 }, { "epoch": 3.7342436974789917, "grad_norm": 0.6105324798756142, "learning_rate": 2.116754520812857e-05, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.22294853627681732, "step": 3555, "valid_targets_mean": 3946.7, "valid_targets_min": 1105 }, { "epoch": 3.7394957983193278, "grad_norm": 0.7317392218199291, "learning_rate": 2.111524453176022e-05, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.23324161767959595, "step": 3560, "valid_targets_mean": 2534.7, "valid_targets_min": 1460 }, { "epoch": 3.744747899159664, "grad_norm": 0.679940437130019, "learning_rate": 2.1062936203981227e-05, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.23880356550216675, "step": 3565, "valid_targets_mean": 3673.0, "valid_targets_min": 1091 }, { "epoch": 3.75, "grad_norm": 0.6386888401169865, "learning_rate": 2.10106205836658e-05, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.21099084615707397, "step": 3570, "valid_targets_mean": 3355.7, "valid_targets_min": 1771 }, { "epoch": 3.755252100840336, "grad_norm": 0.609185135460291, "learning_rate": 2.095829802973817e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.20622901618480682, "step": 3575, "valid_targets_mean": 3403.8, "valid_targets_min": 1625 }, { "epoch": 3.7605042016806722, "grad_norm": 0.6933994920811911, "learning_rate": 2.090596890117016e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.20166133344173431, "step": 3580, "valid_targets_mean": 3379.6, "valid_targets_min": 1180 }, { "epoch": 3.7657563025210083, "grad_norm": 0.7001758773355745, "learning_rate": 2.0853633556978674e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.2164371758699417, "step": 3585, "valid_targets_mean": 3085.8, "valid_targets_min": 1460 }, { "epoch": 3.7710084033613445, "grad_norm": 0.6982893325743658, "learning_rate": 2.0801292356223265e-05, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.22557231783866882, "step": 3590, "valid_targets_mean": 3090.9, "valid_targets_min": 1079 }, { "epoch": 3.7762605042016806, "grad_norm": 0.6862429302576437, "learning_rate": 2.0748945658003695e-05, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.21564340591430664, "step": 3595, "valid_targets_mean": 2751.7, "valid_targets_min": 1143 }, { "epoch": 3.7815126050420167, "grad_norm": 0.7486537584683461, "learning_rate": 2.0696593821457392e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.2403099536895752, "step": 3600, "valid_targets_mean": 3262.4, "valid_targets_min": 914 }, { "epoch": 3.786764705882353, "grad_norm": 0.6292490113807976, "learning_rate": 2.064423720575709e-05, "loss": 0.2365, "loss_nan_ranks": 0, "loss_rank_avg": 0.21284765005111694, "step": 3605, "valid_targets_mean": 3452.1, "valid_targets_min": 1312 }, { "epoch": 3.792016806722689, "grad_norm": 0.6731713864780883, "learning_rate": 2.0591876170108257e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.23124480247497559, "step": 3610, "valid_targets_mean": 2805.6, "valid_targets_min": 987 }, { "epoch": 3.7972689075630255, "grad_norm": 0.570026508038886, "learning_rate": 2.0539511073746743e-05, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.21886953711509705, "step": 3615, "valid_targets_mean": 4512.7, "valid_targets_min": 1501 }, { "epoch": 3.802521008403361, "grad_norm": 0.6587414192570736, "learning_rate": 2.0487142275936213e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.21692374348640442, "step": 3620, "valid_targets_mean": 3188.2, "valid_targets_min": 1388 }, { "epoch": 3.8077731092436977, "grad_norm": 0.6975757464948207, "learning_rate": 2.0434770135965743e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.23684664070606232, "step": 3625, "valid_targets_mean": 3106.9, "valid_targets_min": 1986 }, { "epoch": 3.8130252100840334, "grad_norm": 0.6390716602559315, "learning_rate": 2.0382395013147347e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.23830687999725342, "step": 3630, "valid_targets_mean": 3893.1, "valid_targets_min": 1671 }, { "epoch": 3.81827731092437, "grad_norm": 0.6520611936803277, "learning_rate": 2.033001726681349e-05, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.19424161314964294, "step": 3635, "valid_targets_mean": 3246.8, "valid_targets_min": 512 }, { "epoch": 3.8235294117647056, "grad_norm": 0.653877417451473, "learning_rate": 2.027763725631463e-05, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.21053674817085266, "step": 3640, "valid_targets_mean": 3285.3, "valid_targets_min": 1202 }, { "epoch": 3.828781512605042, "grad_norm": 0.6519721595841632, "learning_rate": 2.0225255341016794e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.22552523016929626, "step": 3645, "valid_targets_mean": 4012.8, "valid_targets_min": 1645 }, { "epoch": 3.8340336134453783, "grad_norm": 0.6008225197326998, "learning_rate": 2.017287188029904e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.20129550993442535, "step": 3650, "valid_targets_mean": 3525.8, "valid_targets_min": 1434 }, { "epoch": 3.8392857142857144, "grad_norm": 0.7071580358913306, "learning_rate": 2.0120487233551035e-05, "loss": 0.2369, "loss_nan_ranks": 0, "loss_rank_avg": 0.2568947672843933, "step": 3655, "valid_targets_mean": 3044.6, "valid_targets_min": 1055 }, { "epoch": 3.8445378151260505, "grad_norm": 0.7176723110707379, "learning_rate": 2.006810176017059e-05, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.23161205649375916, "step": 3660, "valid_targets_mean": 3179.8, "valid_targets_min": 1625 }, { "epoch": 3.8497899159663866, "grad_norm": 0.6943499018659017, "learning_rate": 2.0015715819561205e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.24318306148052216, "step": 3665, "valid_targets_mean": 3399.9, "valid_targets_min": 1147 }, { "epoch": 3.8550420168067228, "grad_norm": 0.6973815528618685, "learning_rate": 1.9963329771129558e-05, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.24660438299179077, "step": 3670, "valid_targets_mean": 2866.4, "valid_targets_min": 998 }, { "epoch": 3.860294117647059, "grad_norm": 0.6342688826905563, "learning_rate": 1.9910943974283066e-05, "loss": 0.2331, "loss_nan_ranks": 0, "loss_rank_avg": 0.23309576511383057, "step": 3675, "valid_targets_mean": 3480.4, "valid_targets_min": 1078 }, { "epoch": 3.865546218487395, "grad_norm": 0.735979206541467, "learning_rate": 1.9858558788427447e-05, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.22612996399402618, "step": 3680, "valid_targets_mean": 2920.8, "valid_targets_min": 1005 }, { "epoch": 3.870798319327731, "grad_norm": 0.6974844461519691, "learning_rate": 1.9806174572964205e-05, "loss": 0.2349, "loss_nan_ranks": 0, "loss_rank_avg": 0.22539496421813965, "step": 3685, "valid_targets_mean": 2983.9, "valid_targets_min": 719 }, { "epoch": 3.8760504201680672, "grad_norm": 0.7806658133125973, "learning_rate": 1.975379168728819e-05, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.25455334782600403, "step": 3690, "valid_targets_mean": 2842.1, "valid_targets_min": 617 }, { "epoch": 3.8813025210084033, "grad_norm": 0.653382148721513, "learning_rate": 1.9701410490785128e-05, "loss": 0.2215, "loss_nan_ranks": 0, "loss_rank_avg": 0.22338590025901794, "step": 3695, "valid_targets_mean": 3210.6, "valid_targets_min": 1665 }, { "epoch": 3.8865546218487395, "grad_norm": 0.6977766979229648, "learning_rate": 1.9649031342829178e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.24201029539108276, "step": 3700, "valid_targets_mean": 3020.0, "valid_targets_min": 1076 }, { "epoch": 3.8918067226890756, "grad_norm": 0.6441901232419098, "learning_rate": 1.9596654602780398e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.2265818864107132, "step": 3705, "valid_targets_mean": 3548.8, "valid_targets_min": 790 }, { "epoch": 3.8970588235294117, "grad_norm": 0.715226965706479, "learning_rate": 1.9544280629982364e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.25313618779182434, "step": 3710, "valid_targets_mean": 3038.7, "valid_targets_min": 937 }, { "epoch": 3.902310924369748, "grad_norm": 0.6360683211422588, "learning_rate": 1.949190978375966e-05, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.22172778844833374, "step": 3715, "valid_targets_mean": 3616.2, "valid_targets_min": 981 }, { "epoch": 3.907563025210084, "grad_norm": 0.6393776390642489, "learning_rate": 1.9439542423415413e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.205665722489357, "step": 3720, "valid_targets_mean": 3152.5, "valid_targets_min": 1351 }, { "epoch": 3.91281512605042, "grad_norm": 0.6380081375418487, "learning_rate": 1.9387178908228838e-05, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.23773056268692017, "step": 3725, "valid_targets_mean": 4153.7, "valid_targets_min": 1307 }, { "epoch": 3.918067226890756, "grad_norm": 0.5502610030856153, "learning_rate": 1.933481959745276e-05, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.2143445611000061, "step": 3730, "valid_targets_mean": 5039.1, "valid_targets_min": 1587 }, { "epoch": 3.9233193277310923, "grad_norm": 0.5822473871522699, "learning_rate": 1.9282464850311184e-05, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.20977917313575745, "step": 3735, "valid_targets_mean": 4101.8, "valid_targets_min": 1741 }, { "epoch": 3.928571428571429, "grad_norm": 0.5793820699573822, "learning_rate": 1.9230115025996764e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.20586253702640533, "step": 3740, "valid_targets_mean": 3830.2, "valid_targets_min": 856 }, { "epoch": 3.9338235294117645, "grad_norm": 0.7167408375172564, "learning_rate": 1.9177770483668416e-05, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.22084660828113556, "step": 3745, "valid_targets_mean": 3468.1, "valid_targets_min": 1886 }, { "epoch": 3.939075630252101, "grad_norm": 0.6404425612951213, "learning_rate": 1.912543158244881e-05, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.2383722960948944, "step": 3750, "valid_targets_mean": 3603.1, "valid_targets_min": 832 }, { "epoch": 3.9443277310924367, "grad_norm": 0.6506827435964047, "learning_rate": 1.9073098681421895e-05, "loss": 0.2069, "loss_nan_ranks": 0, "loss_rank_avg": 0.19391639530658722, "step": 3755, "valid_targets_mean": 3134.8, "valid_targets_min": 1484 }, { "epoch": 3.9495798319327733, "grad_norm": 0.6963957310682597, "learning_rate": 1.902077213963048e-05, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.21799013018608093, "step": 3760, "valid_targets_mean": 3377.2, "valid_targets_min": 1152 }, { "epoch": 3.9548319327731094, "grad_norm": 0.7783983083913816, "learning_rate": 1.896845231607372e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.27412140369415283, "step": 3765, "valid_targets_mean": 2750.6, "valid_targets_min": 1128 }, { "epoch": 3.9600840336134455, "grad_norm": 0.6595123518563015, "learning_rate": 1.8916139569704704e-05, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.2191227525472641, "step": 3770, "valid_targets_mean": 3052.4, "valid_targets_min": 1156 }, { "epoch": 3.9653361344537816, "grad_norm": 0.6850818119709559, "learning_rate": 1.886383425942795e-05, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.21025024354457855, "step": 3775, "valid_targets_mean": 3002.1, "valid_targets_min": 993 }, { "epoch": 3.9705882352941178, "grad_norm": 0.7391622979048171, "learning_rate": 1.8811536744096956e-05, "loss": 0.2154, "loss_nan_ranks": 0, "loss_rank_avg": 0.22044730186462402, "step": 3780, "valid_targets_mean": 2914.0, "valid_targets_min": 1275 }, { "epoch": 3.975840336134454, "grad_norm": 0.7238761932845064, "learning_rate": 1.8759247382511748e-05, "loss": 0.2242, "loss_nan_ranks": 0, "loss_rank_avg": 0.2314056158065796, "step": 3785, "valid_targets_mean": 3362.9, "valid_targets_min": 1669 }, { "epoch": 3.98109243697479, "grad_norm": 0.6629448508084417, "learning_rate": 1.8706966533416413e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.2214796096086502, "step": 3790, "valid_targets_mean": 3065.4, "valid_targets_min": 1233 }, { "epoch": 3.986344537815126, "grad_norm": 0.957526256499955, "learning_rate": 1.8654694555496624e-05, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.21655909717082977, "step": 3795, "valid_targets_mean": 3591.1, "valid_targets_min": 1685 }, { "epoch": 3.991596638655462, "grad_norm": 0.6385611154020212, "learning_rate": 1.860243180737721e-05, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.23146796226501465, "step": 3800, "valid_targets_mean": 3571.6, "valid_targets_min": 1793 }, { "epoch": 3.9968487394957983, "grad_norm": 0.6361743923463639, "learning_rate": 1.8550178647619664e-05, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.23826557397842407, "step": 3805, "valid_targets_mean": 3868.6, "valid_targets_min": 1976 }, { "epoch": 4.0021008403361344, "grad_norm": 0.9276215598529717, "learning_rate": 1.84979354347197e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.17189082503318787, "step": 3810, "valid_targets_mean": 1553.1, "valid_targets_min": 777 }, { "epoch": 4.007352941176471, "grad_norm": 0.866049721179808, "learning_rate": 1.8445702527104782e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.1560104489326477, "step": 3815, "valid_targets_mean": 1315.5, "valid_targets_min": 705 }, { "epoch": 4.012605042016807, "grad_norm": 0.7548114470500479, "learning_rate": 1.8393480283131677e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.1479974240064621, "step": 3820, "valid_targets_mean": 1626.6, "valid_targets_min": 906 }, { "epoch": 4.017857142857143, "grad_norm": 0.8337315927989255, "learning_rate": 1.8341269061083996e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.12990880012512207, "step": 3825, "valid_targets_mean": 1316.2, "valid_targets_min": 680 }, { "epoch": 4.023109243697479, "grad_norm": 0.8291733641726188, "learning_rate": 1.8289069219169717e-05, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.15963760018348694, "step": 3830, "valid_targets_mean": 1752.4, "valid_targets_min": 819 }, { "epoch": 4.0283613445378155, "grad_norm": 0.8304874985400824, "learning_rate": 1.8236881115518766e-05, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.14934542775154114, "step": 3835, "valid_targets_mean": 1383.9, "valid_targets_min": 734 }, { "epoch": 4.033613445378151, "grad_norm": 0.8052129046929378, "learning_rate": 1.8184705108180516e-05, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.15371397137641907, "step": 3840, "valid_targets_mean": 1573.9, "valid_targets_min": 930 }, { "epoch": 4.038865546218488, "grad_norm": 0.8085904112301928, "learning_rate": 1.8132541555121353e-05, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.14829567074775696, "step": 3845, "valid_targets_mean": 1383.1, "valid_targets_min": 737 }, { "epoch": 4.044117647058823, "grad_norm": 0.8018131771688088, "learning_rate": 1.808039081422223e-05, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.1333727240562439, "step": 3850, "valid_targets_mean": 1518.7, "valid_targets_min": 759 }, { "epoch": 4.04936974789916, "grad_norm": 0.8491004069838234, "learning_rate": 1.802825324327618e-05, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.15288317203521729, "step": 3855, "valid_targets_mean": 1489.7, "valid_targets_min": 753 }, { "epoch": 4.054621848739496, "grad_norm": 0.8165835733627114, "learning_rate": 1.7976129199985886e-05, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.1399635225534439, "step": 3860, "valid_targets_mean": 1304.5, "valid_targets_min": 572 }, { "epoch": 4.059873949579832, "grad_norm": 0.7748737501704929, "learning_rate": 1.7924019041961228e-05, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.14403750002384186, "step": 3865, "valid_targets_mean": 1409.2, "valid_targets_min": 679 }, { "epoch": 4.065126050420168, "grad_norm": 0.8803098411860152, "learning_rate": 1.7871923126716827e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.15918989479541779, "step": 3870, "valid_targets_mean": 1331.1, "valid_targets_min": 771 }, { "epoch": 4.070378151260504, "grad_norm": 0.753689435569324, "learning_rate": 1.7819841811669573e-05, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.13107150793075562, "step": 3875, "valid_targets_mean": 1473.2, "valid_targets_min": 842 }, { "epoch": 4.07563025210084, "grad_norm": 0.7637352369796083, "learning_rate": 1.7767775454136194e-05, "loss": 0.1367, "loss_nan_ranks": 0, "loss_rank_avg": 0.12565407156944275, "step": 3880, "valid_targets_mean": 1367.2, "valid_targets_min": 822 }, { "epoch": 4.080882352941177, "grad_norm": 0.8931529994254264, "learning_rate": 1.7715724411330806e-05, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.1554366648197174, "step": 3885, "valid_targets_mean": 1507.5, "valid_targets_min": 675 }, { "epoch": 4.086134453781512, "grad_norm": 0.8058581428686146, "learning_rate": 1.7663689040362446e-05, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.14042530953884125, "step": 3890, "valid_targets_mean": 1363.7, "valid_targets_min": 892 }, { "epoch": 4.091386554621849, "grad_norm": 0.8507202166895215, "learning_rate": 1.761166969823262e-05, "loss": 0.1453, "loss_nan_ranks": 0, "loss_rank_avg": 0.13831481337547302, "step": 3895, "valid_targets_mean": 1315.4, "valid_targets_min": 656 }, { "epoch": 4.0966386554621845, "grad_norm": 0.7947736774793486, "learning_rate": 1.7559666741832896e-05, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.12960849702358246, "step": 3900, "valid_targets_mean": 1341.5, "valid_targets_min": 681 }, { "epoch": 4.101890756302521, "grad_norm": 0.8251862770713435, "learning_rate": 1.750768052794239e-05, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.15292903780937195, "step": 3905, "valid_targets_mean": 1436.5, "valid_targets_min": 548 }, { "epoch": 4.107142857142857, "grad_norm": 0.799156965792982, "learning_rate": 1.7455711413225372e-05, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.13684728741645813, "step": 3910, "valid_targets_mean": 1338.8, "valid_targets_min": 658 }, { "epoch": 4.112394957983193, "grad_norm": 0.8117329071283277, "learning_rate": 1.7403759754228794e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.13306397199630737, "step": 3915, "valid_targets_mean": 1343.0, "valid_targets_min": 650 }, { "epoch": 4.117647058823529, "grad_norm": 0.8678892755082293, "learning_rate": 1.7351825907379837e-05, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.1487090289592743, "step": 3920, "valid_targets_mean": 1398.7, "valid_targets_min": 734 }, { "epoch": 4.1228991596638656, "grad_norm": 0.8732015715863755, "learning_rate": 1.7299910228983513e-05, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.14107802510261536, "step": 3925, "valid_targets_mean": 1339.1, "valid_targets_min": 704 }, { "epoch": 4.128151260504202, "grad_norm": 0.8358116761683432, "learning_rate": 1.7248013075220128e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.13086049258708954, "step": 3930, "valid_targets_mean": 1377.6, "valid_targets_min": 686 }, { "epoch": 4.133403361344538, "grad_norm": 0.882675069386114, "learning_rate": 1.7196134802142945e-05, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.1546640843153, "step": 3935, "valid_targets_mean": 1540.8, "valid_targets_min": 697 }, { "epoch": 4.138655462184874, "grad_norm": 0.7673275063053835, "learning_rate": 1.7144275765675673e-05, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.13223353028297424, "step": 3940, "valid_targets_mean": 1435.7, "valid_targets_min": 779 }, { "epoch": 4.14390756302521, "grad_norm": 0.8161750428827426, "learning_rate": 1.7092436321610042e-05, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.147655189037323, "step": 3945, "valid_targets_mean": 1520.5, "valid_targets_min": 729 }, { "epoch": 4.149159663865547, "grad_norm": 0.8361768379372263, "learning_rate": 1.704061682560336e-05, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.13745343685150146, "step": 3950, "valid_targets_mean": 1408.2, "valid_targets_min": 661 }, { "epoch": 4.154411764705882, "grad_norm": 0.8345898800935504, "learning_rate": 1.698881763317609e-05, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.13992251455783844, "step": 3955, "valid_targets_mean": 1531.4, "valid_targets_min": 847 }, { "epoch": 4.159663865546219, "grad_norm": 0.7875946022995587, "learning_rate": 1.69370390997094e-05, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.13176432251930237, "step": 3960, "valid_targets_mean": 1391.6, "valid_targets_min": 758 }, { "epoch": 4.1649159663865545, "grad_norm": 0.7017178626610292, "learning_rate": 1.6885281580442677e-05, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.114842988550663, "step": 3965, "valid_targets_mean": 1312.7, "valid_targets_min": 800 }, { "epoch": 4.170168067226891, "grad_norm": 0.7974602402640565, "learning_rate": 1.6833545430471194e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.1272060126066208, "step": 3970, "valid_targets_mean": 1347.1, "valid_targets_min": 803 }, { "epoch": 4.175420168067227, "grad_norm": 0.8100956763693268, "learning_rate": 1.678183100474359e-05, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.13280612230300903, "step": 3975, "valid_targets_mean": 1394.2, "valid_targets_min": 749 }, { "epoch": 4.180672268907563, "grad_norm": 0.8839233586552578, "learning_rate": 1.6730138658059448e-05, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.13839851319789886, "step": 3980, "valid_targets_mean": 1372.1, "valid_targets_min": 837 }, { "epoch": 4.185924369747899, "grad_norm": 0.7770716555066293, "learning_rate": 1.667846874506689e-05, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.12787684798240662, "step": 3985, "valid_targets_mean": 1425.2, "valid_targets_min": 719 }, { "epoch": 4.1911764705882355, "grad_norm": 0.8263514960899874, "learning_rate": 1.662682162026012e-05, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.14100591838359833, "step": 3990, "valid_targets_mean": 1423.1, "valid_targets_min": 765 }, { "epoch": 4.196428571428571, "grad_norm": 0.8174867184649295, "learning_rate": 1.6575197637976995e-05, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.14689315855503082, "step": 3995, "valid_targets_mean": 1509.8, "valid_targets_min": 875 }, { "epoch": 4.201680672268908, "grad_norm": 0.8589762302363031, "learning_rate": 1.652359715239661e-05, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.13010036945343018, "step": 4000, "valid_targets_mean": 1292.4, "valid_targets_min": 655 }, { "epoch": 4.206932773109243, "grad_norm": 0.8425688419243291, "learning_rate": 1.6472020517536828e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.1463192105293274, "step": 4005, "valid_targets_mean": 1474.6, "valid_targets_min": 669 }, { "epoch": 4.21218487394958, "grad_norm": 0.8171247963907109, "learning_rate": 1.6420468087251907e-05, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.13386958837509155, "step": 4010, "valid_targets_mean": 1377.2, "valid_targets_min": 1046 }, { "epoch": 4.217436974789916, "grad_norm": 0.8221524193856137, "learning_rate": 1.6368940215230026e-05, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.14860522747039795, "step": 4015, "valid_targets_mean": 1693.8, "valid_targets_min": 703 }, { "epoch": 4.222689075630252, "grad_norm": 0.8080758516493216, "learning_rate": 1.6317437254990875e-05, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.13878750801086426, "step": 4020, "valid_targets_mean": 1473.4, "valid_targets_min": 846 }, { "epoch": 4.227941176470588, "grad_norm": 0.8329372613650491, "learning_rate": 1.626595955988325e-05, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.14070574939250946, "step": 4025, "valid_targets_mean": 1439.1, "valid_targets_min": 764 }, { "epoch": 4.233193277310924, "grad_norm": 0.7819540997359885, "learning_rate": 1.6214507483082593e-05, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.13133744895458221, "step": 4030, "valid_targets_mean": 1577.8, "valid_targets_min": 822 }, { "epoch": 4.23844537815126, "grad_norm": 0.7658805060914474, "learning_rate": 1.6163081377588588e-05, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.13184303045272827, "step": 4035, "valid_targets_mean": 1500.7, "valid_targets_min": 982 }, { "epoch": 4.243697478991597, "grad_norm": 0.7854703396401594, "learning_rate": 1.6111681596222732e-05, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.13113921880722046, "step": 4040, "valid_targets_mean": 1402.2, "valid_targets_min": 713 }, { "epoch": 4.248949579831933, "grad_norm": 0.765545221207553, "learning_rate": 1.606030849162593e-05, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.1270998865365982, "step": 4045, "valid_targets_mean": 1522.0, "valid_targets_min": 721 }, { "epoch": 4.254201680672269, "grad_norm": 0.80112535205176, "learning_rate": 1.600896241625605e-05, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.13291269540786743, "step": 4050, "valid_targets_mean": 1373.8, "valid_targets_min": 741 }, { "epoch": 4.2594537815126055, "grad_norm": 0.8177224842495399, "learning_rate": 1.5957643722385532e-05, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.14079031348228455, "step": 4055, "valid_targets_mean": 1517.9, "valid_targets_min": 734 }, { "epoch": 4.264705882352941, "grad_norm": 0.795808535657422, "learning_rate": 1.590635276209896e-05, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.13821426033973694, "step": 4060, "valid_targets_mean": 1521.1, "valid_targets_min": 744 }, { "epoch": 4.269957983193278, "grad_norm": 0.8258679101265551, "learning_rate": 1.5855089887290634e-05, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.14685073494911194, "step": 4065, "valid_targets_mean": 1565.1, "valid_targets_min": 620 }, { "epoch": 4.275210084033613, "grad_norm": 0.8117779327857177, "learning_rate": 1.5803855449662175e-05, "loss": 0.1323, "loss_nan_ranks": 0, "loss_rank_avg": 0.13573217391967773, "step": 4070, "valid_targets_mean": 1411.9, "valid_targets_min": 622 }, { "epoch": 4.28046218487395, "grad_norm": 0.7103133306723244, "learning_rate": 1.5752649800720096e-05, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.14503194391727448, "step": 4075, "valid_targets_mean": 1797.2, "valid_targets_min": 740 }, { "epoch": 4.285714285714286, "grad_norm": 0.7877525685043663, "learning_rate": 1.5701473291773395e-05, "loss": 0.1303, "loss_nan_ranks": 0, "loss_rank_avg": 0.12483812868595123, "step": 4080, "valid_targets_mean": 1316.6, "valid_targets_min": 694 }, { "epoch": 4.290966386554622, "grad_norm": 0.7744871393889592, "learning_rate": 1.5650326273931166e-05, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.13510701060295105, "step": 4085, "valid_targets_mean": 1644.8, "valid_targets_min": 902 }, { "epoch": 4.296218487394958, "grad_norm": 0.7786406479142675, "learning_rate": 1.559920909810016e-05, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.13013191521167755, "step": 4090, "valid_targets_mean": 1388.4, "valid_targets_min": 674 }, { "epoch": 4.301470588235294, "grad_norm": 0.7764860246380487, "learning_rate": 1.5548122114982393e-05, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.12222108244895935, "step": 4095, "valid_targets_mean": 1277.5, "valid_targets_min": 661 }, { "epoch": 4.30672268907563, "grad_norm": 0.8106042463016419, "learning_rate": 1.5497065675072728e-05, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.14016015827655792, "step": 4100, "valid_targets_mean": 1502.6, "valid_targets_min": 912 }, { "epoch": 4.311974789915967, "grad_norm": 0.8543220451468436, "learning_rate": 1.5446040128656485e-05, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.14713945984840393, "step": 4105, "valid_targets_mean": 1561.8, "valid_targets_min": 1181 }, { "epoch": 4.317226890756302, "grad_norm": 0.7953069524968457, "learning_rate": 1.539504582580704e-05, "loss": 0.1292, "loss_nan_ranks": 0, "loss_rank_avg": 0.12721598148345947, "step": 4110, "valid_targets_mean": 1307.5, "valid_targets_min": 773 }, { "epoch": 4.322478991596639, "grad_norm": 0.8097826390836019, "learning_rate": 1.5344083116383395e-05, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.12812337279319763, "step": 4115, "valid_targets_mean": 1381.6, "valid_targets_min": 679 }, { "epoch": 4.3277310924369745, "grad_norm": 0.7958890094736837, "learning_rate": 1.529315235002781e-05, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.14337149262428284, "step": 4120, "valid_targets_mean": 1599.2, "valid_targets_min": 818 }, { "epoch": 4.332983193277311, "grad_norm": 0.783528991087372, "learning_rate": 1.5242253876163399e-05, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.12217546254396439, "step": 4125, "valid_targets_mean": 1385.0, "valid_targets_min": 635 }, { "epoch": 4.338235294117647, "grad_norm": 0.8168471451852063, "learning_rate": 1.5191388043991712e-05, "loss": 0.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.12848719954490662, "step": 4130, "valid_targets_mean": 1420.3, "valid_targets_min": 592 }, { "epoch": 4.343487394957983, "grad_norm": 0.8687088982404517, "learning_rate": 1.5140555202490359e-05, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.1381555199623108, "step": 4135, "valid_targets_mean": 1435.8, "valid_targets_min": 662 }, { "epoch": 4.348739495798319, "grad_norm": 0.824701387692817, "learning_rate": 1.5089755700410602e-05, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.13314849138259888, "step": 4140, "valid_targets_mean": 1477.9, "valid_targets_min": 622 }, { "epoch": 4.3539915966386555, "grad_norm": 1.1187004100398168, "learning_rate": 1.5038989886274992e-05, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.1633179783821106, "step": 4145, "valid_targets_mean": 1382.3, "valid_targets_min": 625 }, { "epoch": 4.359243697478991, "grad_norm": 0.843059495998902, "learning_rate": 1.498825810837492e-05, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.12570440769195557, "step": 4150, "valid_targets_mean": 1461.6, "valid_targets_min": 888 }, { "epoch": 4.364495798319328, "grad_norm": 0.816554096771243, "learning_rate": 1.4937560714768283e-05, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.1403723806142807, "step": 4155, "valid_targets_mean": 1461.2, "valid_targets_min": 635 }, { "epoch": 4.369747899159664, "grad_norm": 0.8797104989098917, "learning_rate": 1.4886898053277086e-05, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.15383698046207428, "step": 4160, "valid_targets_mean": 1542.3, "valid_targets_min": 522 }, { "epoch": 4.375, "grad_norm": 0.7898626242305901, "learning_rate": 1.4836270471485029e-05, "loss": 0.1326, "loss_nan_ranks": 0, "loss_rank_avg": 0.12376511842012405, "step": 4165, "valid_targets_mean": 1244.7, "valid_targets_min": 697 }, { "epoch": 4.380252100840336, "grad_norm": 0.8780197054651814, "learning_rate": 1.4785678316735144e-05, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.14664515852928162, "step": 4170, "valid_targets_mean": 1673.9, "valid_targets_min": 730 }, { "epoch": 4.385504201680672, "grad_norm": 0.9346525477732902, "learning_rate": 1.4735121936127406e-05, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.15194876492023468, "step": 4175, "valid_targets_mean": 1695.9, "valid_targets_min": 719 }, { "epoch": 4.390756302521009, "grad_norm": 0.9211785858456039, "learning_rate": 1.4684601676516366e-05, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.138489231467247, "step": 4180, "valid_targets_mean": 1400.1, "valid_targets_min": 745 }, { "epoch": 4.3960084033613445, "grad_norm": 0.8373085168906266, "learning_rate": 1.4634117884508738e-05, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.12678782641887665, "step": 4185, "valid_targets_mean": 1299.4, "valid_targets_min": 680 }, { "epoch": 4.401260504201681, "grad_norm": 0.8325212171741512, "learning_rate": 1.458367090646105e-05, "loss": 0.1278, "loss_nan_ranks": 0, "loss_rank_avg": 0.1405733823776245, "step": 4190, "valid_targets_mean": 1521.1, "valid_targets_min": 778 }, { "epoch": 4.406512605042017, "grad_norm": 0.9073092150371975, "learning_rate": 1.4533261088477257e-05, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.16051650047302246, "step": 4195, "valid_targets_mean": 1617.8, "valid_targets_min": 851 }, { "epoch": 4.411764705882353, "grad_norm": 0.7397162950148408, "learning_rate": 1.448288877640637e-05, "loss": 0.1297, "loss_nan_ranks": 0, "loss_rank_avg": 0.11534975469112396, "step": 4200, "valid_targets_mean": 1434.4, "valid_targets_min": 692 }, { "epoch": 4.417016806722689, "grad_norm": 0.7733942072643732, "learning_rate": 1.4432554315840082e-05, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.12870749831199646, "step": 4205, "valid_targets_mean": 1500.7, "valid_targets_min": 741 }, { "epoch": 4.4222689075630255, "grad_norm": 0.8287058084711577, "learning_rate": 1.438225805211039e-05, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.12352833896875381, "step": 4210, "valid_targets_mean": 1306.1, "valid_targets_min": 639 }, { "epoch": 4.427521008403361, "grad_norm": 0.8460146278274804, "learning_rate": 1.4332000330287248e-05, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.11612292379140854, "step": 4215, "valid_targets_mean": 1381.9, "valid_targets_min": 772 }, { "epoch": 4.432773109243698, "grad_norm": 0.8428338799366506, "learning_rate": 1.428178149517617e-05, "loss": 0.1303, "loss_nan_ranks": 0, "loss_rank_avg": 0.1271061897277832, "step": 4220, "valid_targets_mean": 1532.2, "valid_targets_min": 765 }, { "epoch": 4.438025210084033, "grad_norm": 0.7764971458397468, "learning_rate": 1.4231601891315876e-05, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.1206718236207962, "step": 4225, "valid_targets_mean": 1425.2, "valid_targets_min": 695 }, { "epoch": 4.44327731092437, "grad_norm": 0.8017610552892988, "learning_rate": 1.418146186297594e-05, "loss": 0.1257, "loss_nan_ranks": 0, "loss_rank_avg": 0.12809637188911438, "step": 4230, "valid_targets_mean": 1575.6, "valid_targets_min": 807 }, { "epoch": 4.448529411764706, "grad_norm": 0.8204445283311675, "learning_rate": 1.413136175415441e-05, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.1299220323562622, "step": 4235, "valid_targets_mean": 1367.1, "valid_targets_min": 873 }, { "epoch": 4.453781512605042, "grad_norm": 0.8229673951166021, "learning_rate": 1.4081301908575457e-05, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.13332301378250122, "step": 4240, "valid_targets_mean": 1369.4, "valid_targets_min": 591 }, { "epoch": 4.459033613445378, "grad_norm": 0.8025930909766332, "learning_rate": 1.4031282669687035e-05, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.11734200268983841, "step": 4245, "valid_targets_mean": 1319.9, "valid_targets_min": 646 }, { "epoch": 4.464285714285714, "grad_norm": 0.9239894606873152, "learning_rate": 1.3981304380658474e-05, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.21401086449623108, "step": 4250, "valid_targets_mean": 4488.5, "valid_targets_min": 1323 }, { "epoch": 4.46953781512605, "grad_norm": 0.6598274422549769, "learning_rate": 1.3931367384378183e-05, "loss": 0.2242, "loss_nan_ranks": 0, "loss_rank_avg": 0.2256534993648529, "step": 4255, "valid_targets_mean": 4344.8, "valid_targets_min": 1631 }, { "epoch": 4.474789915966387, "grad_norm": 0.5777142536216642, "learning_rate": 1.3881472023451262e-05, "loss": 0.2173, "loss_nan_ranks": 0, "loss_rank_avg": 0.21953260898590088, "step": 4260, "valid_targets_mean": 4358.4, "valid_targets_min": 1509 }, { "epoch": 4.480042016806722, "grad_norm": 0.5644265671396247, "learning_rate": 1.3831618640197153e-05, "loss": 0.211, "loss_nan_ranks": 0, "loss_rank_avg": 0.19617916643619537, "step": 4265, "valid_targets_mean": 4067.4, "valid_targets_min": 2689 }, { "epoch": 4.485294117647059, "grad_norm": 0.6800329773093203, "learning_rate": 1.3781807576647315e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.19588659703731537, "step": 4270, "valid_targets_mean": 3231.8, "valid_targets_min": 1184 }, { "epoch": 4.4905462184873945, "grad_norm": 0.583998108779037, "learning_rate": 1.373203917454285e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.18826688826084137, "step": 4275, "valid_targets_mean": 4015.0, "valid_targets_min": 1413 }, { "epoch": 4.495798319327731, "grad_norm": 0.5993018924234834, "learning_rate": 1.3682313775332186e-05, "loss": 0.1913, "loss_nan_ranks": 0, "loss_rank_avg": 0.20078253746032715, "step": 4280, "valid_targets_mean": 4218.1, "valid_targets_min": 2160 }, { "epoch": 4.501050420168067, "grad_norm": 0.6213345974417059, "learning_rate": 1.3632631720168705e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.21006864309310913, "step": 4285, "valid_targets_mean": 3998.2, "valid_targets_min": 1654 }, { "epoch": 4.506302521008403, "grad_norm": 0.6454438419555589, "learning_rate": 1.358299334990842e-05, "loss": 0.2107, "loss_nan_ranks": 0, "loss_rank_avg": 0.21891412138938904, "step": 4290, "valid_targets_mean": 3480.9, "valid_targets_min": 1462 }, { "epoch": 4.51155462184874, "grad_norm": 0.5793855112485845, "learning_rate": 1.3533399005107635e-05, "loss": 0.214, "loss_nan_ranks": 0, "loss_rank_avg": 0.19543211162090302, "step": 4295, "valid_targets_mean": 4008.8, "valid_targets_min": 874 }, { "epoch": 4.516806722689076, "grad_norm": 0.5886149747788205, "learning_rate": 1.3483849026020603e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.19601313769817352, "step": 4300, "valid_targets_mean": 3658.9, "valid_targets_min": 953 }, { "epoch": 4.522058823529412, "grad_norm": 0.6162622988474424, "learning_rate": 1.3434343752597199e-05, "loss": 0.2143, "loss_nan_ranks": 0, "loss_rank_avg": 0.2158222198486328, "step": 4305, "valid_targets_mean": 4291.2, "valid_targets_min": 1265 }, { "epoch": 4.527310924369748, "grad_norm": 0.5225855536952907, "learning_rate": 1.3384883524480576e-05, "loss": 0.2084, "loss_nan_ranks": 0, "loss_rank_avg": 0.1962510198354721, "step": 4310, "valid_targets_mean": 4939.0, "valid_targets_min": 1596 }, { "epoch": 4.532563025210084, "grad_norm": 0.639285317945504, "learning_rate": 1.333546868100486e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.20231905579566956, "step": 4315, "valid_targets_mean": 3340.8, "valid_targets_min": 1759 }, { "epoch": 4.53781512605042, "grad_norm": 0.6692843580892279, "learning_rate": 1.3286099561192784e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.21312329173088074, "step": 4320, "valid_targets_mean": 3084.3, "valid_targets_min": 1353 }, { "epoch": 4.543067226890757, "grad_norm": 0.6120205294157653, "learning_rate": 1.3236776503753397e-05, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.19397076964378357, "step": 4325, "valid_targets_mean": 3763.4, "valid_targets_min": 1643 }, { "epoch": 4.548319327731092, "grad_norm": 0.668479121847745, "learning_rate": 1.3187499847079713e-05, "loss": 0.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.2041492760181427, "step": 4330, "valid_targets_mean": 3227.9, "valid_targets_min": 1269 }, { "epoch": 4.553571428571429, "grad_norm": 0.6752786859520122, "learning_rate": 1.3138269929246427e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.22046181559562683, "step": 4335, "valid_targets_mean": 3324.2, "valid_targets_min": 1681 }, { "epoch": 4.5588235294117645, "grad_norm": 0.6548319871768743, "learning_rate": 1.308908708800753e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.2117079198360443, "step": 4340, "valid_targets_mean": 3792.3, "valid_targets_min": 1477 }, { "epoch": 4.564075630252101, "grad_norm": 0.6879232525076725, "learning_rate": 1.3039951660794063e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.20829437673091888, "step": 4345, "valid_targets_mean": 3502.8, "valid_targets_min": 662 }, { "epoch": 4.569327731092437, "grad_norm": 0.6897322297757514, "learning_rate": 1.2990863984711773e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.21518868207931519, "step": 4350, "valid_targets_mean": 3320.8, "valid_targets_min": 2077 }, { "epoch": 4.574579831932773, "grad_norm": 0.688837675359442, "learning_rate": 1.294182439653878e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.18814504146575928, "step": 4355, "valid_targets_mean": 2756.4, "valid_targets_min": 1505 }, { "epoch": 4.579831932773109, "grad_norm": 0.7330677533755521, "learning_rate": 1.2892833232723297e-05, "loss": 0.2183, "loss_nan_ranks": 0, "loss_rank_avg": 0.24092328548431396, "step": 4360, "valid_targets_mean": 3447.9, "valid_targets_min": 1978 }, { "epoch": 4.5850840336134455, "grad_norm": 0.7241849761685287, "learning_rate": 1.2843890829381303e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.26030996441841125, "step": 4365, "valid_targets_mean": 4194.2, "valid_targets_min": 1490 }, { "epoch": 4.590336134453781, "grad_norm": 0.7026396424067808, "learning_rate": 1.2794997522294263e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.21944516897201538, "step": 4370, "valid_targets_mean": 2970.4, "valid_targets_min": 1422 }, { "epoch": 4.595588235294118, "grad_norm": 0.6259185795346857, "learning_rate": 1.2746153646906766e-05, "loss": 0.1976, "loss_nan_ranks": 0, "loss_rank_avg": 0.1922265887260437, "step": 4375, "valid_targets_mean": 3396.0, "valid_targets_min": 1603 }, { "epoch": 4.600840336134453, "grad_norm": 0.7438486179833006, "learning_rate": 1.2697359538324303e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.21673396229743958, "step": 4380, "valid_targets_mean": 2728.2, "valid_targets_min": 863 }, { "epoch": 4.60609243697479, "grad_norm": 0.6370907634088678, "learning_rate": 1.2648615531310907e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.19770187139511108, "step": 4385, "valid_targets_mean": 3677.7, "valid_targets_min": 1208 }, { "epoch": 4.6113445378151265, "grad_norm": 0.68482682086709, "learning_rate": 1.259992196028688e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.2116718888282776, "step": 4390, "valid_targets_mean": 3316.8, "valid_targets_min": 1501 }, { "epoch": 4.616596638655462, "grad_norm": 0.7052208338762722, "learning_rate": 1.2551279159326495e-05, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.2252679467201233, "step": 4395, "valid_targets_mean": 3425.5, "valid_targets_min": 1828 }, { "epoch": 4.621848739495798, "grad_norm": 0.6124764309205445, "learning_rate": 1.2502687462155709e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.1903487741947174, "step": 4400, "valid_targets_mean": 3237.6, "valid_targets_min": 1110 }, { "epoch": 4.6271008403361344, "grad_norm": 0.8771050749310795, "learning_rate": 1.2454147202149865e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.21824470162391663, "step": 4405, "valid_targets_mean": 2931.8, "valid_targets_min": 1283 }, { "epoch": 4.632352941176471, "grad_norm": 0.681928418139891, "learning_rate": 1.2405658712331409e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.20178645849227905, "step": 4410, "valid_targets_mean": 3311.4, "valid_targets_min": 1714 }, { "epoch": 4.637605042016807, "grad_norm": 0.7118807798201505, "learning_rate": 1.2357222325367604e-05, "loss": 0.2084, "loss_nan_ranks": 0, "loss_rank_avg": 0.21912041306495667, "step": 4415, "valid_targets_mean": 3572.0, "valid_targets_min": 1216 }, { "epoch": 4.642857142857143, "grad_norm": 0.6823054558978693, "learning_rate": 1.2308838373568249e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.20421810448169708, "step": 4420, "valid_targets_mean": 3451.4, "valid_targets_min": 924 }, { "epoch": 4.648109243697479, "grad_norm": 0.6938843637670672, "learning_rate": 1.2260507188883395e-05, "loss": 0.2049, "loss_nan_ranks": 0, "loss_rank_avg": 0.19850008189678192, "step": 4425, "valid_targets_mean": 3175.6, "valid_targets_min": 1292 }, { "epoch": 4.6533613445378155, "grad_norm": 0.7077142011650852, "learning_rate": 1.2212229102901077e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.2047484815120697, "step": 4430, "valid_targets_mean": 3533.4, "valid_targets_min": 1265 }, { "epoch": 4.658613445378151, "grad_norm": 0.7159319249656814, "learning_rate": 1.2164004446845037e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.20691466331481934, "step": 4435, "valid_targets_mean": 3325.9, "valid_targets_min": 1394 }, { "epoch": 4.663865546218488, "grad_norm": 0.7559645592765224, "learning_rate": 1.2115833551572438e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.2295243889093399, "step": 4440, "valid_targets_mean": 3590.2, "valid_targets_min": 1844 }, { "epoch": 4.669117647058823, "grad_norm": 0.7415198687787329, "learning_rate": 1.2067716747571616e-05, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.23479296267032623, "step": 4445, "valid_targets_mean": 3564.9, "valid_targets_min": 1482 }, { "epoch": 4.67436974789916, "grad_norm": 0.688853324893974, "learning_rate": 1.201965436495978e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.21714499592781067, "step": 4450, "valid_targets_mean": 3340.8, "valid_targets_min": 1654 }, { "epoch": 4.679621848739496, "grad_norm": 0.7016909162355258, "learning_rate": 1.1971646733480784e-05, "loss": 0.2067, "loss_nan_ranks": 0, "loss_rank_avg": 0.20046481490135193, "step": 4455, "valid_targets_mean": 2951.6, "valid_targets_min": 584 }, { "epoch": 4.684873949579832, "grad_norm": 0.6941971218245336, "learning_rate": 1.1923694182502848e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.2116384208202362, "step": 4460, "valid_targets_mean": 3478.9, "valid_targets_min": 1049 }, { "epoch": 4.690126050420168, "grad_norm": 0.6893303247496907, "learning_rate": 1.1875797041016286e-05, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.2102683186531067, "step": 4465, "valid_targets_mean": 3287.8, "valid_targets_min": 1350 }, { "epoch": 4.695378151260504, "grad_norm": 0.7350721707173831, "learning_rate": 1.1827955637631283e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.21726731956005096, "step": 4470, "valid_targets_mean": 3590.0, "valid_targets_min": 1624 }, { "epoch": 4.70063025210084, "grad_norm": 0.6938494286562441, "learning_rate": 1.1780170300575602e-05, "loss": 0.1884, "loss_nan_ranks": 0, "loss_rank_avg": 0.18289947509765625, "step": 4475, "valid_targets_mean": 2807.6, "valid_targets_min": 916 }, { "epoch": 4.705882352941177, "grad_norm": 0.6412962232296662, "learning_rate": 1.1732441357692353e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.18760257959365845, "step": 4480, "valid_targets_mean": 3658.0, "valid_targets_min": 2032 }, { "epoch": 4.711134453781512, "grad_norm": 0.7583818317813796, "learning_rate": 1.1684769136437742e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.21241483092308044, "step": 4485, "valid_targets_mean": 3141.9, "valid_targets_min": 1259 }, { "epoch": 4.716386554621849, "grad_norm": 0.6326913726737966, "learning_rate": 1.1637153963878815e-05, "loss": 0.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.19029675424098969, "step": 4490, "valid_targets_mean": 3575.4, "valid_targets_min": 1183 }, { "epoch": 4.7216386554621845, "grad_norm": 0.6290790387214149, "learning_rate": 1.1589596166691231e-05, "loss": 0.192, "loss_nan_ranks": 0, "loss_rank_avg": 0.21391956508159637, "step": 4495, "valid_targets_mean": 4193.9, "valid_targets_min": 1101 }, { "epoch": 4.726890756302521, "grad_norm": 0.6475834579736413, "learning_rate": 1.1542096071157012e-05, "loss": 0.2114, "loss_nan_ranks": 0, "loss_rank_avg": 0.20298393070697784, "step": 4500, "valid_targets_mean": 3821.9, "valid_targets_min": 1726 }, { "epoch": 4.732142857142857, "grad_norm": 0.6979196464072809, "learning_rate": 1.1494654003162285e-05, "loss": 0.1993, "loss_nan_ranks": 0, "loss_rank_avg": 0.20892876386642456, "step": 4505, "valid_targets_mean": 3171.0, "valid_targets_min": 1669 }, { "epoch": 4.737394957983193, "grad_norm": 0.6535989262032701, "learning_rate": 1.1447270288195089e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.20477300882339478, "step": 4510, "valid_targets_mean": 3491.4, "valid_targets_min": 1185 }, { "epoch": 4.742647058823529, "grad_norm": 0.7434999336674271, "learning_rate": 1.1399945251343114e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.23692408204078674, "step": 4515, "valid_targets_mean": 3283.9, "valid_targets_min": 1091 }, { "epoch": 4.7478991596638656, "grad_norm": 0.7222774058425186, "learning_rate": 1.1352679217291457e-05, "loss": 0.2049, "loss_nan_ranks": 0, "loss_rank_avg": 0.2167915254831314, "step": 4520, "valid_targets_mean": 3654.3, "valid_targets_min": 1352 }, { "epoch": 4.753151260504202, "grad_norm": 0.5928834886740821, "learning_rate": 1.1305472510320419e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.1938672959804535, "step": 4525, "valid_targets_mean": 4265.6, "valid_targets_min": 1535 }, { "epoch": 4.758403361344538, "grad_norm": 0.7282043659742619, "learning_rate": 1.1258325454303286e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.1851435899734497, "step": 4530, "valid_targets_mean": 2997.0, "valid_targets_min": 854 }, { "epoch": 4.7636554621848735, "grad_norm": 0.7451730107148029, "learning_rate": 1.1211238372704073e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.18663758039474487, "step": 4535, "valid_targets_mean": 2795.1, "valid_targets_min": 1179 }, { "epoch": 4.76890756302521, "grad_norm": 0.7184545671700696, "learning_rate": 1.1164211588575339e-05, "loss": 0.1969, "loss_nan_ranks": 0, "loss_rank_avg": 0.19145233929157257, "step": 4540, "valid_targets_mean": 3652.7, "valid_targets_min": 1444 }, { "epoch": 4.774159663865547, "grad_norm": 0.7397780134283227, "learning_rate": 1.1117245424555967e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.1895849108695984, "step": 4545, "valid_targets_mean": 2500.1, "valid_targets_min": 642 }, { "epoch": 4.779411764705882, "grad_norm": 0.6713856995898463, "learning_rate": 1.1070340202868915e-05, "loss": 0.1896, "loss_nan_ranks": 0, "loss_rank_avg": 0.1881069391965866, "step": 4550, "valid_targets_mean": 3590.1, "valid_targets_min": 1637 }, { "epoch": 4.784663865546219, "grad_norm": 0.8087445793498248, "learning_rate": 1.1023496245319056e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.24480175971984863, "step": 4555, "valid_targets_mean": 3466.0, "valid_targets_min": 1175 }, { "epoch": 4.7899159663865545, "grad_norm": 0.7068565649556457, "learning_rate": 1.0976713873290925e-05, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.20139086246490479, "step": 4560, "valid_targets_mean": 3205.6, "valid_targets_min": 1612 }, { "epoch": 4.795168067226891, "grad_norm": 0.6620926828840262, "learning_rate": 1.0929993407746543e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.19388242065906525, "step": 4565, "valid_targets_mean": 3423.2, "valid_targets_min": 1743 }, { "epoch": 4.800420168067227, "grad_norm": 0.6727413718092184, "learning_rate": 1.0883335169223212e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.1882367581129074, "step": 4570, "valid_targets_mean": 3168.8, "valid_targets_min": 1398 }, { "epoch": 4.805672268907563, "grad_norm": 0.6558248286205179, "learning_rate": 1.0836739477831297e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.20704635977745056, "step": 4575, "valid_targets_mean": 3489.9, "valid_targets_min": 1558 }, { "epoch": 4.810924369747899, "grad_norm": 0.6847057248913088, "learning_rate": 1.0790206653252055e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.20168985426425934, "step": 4580, "valid_targets_mean": 3278.1, "valid_targets_min": 1445 }, { "epoch": 4.8161764705882355, "grad_norm": 0.6533366829855569, "learning_rate": 1.0743737014735434e-05, "loss": 0.1938, "loss_nan_ranks": 0, "loss_rank_avg": 0.18918371200561523, "step": 4585, "valid_targets_mean": 3682.9, "valid_targets_min": 2000 }, { "epoch": 4.821428571428571, "grad_norm": 0.7708553362949551, "learning_rate": 1.0697330881097857e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.19962045550346375, "step": 4590, "valid_targets_mean": 3065.2, "valid_targets_min": 1243 }, { "epoch": 4.826680672268908, "grad_norm": 0.7089419295191447, "learning_rate": 1.0650988570720077e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.20890700817108154, "step": 4595, "valid_targets_mean": 3286.4, "valid_targets_min": 1223 }, { "epoch": 4.831932773109243, "grad_norm": 0.7147247615274656, "learning_rate": 1.0604710401544963e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.19596712291240692, "step": 4600, "valid_targets_mean": 3027.9, "valid_targets_min": 869 }, { "epoch": 4.83718487394958, "grad_norm": 0.7304597580233416, "learning_rate": 1.0558496691075318e-05, "loss": 0.2022, "loss_nan_ranks": 0, "loss_rank_avg": 0.20904818177223206, "step": 4605, "valid_targets_mean": 3077.8, "valid_targets_min": 1603 }, { "epoch": 4.842436974789916, "grad_norm": 0.7224217938478468, "learning_rate": 1.0512347756371726e-05, "loss": 0.206, "loss_nan_ranks": 0, "loss_rank_avg": 0.18744680285453796, "step": 4610, "valid_targets_mean": 2883.4, "valid_targets_min": 721 }, { "epoch": 4.847689075630252, "grad_norm": 0.7107738441028865, "learning_rate": 1.0466263914050362e-05, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.2116435468196869, "step": 4615, "valid_targets_mean": 3873.2, "valid_targets_min": 1994 }, { "epoch": 4.852941176470588, "grad_norm": 0.7236551319922022, "learning_rate": 1.0420245480280804e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.18254084885120392, "step": 4620, "valid_targets_mean": 3090.9, "valid_targets_min": 1066 }, { "epoch": 4.858193277310924, "grad_norm": 0.6924268052728789, "learning_rate": 1.0374292770783891e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.21132606267929077, "step": 4625, "valid_targets_mean": 3609.6, "valid_targets_min": 1648 }, { "epoch": 4.86344537815126, "grad_norm": 0.710132639844148, "learning_rate": 1.0328406100829542e-05, "loss": 0.2081, "loss_nan_ranks": 0, "loss_rank_avg": 0.19806388020515442, "step": 4630, "valid_targets_mean": 3135.9, "valid_targets_min": 1889 }, { "epoch": 4.868697478991597, "grad_norm": 8.223593196499644, "learning_rate": 1.0282585785234578e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.21035614609718323, "step": 4635, "valid_targets_mean": 2491.6, "valid_targets_min": 885 }, { "epoch": 4.873949579831933, "grad_norm": 0.6950690926035392, "learning_rate": 1.023683213836061e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.20301932096481323, "step": 4640, "valid_targets_mean": 3529.4, "valid_targets_min": 1257 }, { "epoch": 4.879201680672269, "grad_norm": 0.7338702013416679, "learning_rate": 1.0191145474111823e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.20622602105140686, "step": 4645, "valid_targets_mean": 3178.1, "valid_targets_min": 1372 }, { "epoch": 4.884453781512605, "grad_norm": 0.6717591588502287, "learning_rate": 1.0145526105932872e-05, "loss": 0.2012, "loss_nan_ranks": 0, "loss_rank_avg": 0.2017562985420227, "step": 4650, "valid_targets_mean": 3422.6, "valid_targets_min": 1598 }, { "epoch": 4.889705882352941, "grad_norm": 0.76533252784604, "learning_rate": 1.0099974346806714e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.1944223940372467, "step": 4655, "valid_targets_mean": 2925.1, "valid_targets_min": 1074 }, { "epoch": 4.894957983193278, "grad_norm": 0.6637317114328515, "learning_rate": 1.0054490509252423e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.19309523701667786, "step": 4660, "valid_targets_mean": 3366.2, "valid_targets_min": 980 }, { "epoch": 4.900210084033613, "grad_norm": 0.6982820833530574, "learning_rate": 1.0009074905323118e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.21207424998283386, "step": 4665, "valid_targets_mean": 3100.1, "valid_targets_min": 793 }, { "epoch": 4.90546218487395, "grad_norm": 0.6432617078880017, "learning_rate": 9.963727846603784e-06, "loss": 0.1976, "loss_nan_ranks": 0, "loss_rank_avg": 0.21252809464931488, "step": 4670, "valid_targets_mean": 3674.5, "valid_targets_min": 852 }, { "epoch": 4.910714285714286, "grad_norm": 0.7841146093401851, "learning_rate": 9.918449644209087e-06, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.18188413977622986, "step": 4675, "valid_targets_mean": 2951.1, "valid_targets_min": 1107 }, { "epoch": 4.915966386554622, "grad_norm": 0.7711023446249636, "learning_rate": 9.873240608781341e-06, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.20018140971660614, "step": 4680, "valid_targets_mean": 2839.9, "valid_targets_min": 1298 }, { "epoch": 4.921218487394958, "grad_norm": 0.6720914422866899, "learning_rate": 9.828101050488308e-06, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.19184359908103943, "step": 4685, "valid_targets_mean": 3508.3, "valid_targets_min": 1428 }, { "epoch": 4.926470588235294, "grad_norm": 0.6979997171728765, "learning_rate": 9.783031279021063e-06, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.1979558765888214, "step": 4690, "valid_targets_mean": 3186.6, "valid_targets_min": 1193 }, { "epoch": 4.93172268907563, "grad_norm": 0.6375536515405493, "learning_rate": 9.738031603591926e-06, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.18585914373397827, "step": 4695, "valid_targets_mean": 3687.8, "valid_targets_min": 1210 }, { "epoch": 4.936974789915967, "grad_norm": 0.6740300095798715, "learning_rate": 9.69310233293227e-06, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.1872563362121582, "step": 4700, "valid_targets_mean": 3261.6, "valid_targets_min": 974 }, { "epoch": 4.942226890756302, "grad_norm": 0.6728949238979616, "learning_rate": 9.648243775290476e-06, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.1736118197441101, "step": 4705, "valid_targets_mean": 2934.8, "valid_targets_min": 1575 }, { "epoch": 4.947478991596639, "grad_norm": 0.7317387069659124, "learning_rate": 9.60345623842974e-06, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.19196751713752747, "step": 4710, "valid_targets_mean": 3090.5, "valid_targets_min": 1697 }, { "epoch": 4.9527310924369745, "grad_norm": 0.7423800247961655, "learning_rate": 9.558740029626046e-06, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.19240882992744446, "step": 4715, "valid_targets_mean": 3297.7, "valid_targets_min": 897 }, { "epoch": 4.957983193277311, "grad_norm": 0.79806625760805, "learning_rate": 9.51409545566597e-06, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.22060896456241608, "step": 4720, "valid_targets_mean": 3071.2, "valid_targets_min": 887 }, { "epoch": 4.963235294117647, "grad_norm": 0.7615537115059738, "learning_rate": 9.469522822844663e-06, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.20150801539421082, "step": 4725, "valid_targets_mean": 2714.7, "valid_targets_min": 1279 }, { "epoch": 4.968487394957983, "grad_norm": 0.7230728317576487, "learning_rate": 9.425022436963664e-06, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.17812782526016235, "step": 4730, "valid_targets_mean": 3112.9, "valid_targets_min": 1021 }, { "epoch": 4.973739495798319, "grad_norm": 0.8017286637803975, "learning_rate": 9.380594603328875e-06, "loss": 0.2056, "loss_nan_ranks": 0, "loss_rank_avg": 0.21535563468933105, "step": 4735, "valid_targets_mean": 3526.3, "valid_targets_min": 654 }, { "epoch": 4.9789915966386555, "grad_norm": 0.7962974276395127, "learning_rate": 9.336239626748432e-06, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.24022144079208374, "step": 4740, "valid_targets_mean": 2941.2, "valid_targets_min": 1039 }, { "epoch": 4.984243697478991, "grad_norm": 0.6987990811270663, "learning_rate": 9.291957811530602e-06, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.20734629034996033, "step": 4745, "valid_targets_mean": 3804.6, "valid_targets_min": 1737 }, { "epoch": 4.989495798319328, "grad_norm": 0.6320507915977177, "learning_rate": 9.247749461481712e-06, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.17486436665058136, "step": 4750, "valid_targets_mean": 3503.6, "valid_targets_min": 1276 }, { "epoch": 4.994747899159664, "grad_norm": 0.6565835428886582, "learning_rate": 9.203614879904083e-06, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.21443158388137817, "step": 4755, "valid_targets_mean": 4137.7, "valid_targets_min": 1572 }, { "epoch": 5.0, "grad_norm": 0.7198533786254716, "learning_rate": 9.159554369593901e-06, "loss": 0.2046, "loss_nan_ranks": 0, "loss_rank_avg": 0.2270594984292984, "step": 4760, "valid_targets_mean": 3715.1, "valid_targets_min": 791 }, { "epoch": 5.005252100840337, "grad_norm": 0.7571959238315181, "learning_rate": 9.115568232839193e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.13461460173130035, "step": 4765, "valid_targets_mean": 1423.4, "valid_targets_min": 715 }, { "epoch": 5.010504201680672, "grad_norm": 0.8301602733718247, "learning_rate": 9.071656771417721e-06, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.12977659702301025, "step": 4770, "valid_targets_mean": 1407.8, "valid_targets_min": 612 }, { "epoch": 5.015756302521009, "grad_norm": 0.8166485961728386, "learning_rate": 9.027820286594902e-06, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.13986307382583618, "step": 4775, "valid_targets_mean": 1413.5, "valid_targets_min": 714 }, { "epoch": 5.0210084033613445, "grad_norm": 0.8634652135372101, "learning_rate": 8.984059079121785e-06, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.12289293855428696, "step": 4780, "valid_targets_mean": 1450.1, "valid_targets_min": 754 }, { "epoch": 5.026260504201681, "grad_norm": 1.0868991923247484, "learning_rate": 8.940373449232935e-06, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.1558552235364914, "step": 4785, "valid_targets_mean": 1481.1, "valid_targets_min": 718 }, { "epoch": 5.031512605042017, "grad_norm": 0.8280248464569533, "learning_rate": 8.896763696644405e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.13719496130943298, "step": 4790, "valid_targets_mean": 1530.8, "valid_targets_min": 731 }, { "epoch": 5.036764705882353, "grad_norm": 0.8223621736586295, "learning_rate": 8.853230120551693e-06, "loss": 0.1238, "loss_nan_ranks": 0, "loss_rank_avg": 0.12621982395648956, "step": 4795, "valid_targets_mean": 1416.6, "valid_targets_min": 725 }, { "epoch": 5.042016806722689, "grad_norm": 0.870763805985631, "learning_rate": 8.809773019627635e-06, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.13102170825004578, "step": 4800, "valid_targets_mean": 1371.5, "valid_targets_min": 610 }, { "epoch": 5.0472689075630255, "grad_norm": 0.8397454624147834, "learning_rate": 8.766392692020413e-06, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.12862995266914368, "step": 4805, "valid_targets_mean": 1484.7, "valid_targets_min": 720 }, { "epoch": 5.052521008403361, "grad_norm": 0.7882246072954778, "learning_rate": 8.723089435351497e-06, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.11443109065294266, "step": 4810, "valid_targets_mean": 1365.5, "valid_targets_min": 765 }, { "epoch": 5.057773109243698, "grad_norm": 0.8742920757552072, "learning_rate": 8.679863546713559e-06, "loss": 0.1256, "loss_nan_ranks": 0, "loss_rank_avg": 0.127573624253273, "step": 4815, "valid_targets_mean": 1234.7, "valid_targets_min": 593 }, { "epoch": 5.063025210084033, "grad_norm": 0.7920380834226816, "learning_rate": 8.636715322668498e-06, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.11717408895492554, "step": 4820, "valid_targets_mean": 1540.4, "valid_targets_min": 704 }, { "epoch": 5.06827731092437, "grad_norm": 0.780341581121388, "learning_rate": 8.593645059245365e-06, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.11017392575740814, "step": 4825, "valid_targets_mean": 1329.9, "valid_targets_min": 722 }, { "epoch": 5.073529411764706, "grad_norm": 0.7603227971883492, "learning_rate": 8.550653051938333e-06, "loss": 0.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.11557639390230179, "step": 4830, "valid_targets_mean": 1549.6, "valid_targets_min": 865 }, { "epoch": 5.078781512605042, "grad_norm": 0.9030555834076215, "learning_rate": 8.507739595704695e-06, "loss": 0.1192, "loss_nan_ranks": 0, "loss_rank_avg": 0.13490742444992065, "step": 4835, "valid_targets_mean": 1507.4, "valid_targets_min": 797 }, { "epoch": 5.084033613445378, "grad_norm": 0.954349785672474, "learning_rate": 8.464904984962832e-06, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.14801670610904694, "step": 4840, "valid_targets_mean": 1542.4, "valid_targets_min": 728 }, { "epoch": 5.089285714285714, "grad_norm": 0.9125020805445457, "learning_rate": 8.422149513590151e-06, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.13509975373744965, "step": 4845, "valid_targets_mean": 1595.2, "valid_targets_min": 683 }, { "epoch": 5.09453781512605, "grad_norm": 0.871199900697412, "learning_rate": 8.37947347492115e-06, "loss": 0.1303, "loss_nan_ranks": 0, "loss_rank_avg": 0.13447391986846924, "step": 4850, "valid_targets_mean": 1401.6, "valid_targets_min": 706 }, { "epoch": 5.099789915966387, "grad_norm": 0.8629277026545269, "learning_rate": 8.33687716174532e-06, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.11550725251436234, "step": 4855, "valid_targets_mean": 1298.4, "valid_targets_min": 625 }, { "epoch": 5.105042016806722, "grad_norm": 0.8030715253201013, "learning_rate": 8.294360866305192e-06, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.1309053897857666, "step": 4860, "valid_targets_mean": 1659.7, "valid_targets_min": 790 }, { "epoch": 5.110294117647059, "grad_norm": 0.9265947353354664, "learning_rate": 8.251924880294317e-06, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.13342975080013275, "step": 4865, "valid_targets_mean": 1600.4, "valid_targets_min": 684 }, { "epoch": 5.1155462184873945, "grad_norm": 0.8041955738679034, "learning_rate": 8.20956949485527e-06, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.1035323292016983, "step": 4870, "valid_targets_mean": 1338.3, "valid_targets_min": 739 }, { "epoch": 5.120798319327731, "grad_norm": 0.8494495064085696, "learning_rate": 8.167295000577622e-06, "loss": 0.1197, "loss_nan_ranks": 0, "loss_rank_avg": 0.11942795664072037, "step": 4875, "valid_targets_mean": 1456.2, "valid_targets_min": 657 }, { "epoch": 5.126050420168067, "grad_norm": 1.0365198065360532, "learning_rate": 8.125101687496e-06, "loss": 0.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.11641368269920349, "step": 4880, "valid_targets_mean": 1340.2, "valid_targets_min": 783 }, { "epoch": 5.131302521008403, "grad_norm": 0.8635148283698016, "learning_rate": 8.082989845088038e-06, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.11869832128286362, "step": 4885, "valid_targets_mean": 1394.4, "valid_targets_min": 734 }, { "epoch": 5.13655462184874, "grad_norm": 0.877173265352079, "learning_rate": 8.040959762272441e-06, "loss": 0.1232, "loss_nan_ranks": 0, "loss_rank_avg": 0.12606994807720184, "step": 4890, "valid_targets_mean": 1501.8, "valid_targets_min": 678 }, { "epoch": 5.141806722689076, "grad_norm": 0.9671178369518909, "learning_rate": 7.999011727406995e-06, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.12263111025094986, "step": 4895, "valid_targets_mean": 1651.7, "valid_targets_min": 843 }, { "epoch": 5.147058823529412, "grad_norm": 0.8799343051970719, "learning_rate": 7.957146028286524e-06, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.13233694434165955, "step": 4900, "valid_targets_mean": 1632.1, "valid_targets_min": 782 }, { "epoch": 5.152310924369748, "grad_norm": 0.8281302903839795, "learning_rate": 7.915362952141017e-06, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.13629840314388275, "step": 4905, "valid_targets_mean": 1615.3, "valid_targets_min": 957 }, { "epoch": 5.157563025210084, "grad_norm": 0.9542718681795296, "learning_rate": 7.873662785633594e-06, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.14337027072906494, "step": 4910, "valid_targets_mean": 1482.9, "valid_targets_min": 713 }, { "epoch": 5.16281512605042, "grad_norm": 1.3637598590452737, "learning_rate": 7.832045814858538e-06, "loss": 0.1235, "loss_nan_ranks": 0, "loss_rank_avg": 0.12161692976951599, "step": 4915, "valid_targets_mean": 1552.8, "valid_targets_min": 726 }, { "epoch": 5.168067226890757, "grad_norm": 0.821599075602171, "learning_rate": 7.790512325339367e-06, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.12724722921848297, "step": 4920, "valid_targets_mean": 1590.4, "valid_targets_min": 1147 }, { "epoch": 5.173319327731092, "grad_norm": 0.8859043037264651, "learning_rate": 7.74906260202685e-06, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.1232469454407692, "step": 4925, "valid_targets_mean": 1417.6, "valid_targets_min": 700 }, { "epoch": 5.178571428571429, "grad_norm": 0.8207302664180218, "learning_rate": 7.707696929297053e-06, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.10313037782907486, "step": 4930, "valid_targets_mean": 1255.4, "valid_targets_min": 640 }, { "epoch": 5.1838235294117645, "grad_norm": 0.8196199367733106, "learning_rate": 7.666415590949382e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.12141343951225281, "step": 4935, "valid_targets_mean": 1566.6, "valid_targets_min": 817 }, { "epoch": 5.189075630252101, "grad_norm": 0.8397722105470354, "learning_rate": 7.625218870204676e-06, "loss": 0.1157, "loss_nan_ranks": 0, "loss_rank_avg": 0.11369533091783524, "step": 4940, "valid_targets_mean": 1440.9, "valid_targets_min": 724 }, { "epoch": 5.194327731092437, "grad_norm": 0.84723032993192, "learning_rate": 7.584107049703195e-06, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.1220942959189415, "step": 4945, "valid_targets_mean": 1399.1, "valid_targets_min": 657 }, { "epoch": 5.199579831932773, "grad_norm": 1.1583713663548252, "learning_rate": 7.5430804115027615e-06, "loss": 0.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.1239510029554367, "step": 4950, "valid_targets_mean": 1334.3, "valid_targets_min": 746 }, { "epoch": 5.204831932773109, "grad_norm": 0.940619146388919, "learning_rate": 7.502139237076744e-06, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.13509805500507355, "step": 4955, "valid_targets_mean": 1452.8, "valid_targets_min": 692 }, { "epoch": 5.2100840336134455, "grad_norm": 0.9031648217368532, "learning_rate": 7.461283807312194e-06, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.10953864455223083, "step": 4960, "valid_targets_mean": 1338.4, "valid_targets_min": 682 }, { "epoch": 5.215336134453781, "grad_norm": 0.7885774798170768, "learning_rate": 7.420514402507886e-06, "loss": 0.1134, "loss_nan_ranks": 0, "loss_rank_avg": 0.11579865217208862, "step": 4965, "valid_targets_mean": 1360.2, "valid_targets_min": 703 }, { "epoch": 5.220588235294118, "grad_norm": 0.8567753502507811, "learning_rate": 7.379831302372389e-06, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.12191884219646454, "step": 4970, "valid_targets_mean": 1520.9, "valid_targets_min": 864 }, { "epoch": 5.225840336134453, "grad_norm": 0.9494851235486876, "learning_rate": 7.3392347860221556e-06, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.16232752799987793, "step": 4975, "valid_targets_mean": 1814.6, "valid_targets_min": 734 }, { "epoch": 5.23109243697479, "grad_norm": 0.8077534069393267, "learning_rate": 7.298725131979629e-06, "loss": 0.1143, "loss_nan_ranks": 0, "loss_rank_avg": 0.11486963927745819, "step": 4980, "valid_targets_mean": 1478.3, "valid_targets_min": 607 }, { "epoch": 5.236344537815126, "grad_norm": 0.8359577317112136, "learning_rate": 7.258302618171287e-06, "loss": 0.1153, "loss_nan_ranks": 0, "loss_rank_avg": 0.11313410103321075, "step": 4985, "valid_targets_mean": 1497.9, "valid_targets_min": 551 }, { "epoch": 5.241596638655462, "grad_norm": 0.9503036196925028, "learning_rate": 7.217967521925775e-06, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.12508943676948547, "step": 4990, "valid_targets_mean": 1550.5, "valid_targets_min": 676 }, { "epoch": 5.246848739495798, "grad_norm": 0.8718205924513632, "learning_rate": 7.177720119971998e-06, "loss": 0.1179, "loss_nan_ranks": 0, "loss_rank_avg": 0.11915310472249985, "step": 4995, "valid_targets_mean": 1372.5, "valid_targets_min": 904 }, { "epoch": 5.2521008403361344, "grad_norm": 0.9288193265136786, "learning_rate": 7.137560688437184e-06, "loss": 0.1122, "loss_nan_ranks": 0, "loss_rank_avg": 0.12416621297597885, "step": 5000, "valid_targets_mean": 1479.0, "valid_targets_min": 859 }, { "epoch": 5.257352941176471, "grad_norm": 0.8635518493795323, "learning_rate": 7.097489502845047e-06, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.09854140877723694, "step": 5005, "valid_targets_mean": 1234.8, "valid_targets_min": 737 }, { "epoch": 5.262605042016807, "grad_norm": 0.9381227734247657, "learning_rate": 7.0575068381138525e-06, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.12833383679389954, "step": 5010, "valid_targets_mean": 1363.2, "valid_targets_min": 791 }, { "epoch": 5.267857142857143, "grad_norm": 0.8806803188401461, "learning_rate": 7.0176129685545414e-06, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.12506265938282013, "step": 5015, "valid_targets_mean": 1532.1, "valid_targets_min": 786 }, { "epoch": 5.273109243697479, "grad_norm": 0.8640788078067893, "learning_rate": 6.977808167868867e-06, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.1157342940568924, "step": 5020, "valid_targets_mean": 1471.0, "valid_targets_min": 944 }, { "epoch": 5.2783613445378155, "grad_norm": 0.8116063638815398, "learning_rate": 6.9380927091475085e-06, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.10994266718626022, "step": 5025, "valid_targets_mean": 1494.1, "valid_targets_min": 1075 }, { "epoch": 5.283613445378151, "grad_norm": 0.8409841937184768, "learning_rate": 6.898466864868165e-06, "loss": 0.1185, "loss_nan_ranks": 0, "loss_rank_avg": 0.1092015877366066, "step": 5030, "valid_targets_mean": 1340.9, "valid_targets_min": 740 }, { "epoch": 5.288865546218488, "grad_norm": 0.8012571565338946, "learning_rate": 6.858930906893751e-06, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.12151382863521576, "step": 5035, "valid_targets_mean": 1530.9, "valid_targets_min": 727 }, { "epoch": 5.294117647058823, "grad_norm": 1.0099731756987655, "learning_rate": 6.819485106470454e-06, "loss": 0.1119, "loss_nan_ranks": 0, "loss_rank_avg": 0.115475133061409, "step": 5040, "valid_targets_mean": 1233.0, "valid_targets_min": 636 }, { "epoch": 5.29936974789916, "grad_norm": 0.8353570829541407, "learning_rate": 6.780129734225949e-06, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.1095833033323288, "step": 5045, "valid_targets_mean": 1246.8, "valid_targets_min": 684 }, { "epoch": 5.304621848739496, "grad_norm": 0.8983751034814326, "learning_rate": 6.740865060167483e-06, "loss": 0.1079, "loss_nan_ranks": 0, "loss_rank_avg": 0.1118505597114563, "step": 5050, "valid_targets_mean": 1392.5, "valid_targets_min": 798 }, { "epoch": 5.309873949579832, "grad_norm": 0.8427967821093256, "learning_rate": 6.701691353680049e-06, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.1080687940120697, "step": 5055, "valid_targets_mean": 1319.9, "valid_targets_min": 661 }, { "epoch": 5.315126050420168, "grad_norm": 0.8079776828047187, "learning_rate": 6.662608883524542e-06, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.11414103209972382, "step": 5060, "valid_targets_mean": 1554.4, "valid_targets_min": 665 }, { "epoch": 5.320378151260504, "grad_norm": 0.9308438137878955, "learning_rate": 6.6236179178359115e-06, "loss": 0.1152, "loss_nan_ranks": 0, "loss_rank_avg": 0.12251292169094086, "step": 5065, "valid_targets_mean": 1417.8, "valid_targets_min": 692 }, { "epoch": 5.32563025210084, "grad_norm": 1.0492334793929392, "learning_rate": 6.5847187241213e-06, "loss": 0.1171, "loss_nan_ranks": 0, "loss_rank_avg": 0.11902189999818802, "step": 5070, "valid_targets_mean": 1223.8, "valid_targets_min": 632 }, { "epoch": 5.330882352941177, "grad_norm": 0.8741745375157363, "learning_rate": 6.5459115692582386e-06, "loss": 0.1184, "loss_nan_ranks": 0, "loss_rank_avg": 0.1177992969751358, "step": 5075, "valid_targets_mean": 1550.6, "valid_targets_min": 922 }, { "epoch": 5.336134453781512, "grad_norm": 0.8231983027778437, "learning_rate": 6.507196719492819e-06, "loss": 0.115, "loss_nan_ranks": 0, "loss_rank_avg": 0.11274613440036774, "step": 5080, "valid_targets_mean": 1542.2, "valid_targets_min": 710 }, { "epoch": 5.341386554621849, "grad_norm": 0.838222313849615, "learning_rate": 6.468574440437801e-06, "loss": 0.1162, "loss_nan_ranks": 0, "loss_rank_avg": 0.11383190006017685, "step": 5085, "valid_targets_mean": 1390.6, "valid_targets_min": 750 }, { "epoch": 5.3466386554621845, "grad_norm": 0.8704926336132325, "learning_rate": 6.43004499707089e-06, "loss": 0.1154, "loss_nan_ranks": 0, "loss_rank_avg": 0.12034046649932861, "step": 5090, "valid_targets_mean": 1515.5, "valid_targets_min": 766 }, { "epoch": 5.351890756302521, "grad_norm": 0.7942910330002284, "learning_rate": 6.3916086537328545e-06, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.09943848103284836, "step": 5095, "valid_targets_mean": 1333.3, "valid_targets_min": 748 }, { "epoch": 5.357142857142857, "grad_norm": 0.8272207055546795, "learning_rate": 6.3532656741257145e-06, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.11656372249126434, "step": 5100, "valid_targets_mean": 1395.2, "valid_targets_min": 682 }, { "epoch": 5.362394957983193, "grad_norm": 0.8835103895559686, "learning_rate": 6.315016321310965e-06, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.11481855809688568, "step": 5105, "valid_targets_mean": 1515.6, "valid_targets_min": 738 }, { "epoch": 5.367647058823529, "grad_norm": 0.8627265594469545, "learning_rate": 6.276860857707727e-06, "loss": 0.1153, "loss_nan_ranks": 0, "loss_rank_avg": 0.11496169120073318, "step": 5110, "valid_targets_mean": 1312.8, "valid_targets_min": 731 }, { "epoch": 5.3728991596638656, "grad_norm": 0.909694468472037, "learning_rate": 6.238799545090994e-06, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.12938551604747772, "step": 5115, "valid_targets_mean": 1492.9, "valid_targets_min": 646 }, { "epoch": 5.378151260504202, "grad_norm": 0.8310216699675694, "learning_rate": 6.20083264458981e-06, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.10411947965621948, "step": 5120, "valid_targets_mean": 1369.1, "valid_targets_min": 780 }, { "epoch": 5.383403361344538, "grad_norm": 0.8711155777854998, "learning_rate": 6.162960416685469e-06, "loss": 0.1109, "loss_nan_ranks": 0, "loss_rank_avg": 0.11428333818912506, "step": 5125, "valid_targets_mean": 1521.9, "valid_targets_min": 676 }, { "epoch": 5.388655462184874, "grad_norm": 0.870482484994608, "learning_rate": 6.125183121209741e-06, "loss": 0.1191, "loss_nan_ranks": 0, "loss_rank_avg": 0.10633750259876251, "step": 5130, "valid_targets_mean": 1277.9, "valid_targets_min": 687 }, { "epoch": 5.39390756302521, "grad_norm": 0.8795820034570103, "learning_rate": 6.087501017343107e-06, "loss": 0.1118, "loss_nan_ranks": 0, "loss_rank_avg": 0.10446271300315857, "step": 5135, "valid_targets_mean": 1336.5, "valid_targets_min": 703 }, { "epoch": 5.399159663865547, "grad_norm": 0.8575277820951928, "learning_rate": 6.0499143636129384e-06, "loss": 0.1105, "loss_nan_ranks": 0, "loss_rank_avg": 0.10649226605892181, "step": 5140, "valid_targets_mean": 1288.1, "valid_targets_min": 522 }, { "epoch": 5.404411764705882, "grad_norm": 0.8701860188774736, "learning_rate": 6.012423417891766e-06, "loss": 0.116, "loss_nan_ranks": 0, "loss_rank_avg": 0.11557996273040771, "step": 5145, "valid_targets_mean": 1526.9, "valid_targets_min": 764 }, { "epoch": 5.409663865546219, "grad_norm": 0.9973788403003421, "learning_rate": 5.975028437395493e-06, "loss": 0.124, "loss_nan_ranks": 0, "loss_rank_avg": 0.1302410513162613, "step": 5150, "valid_targets_mean": 1372.4, "valid_targets_min": 548 }, { "epoch": 5.4149159663865545, "grad_norm": 0.8939645783701128, "learning_rate": 5.937729678681612e-06, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.11539514362812042, "step": 5155, "valid_targets_mean": 1356.8, "valid_targets_min": 694 }, { "epoch": 5.420168067226891, "grad_norm": 0.8246273501078926, "learning_rate": 5.9005273976474684e-06, "loss": 0.1136, "loss_nan_ranks": 0, "loss_rank_avg": 0.11548338830471039, "step": 5160, "valid_targets_mean": 1540.9, "valid_targets_min": 823 }, { "epoch": 5.425420168067227, "grad_norm": 0.7236132877010878, "learning_rate": 5.8634218495285126e-06, "loss": 0.0987, "loss_nan_ranks": 0, "loss_rank_avg": 0.08354189991950989, "step": 5165, "valid_targets_mean": 1442.4, "valid_targets_min": 682 }, { "epoch": 5.430672268907563, "grad_norm": 0.8988049282372673, "learning_rate": 5.8264132888965155e-06, "loss": 0.1087, "loss_nan_ranks": 0, "loss_rank_avg": 0.11418993771076202, "step": 5170, "valid_targets_mean": 1407.6, "valid_targets_min": 693 }, { "epoch": 5.435924369747899, "grad_norm": 0.8655375216766177, "learning_rate": 5.789501969657853e-06, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.10003848373889923, "step": 5175, "valid_targets_mean": 1197.8, "valid_targets_min": 639 }, { "epoch": 5.4411764705882355, "grad_norm": 0.8362323911596797, "learning_rate": 5.752688145051761e-06, "loss": 0.1083, "loss_nan_ranks": 0, "loss_rank_avg": 0.09275621920824051, "step": 5180, "valid_targets_mean": 1423.3, "valid_targets_min": 685 }, { "epoch": 5.446428571428571, "grad_norm": 0.8296465425650306, "learning_rate": 5.715972067648561e-06, "loss": 0.1078, "loss_nan_ranks": 0, "loss_rank_avg": 0.10052791237831116, "step": 5185, "valid_targets_mean": 1331.5, "valid_targets_min": 827 }, { "epoch": 5.451680672268908, "grad_norm": 0.8321903503583684, "learning_rate": 5.679353989347989e-06, "loss": 0.1124, "loss_nan_ranks": 0, "loss_rank_avg": 0.10639987140893936, "step": 5190, "valid_targets_mean": 1381.7, "valid_targets_min": 686 }, { "epoch": 5.456932773109243, "grad_norm": 0.8907023908538945, "learning_rate": 5.642834161377408e-06, "loss": 0.1107, "loss_nan_ranks": 0, "loss_rank_avg": 0.11636456847190857, "step": 5195, "valid_targets_mean": 1472.2, "valid_targets_min": 713 }, { "epoch": 5.46218487394958, "grad_norm": 1.304588509837649, "learning_rate": 5.606412834290121e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.2201894223690033, "step": 5200, "valid_targets_mean": 2248.9, "valid_targets_min": 920 }, { "epoch": 5.467436974789916, "grad_norm": 1.075014973641161, "learning_rate": 5.570090257963645e-06, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.2059841752052307, "step": 5205, "valid_targets_mean": 3664.4, "valid_targets_min": 746 }, { "epoch": 5.472689075630252, "grad_norm": 0.8446914601975626, "learning_rate": 5.533866681597981e-06, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.20752739906311035, "step": 5210, "valid_targets_mean": 3591.1, "valid_targets_min": 1635 }, { "epoch": 5.477941176470588, "grad_norm": 0.6615718547643281, "learning_rate": 5.497742353713928e-06, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.1898113489151001, "step": 5215, "valid_targets_mean": 4172.7, "valid_targets_min": 777 }, { "epoch": 5.483193277310924, "grad_norm": 0.6331051011117288, "learning_rate": 5.461717522151371e-06, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.2003975212574005, "step": 5220, "valid_targets_mean": 4040.2, "valid_targets_min": 2187 }, { "epoch": 5.48844537815126, "grad_norm": 0.6969541078527951, "learning_rate": 5.4257924340675535e-06, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.18878155946731567, "step": 5225, "valid_targets_mean": 3156.3, "valid_targets_min": 1432 }, { "epoch": 5.493697478991597, "grad_norm": 0.5916400175296245, "learning_rate": 5.389967335935429e-06, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.17551878094673157, "step": 5230, "valid_targets_mean": 3529.7, "valid_targets_min": 767 }, { "epoch": 5.498949579831933, "grad_norm": 0.624324534174277, "learning_rate": 5.3542424735419306e-06, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.17499442398548126, "step": 5235, "valid_targets_mean": 3485.6, "valid_targets_min": 1488 }, { "epoch": 5.504201680672269, "grad_norm": 0.6222898231435748, "learning_rate": 5.318618091986294e-06, "loss": 0.1916, "loss_nan_ranks": 0, "loss_rank_avg": 0.17875801026821136, "step": 5240, "valid_targets_mean": 3707.0, "valid_targets_min": 578 }, { "epoch": 5.509453781512605, "grad_norm": 0.6245877514119683, "learning_rate": 5.283094435678398e-06, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.19261011481285095, "step": 5245, "valid_targets_mean": 4252.4, "valid_targets_min": 1241 }, { "epoch": 5.514705882352941, "grad_norm": 0.6826116098814055, "learning_rate": 5.2476717483370685e-06, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.21187934279441833, "step": 5250, "valid_targets_mean": 4029.2, "valid_targets_min": 807 }, { "epoch": 5.519957983193278, "grad_norm": 0.5667810450047195, "learning_rate": 5.212350272988394e-06, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.17751820385456085, "step": 5255, "valid_targets_mean": 4507.0, "valid_targets_min": 2011 }, { "epoch": 5.525210084033613, "grad_norm": 0.6114125208911464, "learning_rate": 5.177130251964088e-06, "loss": 0.1976, "loss_nan_ranks": 0, "loss_rank_avg": 0.17235472798347473, "step": 5260, "valid_targets_mean": 4268.2, "valid_targets_min": 1329 }, { "epoch": 5.53046218487395, "grad_norm": 0.6625902480426628, "learning_rate": 5.1420119268998085e-06, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.18950673937797546, "step": 5265, "valid_targets_mean": 3858.9, "valid_targets_min": 1366 }, { "epoch": 5.535714285714286, "grad_norm": 0.6651401874085916, "learning_rate": 5.106995538733488e-06, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.17550374567508698, "step": 5270, "valid_targets_mean": 3169.1, "valid_targets_min": 1334 }, { "epoch": 5.540966386554622, "grad_norm": 0.6231114187474077, "learning_rate": 5.07208132770372e-06, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.18051046133041382, "step": 5275, "valid_targets_mean": 4130.4, "valid_targets_min": 1762 }, { "epoch": 5.546218487394958, "grad_norm": 0.6708862310223077, "learning_rate": 5.037269533348075e-06, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.19089899957180023, "step": 5280, "valid_targets_mean": 3285.0, "valid_targets_min": 855 }, { "epoch": 5.551470588235294, "grad_norm": 0.7236660627737345, "learning_rate": 5.002560394501463e-06, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.2103574275970459, "step": 5285, "valid_targets_mean": 3298.2, "valid_targets_min": 1269 }, { "epoch": 5.55672268907563, "grad_norm": 0.7530081580597202, "learning_rate": 4.9679541492945135e-06, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.1874314844608307, "step": 5290, "valid_targets_mean": 2740.4, "valid_targets_min": 1041 }, { "epoch": 5.561974789915967, "grad_norm": 0.7386136479775732, "learning_rate": 4.933451035151913e-06, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.19821321964263916, "step": 5295, "valid_targets_mean": 2995.1, "valid_targets_min": 1291 }, { "epoch": 5.567226890756302, "grad_norm": 0.72395057035861, "learning_rate": 4.899051288790806e-06, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.18655264377593994, "step": 5300, "valid_targets_mean": 2811.6, "valid_targets_min": 1133 }, { "epoch": 5.572478991596639, "grad_norm": 0.7470437002909036, "learning_rate": 4.86475514621916e-06, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.19498442113399506, "step": 5305, "valid_targets_mean": 3709.5, "valid_targets_min": 865 }, { "epoch": 5.5777310924369745, "grad_norm": 0.7302797839356747, "learning_rate": 4.830562842734112e-06, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.18496988713741302, "step": 5310, "valid_targets_mean": 2960.6, "valid_targets_min": 958 }, { "epoch": 5.582983193277311, "grad_norm": 0.7028513017526096, "learning_rate": 4.796474612920421e-06, "loss": 0.1973, "loss_nan_ranks": 0, "loss_rank_avg": 0.19564983248710632, "step": 5315, "valid_targets_mean": 3189.2, "valid_targets_min": 771 }, { "epoch": 5.588235294117647, "grad_norm": 0.6143075180595077, "learning_rate": 4.762490690648813e-06, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.1765946000814438, "step": 5320, "valid_targets_mean": 3823.1, "valid_targets_min": 1631 }, { "epoch": 5.593487394957983, "grad_norm": 0.7331719157365119, "learning_rate": 4.728611309074374e-06, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.15561848878860474, "step": 5325, "valid_targets_mean": 2639.4, "valid_targets_min": 908 }, { "epoch": 5.598739495798319, "grad_norm": 0.799889226199126, "learning_rate": 4.694836700634975e-06, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.20055752992630005, "step": 5330, "valid_targets_mean": 2988.3, "valid_targets_min": 1264 }, { "epoch": 5.6039915966386555, "grad_norm": 0.7723682554917705, "learning_rate": 4.661167097049668e-06, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.19730721414089203, "step": 5335, "valid_targets_mean": 3563.1, "valid_targets_min": 1889 }, { "epoch": 5.609243697478991, "grad_norm": 0.6899888581366523, "learning_rate": 4.62760272931708e-06, "loss": 0.1879, "loss_nan_ranks": 0, "loss_rank_avg": 0.17451027035713196, "step": 5340, "valid_targets_mean": 3737.9, "valid_targets_min": 1075 }, { "epoch": 5.614495798319328, "grad_norm": 0.7422252794353547, "learning_rate": 4.594143827713844e-06, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.17348533868789673, "step": 5345, "valid_targets_mean": 2745.8, "valid_targets_min": 1036 }, { "epoch": 5.619747899159664, "grad_norm": 0.7524666990737761, "learning_rate": 4.56079062179303e-06, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.1979708969593048, "step": 5350, "valid_targets_mean": 3516.4, "valid_targets_min": 1162 }, { "epoch": 5.625, "grad_norm": 0.6922592034045233, "learning_rate": 4.527543340382538e-06, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.17850226163864136, "step": 5355, "valid_targets_mean": 3279.4, "valid_targets_min": 1281 }, { "epoch": 5.630252100840336, "grad_norm": 0.6631764263997426, "learning_rate": 4.494402211583569e-06, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.16947326064109802, "step": 5360, "valid_targets_mean": 3180.4, "valid_targets_min": 1816 }, { "epoch": 5.635504201680672, "grad_norm": 0.7291414927160216, "learning_rate": 4.461367462769009e-06, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.18259739875793457, "step": 5365, "valid_targets_mean": 2939.2, "valid_targets_min": 1629 }, { "epoch": 5.640756302521009, "grad_norm": 0.7503072179394285, "learning_rate": 4.428439320581923e-06, "loss": 0.1934, "loss_nan_ranks": 0, "loss_rank_avg": 0.1907494068145752, "step": 5370, "valid_targets_mean": 2755.7, "valid_targets_min": 1254 }, { "epoch": 5.6460084033613445, "grad_norm": 0.7463064226667883, "learning_rate": 4.3956180109339705e-06, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.19494910538196564, "step": 5375, "valid_targets_mean": 3390.2, "valid_targets_min": 1973 }, { "epoch": 5.651260504201681, "grad_norm": 0.7574766718662052, "learning_rate": 4.362903759003849e-06, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.175164133310318, "step": 5380, "valid_targets_mean": 2960.4, "valid_targets_min": 1195 }, { "epoch": 5.656512605042017, "grad_norm": 0.7408855986734103, "learning_rate": 4.33029678923576e-06, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.19168353080749512, "step": 5385, "valid_targets_mean": 3181.4, "valid_targets_min": 1244 }, { "epoch": 5.661764705882353, "grad_norm": 0.7242394613336414, "learning_rate": 4.297797325337889e-06, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.1881379634141922, "step": 5390, "valid_targets_mean": 3464.2, "valid_targets_min": 1421 }, { "epoch": 5.667016806722689, "grad_norm": 0.729199912715331, "learning_rate": 4.265405590280822e-06, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.18175436556339264, "step": 5395, "valid_targets_mean": 3443.1, "valid_targets_min": 1097 }, { "epoch": 5.6722689075630255, "grad_norm": 0.7780886091437504, "learning_rate": 4.233121806296072e-06, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.20643776655197144, "step": 5400, "valid_targets_mean": 3891.4, "valid_targets_min": 1168 }, { "epoch": 5.677521008403361, "grad_norm": 2.0082601362553083, "learning_rate": 4.200946194874514e-06, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.19502270221710205, "step": 5405, "valid_targets_mean": 3368.9, "valid_targets_min": 1700 }, { "epoch": 5.682773109243698, "grad_norm": 0.7542156394780143, "learning_rate": 4.168878976764872e-06, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.17632341384887695, "step": 5410, "valid_targets_mean": 2497.1, "valid_targets_min": 1261 }, { "epoch": 5.688025210084033, "grad_norm": 0.7204058422362926, "learning_rate": 4.136920371972228e-06, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.1968623399734497, "step": 5415, "valid_targets_mean": 3391.2, "valid_targets_min": 1124 }, { "epoch": 5.69327731092437, "grad_norm": 0.7514367050409141, "learning_rate": 4.105070599756482e-06, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.1881876438856125, "step": 5420, "valid_targets_mean": 3003.8, "valid_targets_min": 1361 }, { "epoch": 5.698529411764706, "grad_norm": 0.671835209360093, "learning_rate": 4.073329878630856e-06, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.16645438969135284, "step": 5425, "valid_targets_mean": 3239.7, "valid_targets_min": 1679 }, { "epoch": 5.703781512605042, "grad_norm": 0.7151451061634367, "learning_rate": 4.041698426360425e-06, "loss": 0.1883, "loss_nan_ranks": 0, "loss_rank_avg": 0.190008282661438, "step": 5430, "valid_targets_mean": 3101.2, "valid_targets_min": 1739 }, { "epoch": 5.709033613445378, "grad_norm": 0.8510471746451064, "learning_rate": 4.010176459960569e-06, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.172542542219162, "step": 5435, "valid_targets_mean": 2844.4, "valid_targets_min": 1278 }, { "epoch": 5.714285714285714, "grad_norm": 0.6595419486913193, "learning_rate": 3.978764195695528e-06, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.1725081354379654, "step": 5440, "valid_targets_mean": 3563.4, "valid_targets_min": 1522 }, { "epoch": 5.71953781512605, "grad_norm": 0.7513983043013762, "learning_rate": 3.947461849076912e-06, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.1882949024438858, "step": 5445, "valid_targets_mean": 3589.0, "valid_targets_min": 464 }, { "epoch": 5.724789915966387, "grad_norm": 0.6781411607065908, "learning_rate": 3.916269634862193e-06, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.1876165270805359, "step": 5450, "valid_targets_mean": 3827.1, "valid_targets_min": 1003 }, { "epoch": 5.730042016806722, "grad_norm": 0.7521498102078784, "learning_rate": 3.885187767053269e-06, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.18409094214439392, "step": 5455, "valid_targets_mean": 3042.1, "valid_targets_min": 1446 }, { "epoch": 5.735294117647059, "grad_norm": 0.6989125002761396, "learning_rate": 3.854216458894973e-06, "loss": 0.1915, "loss_nan_ranks": 0, "loss_rank_avg": 0.18674632906913757, "step": 5460, "valid_targets_mean": 3257.8, "valid_targets_min": 1256 }, { "epoch": 5.740546218487395, "grad_norm": 0.7363983943406658, "learning_rate": 3.823355922873606e-06, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.20742374658584595, "step": 5465, "valid_targets_mean": 3858.5, "valid_targets_min": 1336 }, { "epoch": 5.745798319327731, "grad_norm": 0.6688145340655683, "learning_rate": 3.792606370715508e-06, "loss": 0.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.18492421507835388, "step": 5470, "valid_targets_mean": 3821.1, "valid_targets_min": 1275 }, { "epoch": 5.751050420168067, "grad_norm": 0.7198758184286466, "learning_rate": 3.761968013385584e-06, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.1842348277568817, "step": 5475, "valid_targets_mean": 2914.6, "valid_targets_min": 644 }, { "epoch": 5.756302521008403, "grad_norm": 0.71314811892582, "learning_rate": 3.731441061085843e-06, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.17556104063987732, "step": 5480, "valid_targets_mean": 3083.4, "valid_targets_min": 1397 }, { "epoch": 5.76155462184874, "grad_norm": 0.7631003279463335, "learning_rate": 3.701025723253988e-06, "loss": 0.1777, "loss_nan_ranks": 0, "loss_rank_avg": 0.17353874444961548, "step": 5485, "valid_targets_mean": 2747.4, "valid_targets_min": 1557 }, { "epoch": 5.766806722689076, "grad_norm": 0.7552536091187607, "learning_rate": 3.67072220856197e-06, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.18228024244308472, "step": 5490, "valid_targets_mean": 3405.2, "valid_targets_min": 1405 }, { "epoch": 5.772058823529412, "grad_norm": 0.7052066859512669, "learning_rate": 3.640530724914517e-06, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.17114409804344177, "step": 5495, "valid_targets_mean": 3507.1, "valid_targets_min": 1042 }, { "epoch": 5.777310924369748, "grad_norm": 0.7275066681746295, "learning_rate": 3.61045147944777e-06, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.1737072765827179, "step": 5500, "valid_targets_mean": 3079.7, "valid_targets_min": 858 }, { "epoch": 5.782563025210084, "grad_norm": 0.738557032225339, "learning_rate": 3.5804846785278315e-06, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.17162227630615234, "step": 5505, "valid_targets_mean": 2934.3, "valid_targets_min": 1288 }, { "epoch": 5.78781512605042, "grad_norm": 0.6881422147874104, "learning_rate": 3.5506305277493326e-06, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.17860713601112366, "step": 5510, "valid_targets_mean": 3428.2, "valid_targets_min": 1915 }, { "epoch": 5.793067226890757, "grad_norm": 0.8082399213846237, "learning_rate": 3.520889231934057e-06, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.2075139284133911, "step": 5515, "valid_targets_mean": 3764.9, "valid_targets_min": 1244 }, { "epoch": 5.798319327731092, "grad_norm": 0.7470662206853251, "learning_rate": 3.4912609951295084e-06, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.18600235879421234, "step": 5520, "valid_targets_mean": 3006.5, "valid_targets_min": 1255 }, { "epoch": 5.803571428571429, "grad_norm": 0.7396369320045814, "learning_rate": 3.461746020607526e-06, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.21041221916675568, "step": 5525, "valid_targets_mean": 3326.2, "valid_targets_min": 1586 }, { "epoch": 5.8088235294117645, "grad_norm": 0.6985035686259948, "learning_rate": 3.432344510862895e-06, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.16554896533489227, "step": 5530, "valid_targets_mean": 3205.2, "valid_targets_min": 1181 }, { "epoch": 5.814075630252101, "grad_norm": 0.7863118868734756, "learning_rate": 3.403056667611917e-06, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.17784982919692993, "step": 5535, "valid_targets_mean": 2735.1, "valid_targets_min": 974 }, { "epoch": 5.819327731092437, "grad_norm": 0.740543140779203, "learning_rate": 3.373882691791088e-06, "loss": 0.1821, "loss_nan_ranks": 0, "loss_rank_avg": 0.19035407900810242, "step": 5540, "valid_targets_mean": 3735.8, "valid_targets_min": 1681 }, { "epoch": 5.824579831932773, "grad_norm": 0.774595013152137, "learning_rate": 3.344822783555679e-06, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.20152834057807922, "step": 5545, "valid_targets_mean": 2883.7, "valid_targets_min": 1171 }, { "epoch": 5.829831932773109, "grad_norm": 0.807774445390228, "learning_rate": 3.315877142278363e-06, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.21530133485794067, "step": 5550, "valid_targets_mean": 3324.1, "valid_targets_min": 1455 }, { "epoch": 5.8350840336134455, "grad_norm": 0.6932108713568098, "learning_rate": 3.287045966547866e-06, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.19992104172706604, "step": 5555, "valid_targets_mean": 3948.6, "valid_targets_min": 1529 }, { "epoch": 5.840336134453781, "grad_norm": 0.7588685281732017, "learning_rate": 3.258329454167599e-06, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.20404741168022156, "step": 5560, "valid_targets_mean": 3419.9, "valid_targets_min": 1450 }, { "epoch": 5.845588235294118, "grad_norm": 0.6654008948279083, "learning_rate": 3.2297278021542833e-06, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.1653444766998291, "step": 5565, "valid_targets_mean": 3465.6, "valid_targets_min": 1431 }, { "epoch": 5.850840336134453, "grad_norm": 0.7617245678374055, "learning_rate": 3.201241206736614e-06, "loss": 0.2007, "loss_nan_ranks": 0, "loss_rank_avg": 0.19317778944969177, "step": 5570, "valid_targets_mean": 3085.4, "valid_targets_min": 802 }, { "epoch": 5.85609243697479, "grad_norm": 0.7601710209752651, "learning_rate": 3.1728698633539266e-06, "loss": 0.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.1923319697380066, "step": 5575, "valid_targets_mean": 3230.6, "valid_targets_min": 1433 }, { "epoch": 5.8613445378151265, "grad_norm": 0.8026621042498756, "learning_rate": 3.1446139666548212e-06, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.19206663966178894, "step": 5580, "valid_targets_mean": 2908.7, "valid_targets_min": 614 }, { "epoch": 5.866596638655462, "grad_norm": 0.8143821059911558, "learning_rate": 3.1164737104958707e-06, "loss": 0.1916, "loss_nan_ranks": 0, "loss_rank_avg": 0.2039254605770111, "step": 5585, "valid_targets_mean": 2748.8, "valid_targets_min": 637 }, { "epoch": 5.871848739495798, "grad_norm": 0.7917201537427566, "learning_rate": 3.0884492879402452e-06, "loss": 0.1983, "loss_nan_ranks": 0, "loss_rank_avg": 0.2050473690032959, "step": 5590, "valid_targets_mean": 3297.7, "valid_targets_min": 1683 }, { "epoch": 5.8771008403361344, "grad_norm": 0.7656092656857109, "learning_rate": 3.0605408912564184e-06, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.18506518006324768, "step": 5595, "valid_targets_mean": 3406.1, "valid_targets_min": 1913 }, { "epoch": 5.882352941176471, "grad_norm": 0.7130368872222834, "learning_rate": 3.032748711916851e-06, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.18892902135849, "step": 5600, "valid_targets_mean": 3848.1, "valid_targets_min": 1659 }, { "epoch": 5.887605042016807, "grad_norm": 0.7127010208647905, "learning_rate": 3.0050729405966495e-06, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.17573906481266022, "step": 5605, "valid_targets_mean": 3390.7, "valid_targets_min": 1390 }, { "epoch": 5.892857142857143, "grad_norm": 0.7730291184647539, "learning_rate": 2.9775137671722754e-06, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.2364846169948578, "step": 5610, "valid_targets_mean": 3338.5, "valid_targets_min": 611 }, { "epoch": 5.898109243697479, "grad_norm": 0.7437425304974528, "learning_rate": 2.9500713807202565e-06, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.1972287893295288, "step": 5615, "valid_targets_mean": 3389.6, "valid_targets_min": 1451 }, { "epoch": 5.9033613445378155, "grad_norm": 0.7338868027074469, "learning_rate": 2.9227459695158543e-06, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.165279358625412, "step": 5620, "valid_targets_mean": 3097.9, "valid_targets_min": 1459 }, { "epoch": 5.908613445378151, "grad_norm": 0.8398618395284945, "learning_rate": 2.895537721031809e-06, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.20163550972938538, "step": 5625, "valid_targets_mean": 2619.4, "valid_targets_min": 999 }, { "epoch": 5.913865546218488, "grad_norm": 0.6872190021050335, "learning_rate": 2.8684468219370364e-06, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.17330724000930786, "step": 5630, "valid_targets_mean": 3791.2, "valid_targets_min": 1564 }, { "epoch": 5.919117647058823, "grad_norm": 0.7915970239951657, "learning_rate": 2.841473458095334e-06, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.19606292247772217, "step": 5635, "valid_targets_mean": 3223.3, "valid_targets_min": 1233 }, { "epoch": 5.92436974789916, "grad_norm": 0.7371089384298193, "learning_rate": 2.8146178145641355e-06, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.18127654492855072, "step": 5640, "valid_targets_mean": 3439.2, "valid_targets_min": 1524 }, { "epoch": 5.929621848739496, "grad_norm": 0.7111215478308646, "learning_rate": 2.787880075593217e-06, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.18391185998916626, "step": 5645, "valid_targets_mean": 3744.9, "valid_targets_min": 1375 }, { "epoch": 5.934873949579832, "grad_norm": 0.7280994223942271, "learning_rate": 2.7612604246234355e-06, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.17705269157886505, "step": 5650, "valid_targets_mean": 3036.2, "valid_targets_min": 906 }, { "epoch": 5.940126050420168, "grad_norm": 0.6242246207880907, "learning_rate": 2.7347590442854867e-06, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.1647983193397522, "step": 5655, "valid_targets_mean": 3766.5, "valid_targets_min": 1246 }, { "epoch": 5.945378151260504, "grad_norm": 0.7653759814637277, "learning_rate": 2.7083761163986433e-06, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.20250293612480164, "step": 5660, "valid_targets_mean": 3225.9, "valid_targets_min": 1333 }, { "epoch": 5.95063025210084, "grad_norm": 0.7475006568229906, "learning_rate": 2.682111821969493e-06, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.19375839829444885, "step": 5665, "valid_targets_mean": 3751.3, "valid_targets_min": 2264 }, { "epoch": 5.955882352941177, "grad_norm": 0.737881904148586, "learning_rate": 2.6559663411907233e-06, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.1940421611070633, "step": 5670, "valid_targets_mean": 3505.2, "valid_targets_min": 1454 }, { "epoch": 5.961134453781512, "grad_norm": 0.7664181534172059, "learning_rate": 2.629939853439856e-06, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.18167239427566528, "step": 5675, "valid_targets_mean": 3385.7, "valid_targets_min": 1430 }, { "epoch": 5.966386554621849, "grad_norm": 0.7497306698153924, "learning_rate": 2.604032537278052e-06, "loss": 0.1847, "loss_nan_ranks": 0, "loss_rank_avg": 0.1727236807346344, "step": 5680, "valid_targets_mean": 3201.6, "valid_targets_min": 1433 }, { "epoch": 5.9716386554621845, "grad_norm": 0.7405178705998576, "learning_rate": 2.5782445704488447e-06, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.1837659776210785, "step": 5685, "valid_targets_mean": 3362.1, "valid_targets_min": 1512 }, { "epoch": 5.976890756302521, "grad_norm": 0.697865915003433, "learning_rate": 2.5525761298769515e-06, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.18182769417762756, "step": 5690, "valid_targets_mean": 3643.9, "valid_targets_min": 2048 }, { "epoch": 5.982142857142857, "grad_norm": 0.7426309465732394, "learning_rate": 2.527027391667054e-06, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.1931290328502655, "step": 5695, "valid_targets_mean": 3107.1, "valid_targets_min": 815 }, { "epoch": 5.987394957983193, "grad_norm": 0.7413852866874329, "learning_rate": 2.501598531102587e-06, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.20602191984653473, "step": 5700, "valid_targets_mean": 3339.4, "valid_targets_min": 1878 }, { "epoch": 5.992647058823529, "grad_norm": 0.8082149132119589, "learning_rate": 2.47628972264452e-06, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.21446332335472107, "step": 5705, "valid_targets_mean": 3394.6, "valid_targets_min": 1727 }, { "epoch": 5.9978991596638656, "grad_norm": 0.673717887910672, "learning_rate": 2.4511011399301944e-06, "loss": 0.1884, "loss_nan_ranks": 0, "loss_rank_avg": 0.1594567894935608, "step": 5710, "valid_targets_mean": 2924.3, "valid_targets_min": 1622 }, { "epoch": 6.003151260504202, "grad_norm": 0.888726685758785, "learning_rate": 2.4260329557721107e-06, "loss": 0.1686, "loss_nan_ranks": 0, "loss_rank_avg": 0.1586988866329193, "step": 5715, "valid_targets_mean": 1587.9, "valid_targets_min": 788 }, { "epoch": 6.008403361344538, "grad_norm": 0.7892723724374661, "learning_rate": 2.4010853421567237e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.12804922461509705, "step": 5720, "valid_targets_mean": 1591.2, "valid_targets_min": 957 }, { "epoch": 6.013655462184874, "grad_norm": 0.7624099131843867, "learning_rate": 2.376258470243309e-06, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.11783352494239807, "step": 5725, "valid_targets_mean": 1418.7, "valid_targets_min": 796 }, { "epoch": 6.01890756302521, "grad_norm": 0.7792462436940873, "learning_rate": 2.351552510362758e-06, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.11473619192838669, "step": 5730, "valid_targets_mean": 1389.0, "valid_targets_min": 704 }, { "epoch": 6.024159663865547, "grad_norm": 0.8703079476348818, "learning_rate": 2.326967632016406e-06, "loss": 0.1226, "loss_nan_ranks": 0, "loss_rank_avg": 0.11579575389623642, "step": 5735, "valid_targets_mean": 1513.9, "valid_targets_min": 638 }, { "epoch": 6.029411764705882, "grad_norm": 0.8915876673258326, "learning_rate": 2.302504003874888e-06, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.12122771143913269, "step": 5740, "valid_targets_mean": 1482.3, "valid_targets_min": 727 }, { "epoch": 6.034663865546219, "grad_norm": 0.8177570400824066, "learning_rate": 2.2781617937769675e-06, "loss": 0.1256, "loss_nan_ranks": 0, "loss_rank_avg": 0.10171643644571304, "step": 5745, "valid_targets_mean": 1189.1, "valid_targets_min": 655 }, { "epoch": 6.0399159663865545, "grad_norm": 1.025573849186844, "learning_rate": 2.2539411687283907e-06, "loss": 0.1108, "loss_nan_ranks": 0, "loss_rank_avg": 0.1116051971912384, "step": 5750, "valid_targets_mean": 1299.6, "valid_targets_min": 714 }, { "epoch": 6.045168067226891, "grad_norm": 0.873608647534603, "learning_rate": 2.229842294900744e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.1157689318060875, "step": 5755, "valid_targets_mean": 1407.6, "valid_targets_min": 741 }, { "epoch": 6.050420168067227, "grad_norm": 0.9798749449474746, "learning_rate": 2.205865337630302e-06, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.13768497109413147, "step": 5760, "valid_targets_mean": 1544.1, "valid_targets_min": 663 }, { "epoch": 6.055672268907563, "grad_norm": 0.916099508349051, "learning_rate": 2.182010461416899e-06, "loss": 0.115, "loss_nan_ranks": 0, "loss_rank_avg": 0.11846692860126495, "step": 5765, "valid_targets_mean": 1511.1, "valid_targets_min": 632 }, { "epoch": 6.060924369747899, "grad_norm": 0.8853677750337303, "learning_rate": 2.158277829922817e-06, "loss": 0.1186, "loss_nan_ranks": 0, "loss_rank_avg": 0.12952449917793274, "step": 5770, "valid_targets_mean": 1638.0, "valid_targets_min": 933 }, { "epoch": 6.0661764705882355, "grad_norm": 0.7694796846656141, "learning_rate": 2.1346676059716253e-06, "loss": 0.1188, "loss_nan_ranks": 0, "loss_rank_avg": 0.11292778700590134, "step": 5775, "valid_targets_mean": 1526.9, "valid_targets_min": 717 }, { "epoch": 6.071428571428571, "grad_norm": 0.8108257454301182, "learning_rate": 2.1111799515471066e-06, "loss": 0.1079, "loss_nan_ranks": 0, "loss_rank_avg": 0.1118139773607254, "step": 5780, "valid_targets_mean": 1387.4, "valid_targets_min": 659 }, { "epoch": 6.076680672268908, "grad_norm": 0.816088021557387, "learning_rate": 2.0878150277921195e-06, "loss": 0.1076, "loss_nan_ranks": 0, "loss_rank_avg": 0.1065862700343132, "step": 5785, "valid_targets_mean": 1382.9, "valid_targets_min": 642 }, { "epoch": 6.081932773109243, "grad_norm": 0.8469714058115316, "learning_rate": 2.064572995007492e-06, "loss": 0.1093, "loss_nan_ranks": 0, "loss_rank_avg": 0.09756132960319519, "step": 5790, "valid_targets_mean": 1312.1, "valid_targets_min": 765 }, { "epoch": 6.08718487394958, "grad_norm": 0.9292126584824716, "learning_rate": 2.0414540126509274e-06, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.11742901057004929, "step": 5795, "valid_targets_mean": 1397.6, "valid_targets_min": 631 }, { "epoch": 6.092436974789916, "grad_norm": 0.9989157343383366, "learning_rate": 2.0184582393359253e-06, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.12957970798015594, "step": 5800, "valid_targets_mean": 1419.4, "valid_targets_min": 623 }, { "epoch": 6.097689075630252, "grad_norm": 0.8687109853494948, "learning_rate": 1.99558583283066e-06, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.12820440530776978, "step": 5805, "valid_targets_mean": 1647.7, "valid_targets_min": 818 }, { "epoch": 6.102941176470588, "grad_norm": 0.8429889291483497, "learning_rate": 1.9728369500569333e-06, "loss": 0.1183, "loss_nan_ranks": 0, "loss_rank_avg": 0.11039917171001434, "step": 5810, "valid_targets_mean": 1545.5, "valid_targets_min": 776 }, { "epoch": 6.108193277310924, "grad_norm": 0.9401593816021946, "learning_rate": 1.950211747089077e-06, "loss": 0.1152, "loss_nan_ranks": 0, "loss_rank_avg": 0.11282265186309814, "step": 5815, "valid_targets_mean": 1411.8, "valid_targets_min": 623 }, { "epoch": 6.11344537815126, "grad_norm": 0.8579915255635823, "learning_rate": 1.927710379152881e-06, "loss": 0.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.11633343994617462, "step": 5820, "valid_targets_mean": 1437.3, "valid_targets_min": 742 }, { "epoch": 6.118697478991597, "grad_norm": 0.8470196779150363, "learning_rate": 1.9053330006245452e-06, "loss": 0.1086, "loss_nan_ranks": 0, "loss_rank_avg": 0.0939580649137497, "step": 5825, "valid_targets_mean": 1193.6, "valid_targets_min": 611 }, { "epoch": 6.123949579831933, "grad_norm": 0.8951203579512895, "learning_rate": 1.8830797650296006e-06, "loss": 0.1087, "loss_nan_ranks": 0, "loss_rank_avg": 0.11357836425304413, "step": 5830, "valid_targets_mean": 1514.0, "valid_targets_min": 793 }, { "epoch": 6.129201680672269, "grad_norm": 0.8204950266453027, "learning_rate": 1.8609508250418628e-06, "loss": 0.1089, "loss_nan_ranks": 0, "loss_rank_avg": 0.10361876338720322, "step": 5835, "valid_targets_mean": 1379.1, "valid_targets_min": 886 }, { "epoch": 6.1344537815126055, "grad_norm": 0.827334438729143, "learning_rate": 1.8389463324823986e-06, "loss": 0.1121, "loss_nan_ranks": 0, "loss_rank_avg": 0.10381718724966049, "step": 5840, "valid_targets_mean": 1455.5, "valid_targets_min": 991 }, { "epoch": 6.139705882352941, "grad_norm": 1.0670876809595125, "learning_rate": 1.81706643831846e-06, "loss": 0.113, "loss_nan_ranks": 0, "loss_rank_avg": 0.11400048434734344, "step": 5845, "valid_targets_mean": 1525.2, "valid_targets_min": 908 }, { "epoch": 6.144957983193278, "grad_norm": 0.9783834172435171, "learning_rate": 1.7953112926624715e-06, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.11489921063184738, "step": 5850, "valid_targets_mean": 1476.6, "valid_targets_min": 680 }, { "epoch": 6.150210084033613, "grad_norm": 0.8766319864539988, "learning_rate": 1.7736810447709852e-06, "loss": 0.1092, "loss_nan_ranks": 0, "loss_rank_avg": 0.11097388714551926, "step": 5855, "valid_targets_mean": 1467.1, "valid_targets_min": 803 }, { "epoch": 6.15546218487395, "grad_norm": 0.8785524728820334, "learning_rate": 1.7521758430436553e-06, "loss": 0.1158, "loss_nan_ranks": 0, "loss_rank_avg": 0.10426779836416245, "step": 5860, "valid_targets_mean": 1341.3, "valid_targets_min": 765 }, { "epoch": 6.160714285714286, "grad_norm": 0.8829153848682123, "learning_rate": 1.7307958350222366e-06, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.11685581505298615, "step": 5865, "valid_targets_mean": 1556.4, "valid_targets_min": 804 }, { "epoch": 6.165966386554622, "grad_norm": 0.8180165865392631, "learning_rate": 1.7095411673895545e-06, "loss": 0.1147, "loss_nan_ranks": 0, "loss_rank_avg": 0.11777027696371078, "step": 5870, "valid_targets_mean": 1509.7, "valid_targets_min": 675 }, { "epoch": 6.171218487394958, "grad_norm": 0.8375114382633897, "learning_rate": 1.6884119859685034e-06, "loss": 0.1098, "loss_nan_ranks": 0, "loss_rank_avg": 0.11995431780815125, "step": 5875, "valid_targets_mean": 1408.4, "valid_targets_min": 882 }, { "epoch": 6.176470588235294, "grad_norm": 0.7972330265214028, "learning_rate": 1.6674084357210562e-06, "loss": 0.1071, "loss_nan_ranks": 0, "loss_rank_avg": 0.10255067050457001, "step": 5880, "valid_targets_mean": 1449.8, "valid_targets_min": 660 }, { "epoch": 6.18172268907563, "grad_norm": 0.8858809578498907, "learning_rate": 1.6465306607472608e-06, "loss": 0.102, "loss_nan_ranks": 0, "loss_rank_avg": 0.10549542307853699, "step": 5885, "valid_targets_mean": 1489.8, "valid_targets_min": 678 }, { "epoch": 6.186974789915967, "grad_norm": 0.9235725158063691, "learning_rate": 1.625778804284246e-06, "loss": 0.1083, "loss_nan_ranks": 0, "loss_rank_avg": 0.10902103036642075, "step": 5890, "valid_targets_mean": 1379.1, "valid_targets_min": 676 }, { "epoch": 6.192226890756302, "grad_norm": 0.8610604938191373, "learning_rate": 1.6051530087052558e-06, "loss": 0.1107, "loss_nan_ranks": 0, "loss_rank_avg": 0.10405048727989197, "step": 5895, "valid_targets_mean": 1347.1, "valid_targets_min": 794 }, { "epoch": 6.197478991596639, "grad_norm": 0.844841243204075, "learning_rate": 1.5846534155186511e-06, "loss": 0.1103, "loss_nan_ranks": 0, "loss_rank_avg": 0.1075349748134613, "step": 5900, "valid_targets_mean": 1372.6, "valid_targets_min": 607 }, { "epoch": 6.2027310924369745, "grad_norm": 0.9299916077128926, "learning_rate": 1.564280165366956e-06, "loss": 0.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.11143974959850311, "step": 5905, "valid_targets_mean": 1323.6, "valid_targets_min": 722 }, { "epoch": 6.207983193277311, "grad_norm": 0.9520206844500675, "learning_rate": 1.544033398025886e-06, "loss": 0.1164, "loss_nan_ranks": 0, "loss_rank_avg": 0.12437736988067627, "step": 5910, "valid_targets_mean": 1597.7, "valid_targets_min": 858 }, { "epoch": 6.213235294117647, "grad_norm": 0.8264419715144223, "learning_rate": 1.5239132524033951e-06, "loss": 0.0983, "loss_nan_ranks": 0, "loss_rank_avg": 0.09098273515701294, "step": 5915, "valid_targets_mean": 1270.8, "valid_targets_min": 689 }, { "epoch": 6.218487394957983, "grad_norm": 0.9121347316675537, "learning_rate": 1.50391986653871e-06, "loss": 0.1151, "loss_nan_ranks": 0, "loss_rank_avg": 0.10781864076852798, "step": 5920, "valid_targets_mean": 1388.2, "valid_targets_min": 692 }, { "epoch": 6.223739495798319, "grad_norm": 0.8183103322870855, "learning_rate": 1.4840533776013954e-06, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.0995546281337738, "step": 5925, "valid_targets_mean": 1447.2, "valid_targets_min": 828 }, { "epoch": 6.2289915966386555, "grad_norm": 0.8695709319336882, "learning_rate": 1.4643139218904035e-06, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.1060028076171875, "step": 5930, "valid_targets_mean": 1399.7, "valid_targets_min": 618 }, { "epoch": 6.234243697478991, "grad_norm": 0.7936160826191869, "learning_rate": 1.4447016348331477e-06, "loss": 0.1041, "loss_nan_ranks": 0, "loss_rank_avg": 0.10275650769472122, "step": 5935, "valid_targets_mean": 1454.3, "valid_targets_min": 629 }, { "epoch": 6.239495798319328, "grad_norm": 1.0003364025533468, "learning_rate": 1.4252166509845777e-06, "loss": 0.1087, "loss_nan_ranks": 0, "loss_rank_avg": 0.1305723935365677, "step": 5940, "valid_targets_mean": 1746.1, "valid_targets_min": 1071 }, { "epoch": 6.244747899159663, "grad_norm": 0.9039823804020426, "learning_rate": 1.4058591040262259e-06, "loss": 0.1079, "loss_nan_ranks": 0, "loss_rank_avg": 0.1077783852815628, "step": 5945, "valid_targets_mean": 1282.2, "valid_targets_min": 677 }, { "epoch": 6.25, "grad_norm": 0.8985676998446693, "learning_rate": 1.3866291267653309e-06, "loss": 0.1031, "loss_nan_ranks": 0, "loss_rank_avg": 0.09621434658765793, "step": 5950, "valid_targets_mean": 1227.6, "valid_targets_min": 679 }, { "epoch": 6.255252100840336, "grad_norm": 0.8526105872349939, "learning_rate": 1.3675268511339067e-06, "loss": 0.1043, "loss_nan_ranks": 0, "loss_rank_avg": 0.09855210781097412, "step": 5955, "valid_targets_mean": 1319.1, "valid_targets_min": 504 }, { "epoch": 6.260504201680672, "grad_norm": 0.8620937247837483, "learning_rate": 1.3485524081878288e-06, "loss": 0.1069, "loss_nan_ranks": 0, "loss_rank_avg": 0.1124173030257225, "step": 5960, "valid_targets_mean": 1616.5, "valid_targets_min": 1023 }, { "epoch": 6.265756302521009, "grad_norm": 0.8269435472596893, "learning_rate": 1.3297059281059533e-06, "loss": 0.1092, "loss_nan_ranks": 0, "loss_rank_avg": 0.10087428987026215, "step": 5965, "valid_targets_mean": 1453.0, "valid_targets_min": 661 }, { "epoch": 6.2710084033613445, "grad_norm": 0.8464773093003739, "learning_rate": 1.3109875401892146e-06, "loss": 0.111, "loss_nan_ranks": 0, "loss_rank_avg": 0.10120785981416702, "step": 5970, "valid_targets_mean": 1442.0, "valid_targets_min": 889 }, { "epoch": 6.276260504201681, "grad_norm": 0.809843624015962, "learning_rate": 1.2923973728597373e-06, "loss": 0.1037, "loss_nan_ranks": 0, "loss_rank_avg": 0.10031883418560028, "step": 5975, "valid_targets_mean": 1548.4, "valid_targets_min": 723 }, { "epoch": 6.281512605042017, "grad_norm": 0.8939758957054761, "learning_rate": 1.2739355536599508e-06, "loss": 0.1095, "loss_nan_ranks": 0, "loss_rank_avg": 0.10138392448425293, "step": 5980, "valid_targets_mean": 1359.8, "valid_targets_min": 793 }, { "epoch": 6.286764705882353, "grad_norm": 0.9990516754583353, "learning_rate": 1.2556022092517362e-06, "loss": 0.1055, "loss_nan_ranks": 0, "loss_rank_avg": 0.11516615748405457, "step": 5985, "valid_targets_mean": 1478.6, "valid_targets_min": 861 }, { "epoch": 6.292016806722689, "grad_norm": 0.8483028409836717, "learning_rate": 1.237397465415524e-06, "loss": 0.1076, "loss_nan_ranks": 0, "loss_rank_avg": 0.0986555963754654, "step": 5990, "valid_targets_mean": 1332.7, "valid_targets_min": 752 }, { "epoch": 6.2972689075630255, "grad_norm": 0.9848150205283159, "learning_rate": 1.2193214470494664e-06, "loss": 0.1076, "loss_nan_ranks": 0, "loss_rank_avg": 0.11558929085731506, "step": 5995, "valid_targets_mean": 1622.7, "valid_targets_min": 789 }, { "epoch": 6.302521008403361, "grad_norm": 0.9238690287611016, "learning_rate": 1.201374278168541e-06, "loss": 0.0962, "loss_nan_ranks": 0, "loss_rank_avg": 0.08862060308456421, "step": 6000, "valid_targets_mean": 1195.4, "valid_targets_min": 567 }, { "epoch": 6.307773109243698, "grad_norm": 0.9550625507498628, "learning_rate": 1.1835560819037429e-06, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.12365525960922241, "step": 6005, "valid_targets_mean": 1504.5, "valid_targets_min": 605 }, { "epoch": 6.313025210084033, "grad_norm": 0.8977013451179156, "learning_rate": 1.1658669805012112e-06, "loss": 0.1088, "loss_nan_ranks": 0, "loss_rank_avg": 0.10444406419992447, "step": 6010, "valid_targets_mean": 1580.1, "valid_targets_min": 746 }, { "epoch": 6.31827731092437, "grad_norm": 0.9626620928600009, "learning_rate": 1.1483070953213904e-06, "loss": 0.1017, "loss_nan_ranks": 0, "loss_rank_avg": 0.09486856311559677, "step": 6015, "valid_targets_mean": 1158.2, "valid_targets_min": 723 }, { "epoch": 6.323529411764706, "grad_norm": 0.857918445866971, "learning_rate": 1.130876546838211e-06, "loss": 0.1092, "loss_nan_ranks": 0, "loss_rank_avg": 0.107955202460289, "step": 6020, "valid_targets_mean": 1430.4, "valid_targets_min": 855 }, { "epoch": 6.328781512605042, "grad_norm": 0.8446463752304134, "learning_rate": 1.1135754546382627e-06, "loss": 0.111, "loss_nan_ranks": 0, "loss_rank_avg": 0.10878735780715942, "step": 6025, "valid_targets_mean": 1590.4, "valid_targets_min": 902 }, { "epoch": 6.334033613445378, "grad_norm": 0.8359256112732846, "learning_rate": 1.0964039374199564e-06, "loss": 0.108, "loss_nan_ranks": 0, "loss_rank_avg": 0.10430100560188293, "step": 6030, "valid_targets_mean": 1521.5, "valid_targets_min": 803 }, { "epoch": 6.339285714285714, "grad_norm": 0.9402998650985804, "learning_rate": 1.07936211299273e-06, "loss": 0.1083, "loss_nan_ranks": 0, "loss_rank_avg": 0.11771460622549057, "step": 6035, "valid_targets_mean": 1455.2, "valid_targets_min": 740 }, { "epoch": 6.34453781512605, "grad_norm": 0.8950360049257687, "learning_rate": 1.0624500982762376e-06, "loss": 0.1031, "loss_nan_ranks": 0, "loss_rank_avg": 0.09641949832439423, "step": 6040, "valid_targets_mean": 1279.4, "valid_targets_min": 244 }, { "epoch": 6.349789915966387, "grad_norm": 0.8797683867630403, "learning_rate": 1.045668009299523e-06, "loss": 0.1104, "loss_nan_ranks": 0, "loss_rank_avg": 0.10380536317825317, "step": 6045, "valid_targets_mean": 1366.9, "valid_targets_min": 714 }, { "epoch": 6.355042016806722, "grad_norm": 0.8500779068020419, "learning_rate": 1.029015961200266e-06, "loss": 0.1055, "loss_nan_ranks": 0, "loss_rank_avg": 0.08908183872699738, "step": 6050, "valid_targets_mean": 1220.5, "valid_targets_min": 585 }, { "epoch": 6.360294117647059, "grad_norm": 0.963766954956786, "learning_rate": 1.012494068223946e-06, "loss": 0.1142, "loss_nan_ranks": 0, "loss_rank_avg": 0.11748844385147095, "step": 6055, "valid_targets_mean": 1596.4, "valid_targets_min": 1041 }, { "epoch": 6.3655462184873945, "grad_norm": 1.013786349356977, "learning_rate": 9.961024437230948e-07, "loss": 0.1081, "loss_nan_ranks": 0, "loss_rank_avg": 0.10118795186281204, "step": 6060, "valid_targets_mean": 1401.3, "valid_targets_min": 777 }, { "epoch": 6.370798319327731, "grad_norm": 0.8907088069055336, "learning_rate": 9.798412001565038e-07, "loss": 0.1095, "loss_nan_ranks": 0, "loss_rank_avg": 0.10110174119472504, "step": 6065, "valid_targets_mean": 1546.8, "valid_targets_min": 959 }, { "epoch": 6.376050420168067, "grad_norm": 0.836878249917925, "learning_rate": 9.63710449088453e-07, "loss": 0.1052, "loss_nan_ranks": 0, "loss_rank_avg": 0.0972297191619873, "step": 6070, "valid_targets_mean": 1284.4, "valid_targets_min": 620 }, { "epoch": 6.381302521008403, "grad_norm": 0.8342602387448971, "learning_rate": 9.477103011879408e-07, "loss": 0.1035, "loss_nan_ranks": 0, "loss_rank_avg": 0.0927862748503685, "step": 6075, "valid_targets_mean": 1356.6, "valid_targets_min": 656 }, { "epoch": 6.38655462184874, "grad_norm": 0.9521526310876444, "learning_rate": 9.318408662279399e-07, "loss": 0.1113, "loss_nan_ranks": 0, "loss_rank_avg": 0.12353593111038208, "step": 6080, "valid_targets_mean": 1564.5, "valid_targets_min": 697 }, { "epoch": 6.391806722689076, "grad_norm": 0.8338141493940605, "learning_rate": 9.161022530846253e-07, "loss": 0.0993, "loss_nan_ranks": 0, "loss_rank_avg": 0.09638993442058563, "step": 6085, "valid_targets_mean": 1604.7, "valid_targets_min": 682 }, { "epoch": 6.397058823529412, "grad_norm": 0.9780093813312944, "learning_rate": 9.004945697366452e-07, "loss": 0.1, "loss_nan_ranks": 0, "loss_rank_avg": 0.09383905678987503, "step": 6090, "valid_targets_mean": 1383.4, "valid_targets_min": 730 }, { "epoch": 6.402310924369748, "grad_norm": 0.891231287791507, "learning_rate": 8.850179232643641e-07, "loss": 0.1047, "loss_nan_ranks": 0, "loss_rank_avg": 0.10458773374557495, "step": 6095, "valid_targets_mean": 1482.5, "valid_targets_min": 747 }, { "epoch": 6.407563025210084, "grad_norm": 0.8092854746476409, "learning_rate": 8.696724198491369e-07, "loss": 0.1152, "loss_nan_ranks": 0, "loss_rank_avg": 0.10784599184989929, "step": 6100, "valid_targets_mean": 1603.6, "valid_targets_min": 933 }, { "epoch": 6.41281512605042, "grad_norm": 0.9405797225301739, "learning_rate": 8.544581647725825e-07, "loss": 0.1025, "loss_nan_ranks": 0, "loss_rank_avg": 0.10436847805976868, "step": 6105, "valid_targets_mean": 1517.9, "valid_targets_min": 799 }, { "epoch": 6.418067226890757, "grad_norm": 0.8958196229325652, "learning_rate": 8.393752624158603e-07, "loss": 0.102, "loss_nan_ranks": 0, "loss_rank_avg": 0.10442647337913513, "step": 6110, "valid_targets_mean": 1516.2, "valid_targets_min": 909 }, { "epoch": 6.423319327731092, "grad_norm": 0.8319689597681014, "learning_rate": 8.244238162589435e-07, "loss": 0.0991, "loss_nan_ranks": 0, "loss_rank_avg": 0.10206621140241623, "step": 6115, "valid_targets_mean": 1606.8, "valid_targets_min": 741 }, { "epoch": 6.428571428571429, "grad_norm": 0.8710279467847112, "learning_rate": 8.096039288799251e-07, "loss": 0.0907, "loss_nan_ranks": 0, "loss_rank_avg": 0.09631064534187317, "step": 6120, "valid_targets_mean": 1328.7, "valid_targets_min": 720 }, { "epoch": 6.4338235294117645, "grad_norm": 0.8396789652735168, "learning_rate": 7.949157019543064e-07, "loss": 0.1038, "loss_nan_ranks": 0, "loss_rank_avg": 0.10037371516227722, "step": 6125, "valid_targets_mean": 1396.2, "valid_targets_min": 610 }, { "epoch": 6.439075630252101, "grad_norm": 0.8987178018129869, "learning_rate": 7.803592362542911e-07, "loss": 0.0992, "loss_nan_ranks": 0, "loss_rank_avg": 0.10167519003152847, "step": 6130, "valid_targets_mean": 1352.9, "valid_targets_min": 684 }, { "epoch": 6.444327731092437, "grad_norm": 0.8464981713812435, "learning_rate": 7.659346316481086e-07, "loss": 0.0978, "loss_nan_ranks": 0, "loss_rank_avg": 0.09975661337375641, "step": 6135, "valid_targets_mean": 1479.4, "valid_targets_min": 874 }, { "epoch": 6.449579831932773, "grad_norm": 0.8500419492524814, "learning_rate": 7.516419870993296e-07, "loss": 0.1026, "loss_nan_ranks": 0, "loss_rank_avg": 0.09866391867399216, "step": 6140, "valid_targets_mean": 1501.2, "valid_targets_min": 765 }, { "epoch": 6.454831932773109, "grad_norm": 0.8846021286748634, "learning_rate": 7.374814006661667e-07, "loss": 0.1004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0995045006275177, "step": 6145, "valid_targets_mean": 1419.9, "valid_targets_min": 589 }, { "epoch": 6.4600840336134455, "grad_norm": 0.9586129744458028, "learning_rate": 7.234529695008241e-07, "loss": 0.1043, "loss_nan_ranks": 0, "loss_rank_avg": 0.1108023077249527, "step": 6150, "valid_targets_mean": 1587.2, "valid_targets_min": 918 }, { "epoch": 6.465336134453781, "grad_norm": 1.136739780639734, "learning_rate": 7.095567898488175e-07, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.20650501549243927, "step": 6155, "valid_targets_mean": 3546.9, "valid_targets_min": 702 }, { "epoch": 6.470588235294118, "grad_norm": 1.156568540868847, "learning_rate": 6.957929570483224e-07, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.2196894884109497, "step": 6160, "valid_targets_mean": 4000.6, "valid_targets_min": 1005 }, { "epoch": 6.475840336134453, "grad_norm": 1.0910237455501957, "learning_rate": 6.821615655295155e-07, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.19706688821315765, "step": 6165, "valid_targets_mean": 4063.9, "valid_targets_min": 1296 }, { "epoch": 6.48109243697479, "grad_norm": 0.9433508198462144, "learning_rate": 6.686627088139253e-07, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.18134765326976776, "step": 6170, "valid_targets_mean": 3747.0, "valid_targets_min": 1561 }, { "epoch": 6.486344537815126, "grad_norm": 0.9443013244173882, "learning_rate": 6.552964795137895e-07, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.206732839345932, "step": 6175, "valid_targets_mean": 3562.5, "valid_targets_min": 1044 }, { "epoch": 6.491596638655462, "grad_norm": 0.7981181274477949, "learning_rate": 6.420629693314317e-07, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.1745770275592804, "step": 6180, "valid_targets_mean": 3911.4, "valid_targets_min": 920 }, { "epoch": 6.496848739495798, "grad_norm": 1.0053288601599724, "learning_rate": 6.289622690586151e-07, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.21677300333976746, "step": 6185, "valid_targets_mean": 5753.8, "valid_targets_min": 2060 }, { "epoch": 6.5021008403361344, "grad_norm": 0.8097609883366772, "learning_rate": 6.159944685759289e-07, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.19428494572639465, "step": 6190, "valid_targets_mean": 3728.6, "valid_targets_min": 467 }, { "epoch": 6.507352941176471, "grad_norm": 0.8064900139004815, "learning_rate": 6.031596568521792e-07, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.20241563022136688, "step": 6195, "valid_targets_mean": 3554.0, "valid_targets_min": 1689 }, { "epoch": 6.512605042016807, "grad_norm": 0.776184144360134, "learning_rate": 5.904579219437567e-07, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.1855916827917099, "step": 6200, "valid_targets_mean": 3708.1, "valid_targets_min": 1697 }, { "epoch": 6.517857142857143, "grad_norm": 0.7831624701562231, "learning_rate": 5.778893509940497e-07, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.2027127742767334, "step": 6205, "valid_targets_mean": 3652.6, "valid_targets_min": 1223 }, { "epoch": 6.523109243697479, "grad_norm": 0.7592030323419526, "learning_rate": 5.654540302328526e-07, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.18956655263900757, "step": 6210, "valid_targets_mean": 4036.1, "valid_targets_min": 1552 }, { "epoch": 6.5283613445378155, "grad_norm": 0.7395667543125498, "learning_rate": 5.531520449757465e-07, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.1876063048839569, "step": 6215, "valid_targets_mean": 3543.5, "valid_targets_min": 1439 }, { "epoch": 6.533613445378151, "grad_norm": 0.7046765053549935, "learning_rate": 5.409834796235447e-07, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.1793154776096344, "step": 6220, "valid_targets_mean": 3287.0, "valid_targets_min": 1402 }, { "epoch": 6.538865546218488, "grad_norm": 0.7352367532176454, "learning_rate": 5.28948417661701e-07, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.19139184057712555, "step": 6225, "valid_targets_mean": 3423.9, "valid_targets_min": 1586 }, { "epoch": 6.544117647058823, "grad_norm": 0.7217587370221558, "learning_rate": 5.170469416597223e-07, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.18540339171886444, "step": 6230, "valid_targets_mean": 3406.0, "valid_targets_min": 1538 }, { "epoch": 6.54936974789916, "grad_norm": 0.8448265208591422, "learning_rate": 5.05279133270633e-07, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.18816813826560974, "step": 6235, "valid_targets_mean": 2954.0, "valid_targets_min": 1058 }, { "epoch": 6.554621848739496, "grad_norm": 0.7796897965938916, "learning_rate": 4.936450732303866e-07, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.198177307844162, "step": 6240, "valid_targets_mean": 3051.8, "valid_targets_min": 1362 }, { "epoch": 6.559873949579832, "grad_norm": 0.6964707697678552, "learning_rate": 4.821448413573237e-07, "loss": 0.1875, "loss_nan_ranks": 0, "loss_rank_avg": 0.1926005631685257, "step": 6245, "valid_targets_mean": 3620.5, "valid_targets_min": 1392 }, { "epoch": 6.565126050420168, "grad_norm": 0.7685525826201484, "learning_rate": 4.70778516551631e-07, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.18368004262447357, "step": 6250, "valid_targets_mean": 3103.6, "valid_targets_min": 1267 }, { "epoch": 6.570378151260504, "grad_norm": 0.7299698999315323, "learning_rate": 4.595461767947829e-07, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.19365397095680237, "step": 6255, "valid_targets_mean": 3592.7, "valid_targets_min": 1026 }, { "epoch": 6.57563025210084, "grad_norm": 0.7134849644818172, "learning_rate": 4.484478991490249e-07, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.18238605558872223, "step": 6260, "valid_targets_mean": 3632.1, "valid_targets_min": 1785 }, { "epoch": 6.580882352941177, "grad_norm": 0.7566638135613766, "learning_rate": 4.374837597568338e-07, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.17180000245571136, "step": 6265, "valid_targets_mean": 3557.1, "valid_targets_min": 1957 }, { "epoch": 6.586134453781512, "grad_norm": 0.7212160746237427, "learning_rate": 4.266538338403936e-07, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.17052122950553894, "step": 6270, "valid_targets_mean": 3230.6, "valid_targets_min": 1570 }, { "epoch": 6.591386554621849, "grad_norm": 0.7590336258795505, "learning_rate": 4.159581957010894e-07, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.18137861788272858, "step": 6275, "valid_targets_mean": 3023.7, "valid_targets_min": 997 }, { "epoch": 6.5966386554621845, "grad_norm": 0.7939812548685019, "learning_rate": 4.0539691871898545e-07, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.20064428448677063, "step": 6280, "valid_targets_mean": 3056.6, "valid_targets_min": 1293 }, { "epoch": 6.601890756302521, "grad_norm": 0.7459390024198103, "learning_rate": 3.949700753523344e-07, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.16911663115024567, "step": 6285, "valid_targets_mean": 2915.6, "valid_targets_min": 1687 }, { "epoch": 6.607142857142857, "grad_norm": 0.8123891604766348, "learning_rate": 3.8467773713707134e-07, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.19759421050548553, "step": 6290, "valid_targets_mean": 2985.1, "valid_targets_min": 1108 }, { "epoch": 6.612394957983193, "grad_norm": 0.7820274649796405, "learning_rate": 3.7451997468632486e-07, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.17913171648979187, "step": 6295, "valid_targets_mean": 3195.0, "valid_targets_min": 571 }, { "epoch": 6.617647058823529, "grad_norm": 0.7958593118852751, "learning_rate": 3.6449685768993327e-07, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.19205614924430847, "step": 6300, "valid_targets_mean": 3106.2, "valid_targets_min": 738 }, { "epoch": 6.6228991596638656, "grad_norm": 0.727974701275133, "learning_rate": 3.5460845491396944e-07, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.1842992901802063, "step": 6305, "valid_targets_mean": 3189.5, "valid_targets_min": 1896 }, { "epoch": 6.628151260504202, "grad_norm": 0.737246932634588, "learning_rate": 3.448548342002589e-07, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.18911173939704895, "step": 6310, "valid_targets_mean": 3278.9, "valid_targets_min": 1177 }, { "epoch": 6.633403361344538, "grad_norm": 0.7200101677641911, "learning_rate": 3.352360624659312e-07, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.19001314043998718, "step": 6315, "valid_targets_mean": 3398.8, "valid_targets_min": 1270 }, { "epoch": 6.6386554621848735, "grad_norm": 0.6991330740624144, "learning_rate": 3.2575220570294276e-07, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.1835232377052307, "step": 6320, "valid_targets_mean": 3829.2, "valid_targets_min": 1668 }, { "epoch": 6.64390756302521, "grad_norm": 0.6942560490970551, "learning_rate": 3.164033289776369e-07, "loss": 0.1857, "loss_nan_ranks": 0, "loss_rank_avg": 0.18814723193645477, "step": 6325, "valid_targets_mean": 3426.9, "valid_targets_min": 1184 }, { "epoch": 6.649159663865547, "grad_norm": 0.7240553846645934, "learning_rate": 3.071894964302935e-07, "loss": 0.1851, "loss_nan_ranks": 0, "loss_rank_avg": 0.19533832371234894, "step": 6330, "valid_targets_mean": 3523.6, "valid_targets_min": 1858 }, { "epoch": 6.654411764705882, "grad_norm": 0.6784877207352158, "learning_rate": 2.981107712746867e-07, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.16024400293827057, "step": 6335, "valid_targets_mean": 3161.2, "valid_targets_min": 922 }, { "epoch": 6.659663865546219, "grad_norm": 0.8123686861228415, "learning_rate": 2.891672157976522e-07, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.212624192237854, "step": 6340, "valid_targets_mean": 2948.9, "valid_targets_min": 1812 }, { "epoch": 6.6649159663865545, "grad_norm": 0.7276516066486569, "learning_rate": 2.803588913586608e-07, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.17187952995300293, "step": 6345, "valid_targets_mean": 3107.7, "valid_targets_min": 977 }, { "epoch": 6.670168067226891, "grad_norm": 0.6887997469688529, "learning_rate": 2.716858583894033e-07, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.16475774347782135, "step": 6350, "valid_targets_mean": 3372.6, "valid_targets_min": 810 }, { "epoch": 6.675420168067227, "grad_norm": 0.7520402794788272, "learning_rate": 2.6314817639335964e-07, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.17598888278007507, "step": 6355, "valid_targets_mean": 3305.2, "valid_targets_min": 1673 }, { "epoch": 6.680672268907563, "grad_norm": 0.6523534201108536, "learning_rate": 2.547459039454103e-07, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.15471762418746948, "step": 6360, "valid_targets_mean": 3933.0, "valid_targets_min": 1869 }, { "epoch": 6.685924369747899, "grad_norm": 0.8552212655149624, "learning_rate": 2.4647909869142117e-07, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.20678521692752838, "step": 6365, "valid_targets_mean": 3010.2, "valid_targets_min": 1377 }, { "epoch": 6.6911764705882355, "grad_norm": 0.7322859160819369, "learning_rate": 2.3834781734784817e-07, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.18106794357299805, "step": 6370, "valid_targets_mean": 3055.6, "valid_targets_min": 1219 }, { "epoch": 6.696428571428571, "grad_norm": 0.738490804680364, "learning_rate": 2.3035211570135995e-07, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.17908601462841034, "step": 6375, "valid_targets_mean": 3442.4, "valid_targets_min": 1168 }, { "epoch": 6.701680672268908, "grad_norm": 0.7971361125915069, "learning_rate": 2.224920486084403e-07, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.18598723411560059, "step": 6380, "valid_targets_mean": 3041.9, "valid_targets_min": 1955 }, { "epoch": 6.706932773109243, "grad_norm": 0.7900277569565785, "learning_rate": 2.1476766999502408e-07, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.18570013344287872, "step": 6385, "valid_targets_mean": 3640.2, "valid_targets_min": 1628 }, { "epoch": 6.71218487394958, "grad_norm": 0.6556232945874763, "learning_rate": 2.071790328561152e-07, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.1550453007221222, "step": 6390, "valid_targets_mean": 3358.4, "valid_targets_min": 1482 }, { "epoch": 6.717436974789916, "grad_norm": 0.6812790984777259, "learning_rate": 1.997261892554403e-07, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.15719173848628998, "step": 6395, "valid_targets_mean": 3460.4, "valid_targets_min": 904 }, { "epoch": 6.722689075630252, "grad_norm": 0.7769101571262454, "learning_rate": 1.9240919032506688e-07, "loss": 0.1875, "loss_nan_ranks": 0, "loss_rank_avg": 0.2275974154472351, "step": 6400, "valid_targets_mean": 3728.4, "valid_targets_min": 1194 }, { "epoch": 6.727941176470588, "grad_norm": 0.7389737083348429, "learning_rate": 1.8522808626507683e-07, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.1957985758781433, "step": 6405, "valid_targets_mean": 3940.4, "valid_targets_min": 1658 }, { "epoch": 6.733193277310924, "grad_norm": 0.77498392264914, "learning_rate": 1.781829263432111e-07, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.1999933421611786, "step": 6410, "valid_targets_mean": 3536.9, "valid_targets_min": 1423 }, { "epoch": 6.73844537815126, "grad_norm": 0.7005856165044073, "learning_rate": 1.7127375889452569e-07, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.1850917786359787, "step": 6415, "valid_targets_mean": 3351.2, "valid_targets_min": 2010 }, { "epoch": 6.743697478991597, "grad_norm": 0.7167520426399059, "learning_rate": 1.6450063132107396e-07, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.18986815214157104, "step": 6420, "valid_targets_mean": 3498.6, "valid_targets_min": 1172 }, { "epoch": 6.748949579831933, "grad_norm": 0.6942759631181366, "learning_rate": 1.5786359009156928e-07, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.18716512620449066, "step": 6425, "valid_targets_mean": 3863.8, "valid_targets_min": 1229 }, { "epoch": 6.754201680672269, "grad_norm": 0.6936745579008864, "learning_rate": 1.5136268074107398e-07, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.1890535056591034, "step": 6430, "valid_targets_mean": 3600.5, "valid_targets_min": 1523 }, { "epoch": 6.759453781512605, "grad_norm": 0.7070845571059466, "learning_rate": 1.44997947870682e-07, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.17694947123527527, "step": 6435, "valid_targets_mean": 3623.9, "valid_targets_min": 997 }, { "epoch": 6.764705882352941, "grad_norm": 0.7375315587768612, "learning_rate": 1.3876943514721465e-07, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.17876756191253662, "step": 6440, "valid_targets_mean": 3535.2, "valid_targets_min": 621 }, { "epoch": 6.769957983193278, "grad_norm": 0.7430227920142868, "learning_rate": 1.3267718530292296e-07, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.18011704087257385, "step": 6445, "valid_targets_mean": 3071.5, "valid_targets_min": 1282 }, { "epoch": 6.775210084033613, "grad_norm": 0.6530774473575953, "learning_rate": 1.267212401351925e-07, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.1584375500679016, "step": 6450, "valid_targets_mean": 3779.1, "valid_targets_min": 1421 }, { "epoch": 6.78046218487395, "grad_norm": 0.6882124626090157, "learning_rate": 1.2090164050625907e-07, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.1654224693775177, "step": 6455, "valid_targets_mean": 3330.2, "valid_targets_min": 1853 }, { "epoch": 6.785714285714286, "grad_norm": 0.7044440655396256, "learning_rate": 1.1521842634292013e-07, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.17785203456878662, "step": 6460, "valid_targets_mean": 3327.8, "valid_targets_min": 1410 }, { "epoch": 6.790966386554622, "grad_norm": 0.8200049965639139, "learning_rate": 1.0967163663627044e-07, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.18418024480342865, "step": 6465, "valid_targets_mean": 2920.6, "valid_targets_min": 1305 }, { "epoch": 6.796218487394958, "grad_norm": 0.7154441982579451, "learning_rate": 1.0426130944143353e-07, "loss": 0.1827, "loss_nan_ranks": 0, "loss_rank_avg": 0.1741981953382492, "step": 6470, "valid_targets_mean": 3539.7, "valid_targets_min": 996 }, { "epoch": 6.801470588235294, "grad_norm": 0.6654603332753054, "learning_rate": 9.898748187729513e-08, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.16577930748462677, "step": 6475, "valid_targets_mean": 3357.1, "valid_targets_min": 1349 }, { "epoch": 6.80672268907563, "grad_norm": 0.8172505155020807, "learning_rate": 9.385019012625007e-08, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.21172448992729187, "step": 6480, "valid_targets_mean": 3613.5, "valid_targets_min": 1248 }, { "epoch": 6.811974789915967, "grad_norm": 0.6891423541136645, "learning_rate": 8.884946943395811e-08, "loss": 0.1703, "loss_nan_ranks": 0, "loss_rank_avg": 0.14347678422927856, "step": 6485, "valid_targets_mean": 3327.4, "valid_targets_min": 1109 }, { "epoch": 6.817226890756302, "grad_norm": 0.7516599357315075, "learning_rate": 8.398535410910402e-08, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.18097805976867676, "step": 6490, "valid_targets_mean": 2790.8, "valid_targets_min": 1649 }, { "epoch": 6.822478991596639, "grad_norm": 0.7616811039107437, "learning_rate": 7.925787752314674e-08, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.18834054470062256, "step": 6495, "valid_targets_mean": 2811.8, "valid_targets_min": 1197 }, { "epoch": 6.8277310924369745, "grad_norm": 0.7317487761588832, "learning_rate": 7.466707211010838e-08, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.20096731185913086, "step": 6500, "valid_targets_mean": 3420.2, "valid_targets_min": 1720 }, { "epoch": 6.832983193277311, "grad_norm": 0.6976502515107287, "learning_rate": 7.02129693663478e-08, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.18510772287845612, "step": 6505, "valid_targets_mean": 3542.7, "valid_targets_min": 1054 }, { "epoch": 6.838235294117647, "grad_norm": 0.8023438462902227, "learning_rate": 6.589559985033189e-08, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.17661021649837494, "step": 6510, "valid_targets_mean": 3049.7, "valid_targets_min": 1643 }, { "epoch": 6.843487394957983, "grad_norm": 0.6905962109077173, "learning_rate": 6.171499318244234e-08, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.19038131833076477, "step": 6515, "valid_targets_mean": 3757.8, "valid_targets_min": 1135 }, { "epoch": 6.848739495798319, "grad_norm": 0.7819298312536493, "learning_rate": 5.767117804476696e-08, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.188393235206604, "step": 6520, "valid_targets_mean": 3715.1, "valid_targets_min": 1174 }, { "epoch": 6.8539915966386555, "grad_norm": 0.7603239023118682, "learning_rate": 5.376418218089541e-08, "loss": 0.1934, "loss_nan_ranks": 0, "loss_rank_avg": 0.20249368250370026, "step": 6525, "valid_targets_mean": 3321.9, "valid_targets_min": 992 }, { "epoch": 6.859243697478991, "grad_norm": 0.8027496504534014, "learning_rate": 4.99940323957393e-08, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.2095927596092224, "step": 6530, "valid_targets_mean": 3713.2, "valid_targets_min": 1133 }, { "epoch": 6.864495798319328, "grad_norm": 0.7827471840659329, "learning_rate": 4.63607545553435e-08, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.19427041709423065, "step": 6535, "valid_targets_mean": 2961.8, "valid_targets_min": 1195 }, { "epoch": 6.869747899159664, "grad_norm": 0.8495916082471087, "learning_rate": 4.2864373586706254e-08, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.20868608355522156, "step": 6540, "valid_targets_mean": 3012.6, "valid_targets_min": 484 }, { "epoch": 6.875, "grad_norm": 0.7058473937236638, "learning_rate": 3.950491347761487e-08, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.19130313396453857, "step": 6545, "valid_targets_mean": 3639.9, "valid_targets_min": 1434 }, { "epoch": 6.880252100840336, "grad_norm": 0.8058046651510254, "learning_rate": 3.628239727647254e-08, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.17615005373954773, "step": 6550, "valid_targets_mean": 4017.4, "valid_targets_min": 1349 }, { "epoch": 6.885504201680672, "grad_norm": 0.7986547158784268, "learning_rate": 3.319684709215176e-08, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.20986217260360718, "step": 6555, "valid_targets_mean": 3178.8, "valid_targets_min": 1434 }, { "epoch": 6.890756302521009, "grad_norm": 0.7069871681601839, "learning_rate": 3.024828409383007e-08, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.18144480884075165, "step": 6560, "valid_targets_mean": 3633.9, "valid_targets_min": 521 }, { "epoch": 6.8960084033613445, "grad_norm": 0.747775716498079, "learning_rate": 2.743672851085233e-08, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.19807741045951843, "step": 6565, "valid_targets_mean": 3981.0, "valid_targets_min": 1464 }, { "epoch": 6.901260504201681, "grad_norm": 1.0660860736808098, "learning_rate": 2.4762199632588634e-08, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.1948835551738739, "step": 6570, "valid_targets_mean": 2612.0, "valid_targets_min": 1239 }, { "epoch": 6.906512605042017, "grad_norm": 0.8171298625094956, "learning_rate": 2.2224715808309983e-08, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.18982771039009094, "step": 6575, "valid_targets_mean": 3489.8, "valid_targets_min": 1457 }, { "epoch": 6.911764705882353, "grad_norm": 0.7615110154926487, "learning_rate": 1.9824294447043923e-08, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.186547189950943, "step": 6580, "valid_targets_mean": 3059.1, "valid_targets_min": 1460 }, { "epoch": 6.917016806722689, "grad_norm": 0.7778984161564974, "learning_rate": 1.7560952017481313e-08, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.19061462581157684, "step": 6585, "valid_targets_mean": 3259.2, "valid_targets_min": 1084 }, { "epoch": 6.9222689075630255, "grad_norm": 0.7069596850632259, "learning_rate": 1.5434704047836424e-08, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.17042481899261475, "step": 6590, "valid_targets_mean": 3337.9, "valid_targets_min": 1035 }, { "epoch": 6.927521008403361, "grad_norm": 0.7072879579761938, "learning_rate": 1.344556512576256e-08, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.19188648462295532, "step": 6595, "valid_targets_mean": 4091.9, "valid_targets_min": 1876 }, { "epoch": 6.932773109243698, "grad_norm": 0.7505076999505291, "learning_rate": 1.1593548898236606e-08, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.1926942616701126, "step": 6600, "valid_targets_mean": 3705.8, "valid_targets_min": 1062 }, { "epoch": 6.938025210084033, "grad_norm": 0.831906921551297, "learning_rate": 9.878668071474639e-09, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.16769427061080933, "step": 6605, "valid_targets_mean": 3030.8, "valid_targets_min": 993 }, { "epoch": 6.94327731092437, "grad_norm": 0.7424388421322633, "learning_rate": 8.3009344108409e-09, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.17962056398391724, "step": 6610, "valid_targets_mean": 3366.9, "valid_targets_min": 873 }, { "epoch": 6.948529411764706, "grad_norm": 0.676120936221246, "learning_rate": 6.860358740763406e-09, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.17056873440742493, "step": 6615, "valid_targets_mean": 3651.0, "valid_targets_min": 1295 }, { "epoch": 6.953781512605042, "grad_norm": 0.7276545536651401, "learning_rate": 5.55695094467179e-09, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.19623544812202454, "step": 6620, "valid_targets_mean": 3583.6, "valid_targets_min": 1598 }, { "epoch": 6.959033613445378, "grad_norm": 0.7364736521570804, "learning_rate": 4.3907199649151355e-09, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.17404237389564514, "step": 6625, "valid_targets_mean": 2903.2, "valid_targets_min": 1123 }, { "epoch": 6.964285714285714, "grad_norm": 0.8283192384968932, "learning_rate": 3.361673802708687e-09, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.2022954821586609, "step": 6630, "valid_targets_mean": 3116.1, "valid_targets_min": 1621 }, { "epoch": 6.96953781512605, "grad_norm": 0.853057291277257, "learning_rate": 2.469819518080563e-09, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.19089040160179138, "step": 6635, "valid_targets_mean": 3081.4, "valid_targets_min": 1858 }, { "epoch": 6.974789915966387, "grad_norm": 0.6873113252451049, "learning_rate": 1.7151632298140209e-09, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.15922731161117554, "step": 6640, "valid_targets_mean": 3470.7, "valid_targets_min": 420 }, { "epoch": 6.980042016806722, "grad_norm": 0.754724576359931, "learning_rate": 1.0977101154163727e-09, "loss": 0.1916, "loss_nan_ranks": 0, "loss_rank_avg": 0.19214347004890442, "step": 6645, "valid_targets_mean": 3584.2, "valid_targets_min": 757 }, { "epoch": 6.985294117647059, "grad_norm": 0.8029047273305313, "learning_rate": 6.174644110767958e-10, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.17756588757038116, "step": 6650, "valid_targets_mean": 2940.8, "valid_targets_min": 732 }, { "epoch": 6.990546218487395, "grad_norm": 0.7749949104741897, "learning_rate": 2.744294116419077e-10, "loss": 0.1918, "loss_nan_ranks": 0, "loss_rank_avg": 0.18697890639305115, "step": 6655, "valid_targets_mean": 3248.2, "valid_targets_min": 929 }, { "epoch": 6.995798319327731, "grad_norm": 0.7329373554307617, "learning_rate": 6.860747058468064e-11, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.18864449858665466, "step": 6660, "valid_targets_mean": 3728.8, "valid_targets_min": 1217 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.2101745903491974, "step": 6664, "total_flos": 1189003618287616.0, "train_loss": 0.21699104300674413, "train_runtime": 24543.5183, "train_samples_per_second": 4.344, "train_steps_per_second": 0.272, "valid_targets_mean": 3715.1, "valid_targets_min": 791 } ], "logging_steps": 5, "max_steps": 6664, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1189003618287616.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }